> -----Original Message-----
> From: Jani Nikula <jani.nik...@linux.intel.com>
> Sent: Monday, May 19, 2025 6:22 PM
> To: Garg, Nemesa <nemesa.g...@intel.com>; intel-...@lists.freedesktop.org;
> intel...@lists.freedesktop.org; dri-devel@lists.freedesktop.org
> Cc: Garg, Nemesa <nemesa.g...@intel.com>; Nautiyal, Ankit K
> <ankit.k.nauti...@intel.com>
> Subject: Re: [PATCH 05/10] drm/i915/display: Compute the scaler coefficients
> 
> On Mon, 19 May 2025, Nemesa Garg <nemesa.g...@intel.com> wrote:
> > The sharpness property requires the use of one of the scaler so need
> > to set the sharpness scaler coefficient values.
> > These values are based on experiments and vary for different tap
> > value/win size. These values are normalized by taking the sum of all
> > values and then dividing each value with a sum.
> >
> > v2: Fix ifndef header naming issue reported by kernel test robot
> > v3: Rename file name[Arun]
> >     Replace array size number with macro[Arun]
> > v4: Correct the register format[Jani]
> >     Add brief comment and expalin about file[Jani]
> >     Remove coefficient value from crtc_state[Jani]
> > v5: Fix build issue
> > v6: Add new function for writing coefficients[Ankit]
> > v7: Add cooments and add a scaler id check [Ankit]
> > v8: Remove casf_enable from here[Ankit]
> >
> > Signed-off-by: Nemesa Garg <nemesa.g...@intel.com>
> > Reviewed-by: Ankit Nautiyal <ankit.k.nauti...@intel.com>
> > ---
> >  drivers/gpu/drm/i915/display/intel_casf.c     | 120 ++++++++++++++++++
> >  drivers/gpu/drm/i915/display/intel_casf.h     |   1 +
> >  .../gpu/drm/i915/display/intel_casf_regs.h    |   7 +
> >  .../drm/i915/display/intel_display_types.h    |   8 ++
> >  4 files changed, 136 insertions(+)
> >
> > diff --git a/drivers/gpu/drm/i915/display/intel_casf.c
> > b/drivers/gpu/drm/i915/display/intel_casf.c
> > index 6dab67eb77ab..f5ae5e1efbd5 100644
> > --- a/drivers/gpu/drm/i915/display/intel_casf.c
> > +++ b/drivers/gpu/drm/i915/display/intel_casf.c
> > @@ -15,6 +15,13 @@
> >  #define MAX_PIXELS_FOR_3_TAP_FILTER (1920 * 1080)  #define
> > MAX_PIXELS_FOR_5_TAP_FILTER (3840 * 2160)
> >
> > +#define FILTER_COEFF_0_125 125
> > +#define FILTER_COEFF_0_25 250
> > +#define FILTER_COEFF_0_5 500
> > +#define FILTER_COEFF_1_0 1000
> > +#define FILTER_COEFF_0_0 0
> > +#define SET_POSITIVE_SIGN(x) ((x) & (~SIGN))
> > +
> >  /**
> >   * DOC: Content Adaptive Sharpness Filter (CASF)
> >   *
> > @@ -38,6 +45,24 @@ static const u16 sharpness_lut[] = {
> >     73, 60, 48, 36, 24, 12, 0
> >  };
> >
> > +const u16 filtercoeff_1[] = {
> > +   FILTER_COEFF_0_0, FILTER_COEFF_0_0, FILTER_COEFF_0_5,
> > +   FILTER_COEFF_1_0, FILTER_COEFF_0_5, FILTER_COEFF_0_0,
> > +   FILTER_COEFF_0_0,
> > +};
> > +
> > +const u16 filtercoeff_2[] = {
> > +   FILTER_COEFF_0_0, FILTER_COEFF_0_25, FILTER_COEFF_0_5,
> > +   FILTER_COEFF_1_0, FILTER_COEFF_0_5, FILTER_COEFF_0_25,
> > +   FILTER_COEFF_0_0,
> > +};
> > +
> > +const u16 filtercoeff_3[] = {
> > +   FILTER_COEFF_0_125, FILTER_COEFF_0_25, FILTER_COEFF_0_5,
> > +   FILTER_COEFF_1_0, FILTER_COEFF_0_5, FILTER_COEFF_0_25,
> > +   FILTER_COEFF_0_125,
> > +};
> > +
> >  void intel_filter_lut_load(struct intel_crtc *crtc,
> >                        const struct intel_crtc_state *crtc_state)  { @@ -
> 107,6 +132,8
> > @@ int intel_casf_compute_config(struct intel_crtc_state *crtc_state)
> >
> >     intel_casf_compute_win_size(crtc_state);
> >
> > +   intel_casf_scaler_compute_config(crtc_state);
> > +
> >     return 0;
> >  }
> >
> > @@ -129,3 +156,96 @@ void intel_casf_sharpness_get_config(struct
> intel_crtc_state *crtc_state)
> >                     REG_FIELD_GET(FILTER_SIZE_MASK, sharp);
> >     }
> >  }
> > +
> > +static int casf_coeff_tap(int i)
> > +{
> > +   return i % SCALER_FILTER_NUM_TAPS;
> > +}
> > +
> > +static u16 casf_coeff(struct intel_crtc_state *crtc_state, int t)
> 
> The result is stuff that gets shoved into registers. u32 would be in order.
> 
> > +{
> > +   struct scaler_filter_coeff value;
> > +   u16 coeff;
> > +
> > +   value = crtc_state->hw.casf_params.coeff[t];
> > +   coeff = SET_POSITIVE_SIGN(0) | EXPONENT(value.exp) |
> > +MANTISSA(value.mantissa);
> 
> Those macros return u32 values. coeff should be u32 too.
> 
> > +   return coeff;
> > +}
> > +
> > +/*
> > + * 17 phase of 7 taps requires 119 coefficients in 60 dwords per set.
> > + * To enable casf:  program scaler coefficients with the coeffients
> > + * that are calculated and stored in hw.casf_params.coeff as per
> > + * SCALER_COEFFICIENT_FORMAT
> > + */
> > +static void intel_casf_write_coeff(struct intel_crtc_state
> > +*crtc_state) {
> > +   struct intel_display *display = to_intel_display(crtc_state);
> > +   struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
> > +   int id = crtc_state->scaler_state.scaler_id;
> > +   int i;
> > +
> > +   if (id != 1) {
> > +           drm_WARN(display->drm, 0, "Second scaler not enabled\n");
> > +           return;
> > +   }
> > +
> > +   intel_de_write_fw(display, GLK_PS_COEF_INDEX_SET(crtc->pipe, id,
> 0),
> > +                     PS_COEF_INDEX_AUTO_INC);
> > +
> > +   for (i = 0; i < 17 * SCALER_FILTER_NUM_TAPS; i += 2) {
> > +           u32 tmp;
> > +           int t;
> > +
> > +           t = casf_coeff_tap(i);
> > +           tmp = casf_coeff(crtc_state, t);
> > +
> > +           t = casf_coeff_tap(i + 1);
> > +           tmp |= casf_coeff(crtc_state, t) << 16;
> > +
> > +           intel_de_write_fw(display, GLK_PS_COEF_DATA_SET(crtc-
> >pipe, id, 0),
> > +                             tmp);
> > +   }
> > +}
> > +
> > +static void convert_sharpness_coef_binary(struct scaler_filter_coeff 
> > *coeff,
> > +                                     u16 coefficient)
> > +{
> > +   if (coefficient < 25) {
> > +           coeff->mantissa = (coefficient * 2048) / 100;
> > +           coeff->exp = 3;
> > +   } else if (coefficient < 50) {
> > +           coeff->mantissa = (coefficient * 1024) / 100;
> > +           coeff->exp = 2;
> > +   } else if (coefficient < 100) {
> > +           coeff->mantissa = (coefficient * 512) / 100;
> > +           coeff->exp = 1;
> > +   } else {
> > +           coeff->mantissa = (coefficient * 256) / 100;
> > +           coeff->exp = 0;
> > +   }
> > +}
> > +
> > +void intel_casf_scaler_compute_config(struct intel_crtc_state
> > +*crtc_state) {
> > +   const u16 *filtercoeff;
> > +   u16 filter_coeff[SCALER_FILTER_NUM_TAPS];
> > +   u16 sumcoeff = 0;
> > +   u8 i;
> 
> It's used for looping. It's an int.
Ack
> 
> > +
> > +   if (crtc_state->hw.casf_params.win_size == 0)
> > +           filtercoeff = filtercoeff_1;
> > +   else if (crtc_state->hw.casf_params.win_size == 1)
> > +           filtercoeff = filtercoeff_2;
> > +   else
> > +           filtercoeff = filtercoeff_3;
> > +
> > +   for (i = 0; i < SCALER_FILTER_NUM_TAPS; i++)
> > +           sumcoeff += *(filtercoeff + i);
> > +
> > +   for (i = 0; i < SCALER_FILTER_NUM_TAPS; i++) {
> > +           filter_coeff[i] = (*(filtercoeff + i) * 100 / sumcoeff);
> > +           convert_sharpness_coef_binary(&crtc_state-
> >hw.casf_params.coeff[i],
> > +                                         filter_coeff[i]);
> 
> Are you should u16 is the right type to use here?
Here I am using 16 bit value and further combining 2 16-bit values to form 32 
bit value.
> 
> > +   }
> > +}
> > diff --git a/drivers/gpu/drm/i915/display/intel_casf.h
> > b/drivers/gpu/drm/i915/display/intel_casf.h
> > index 80642809c08b..381d5e10c70d 100644
> > --- a/drivers/gpu/drm/i915/display/intel_casf.h
> > +++ b/drivers/gpu/drm/i915/display/intel_casf.h
> > @@ -16,5 +16,6 @@ void intel_casf_update_strength(struct
> > intel_crtc_state *new_crtc_state);  void
> > intel_casf_sharpness_get_config(struct intel_crtc_state *crtc_state);  void
> intel_filter_lut_load(struct intel_crtc *crtc,
> >                        const struct intel_crtc_state *crtc_state);
> > +void intel_casf_scaler_compute_config(struct intel_crtc_state
> > +*crtc_state);
> >
> >  #endif /* __INTEL_CASF_H__ */
> > diff --git a/drivers/gpu/drm/i915/display/intel_casf_regs.h
> > b/drivers/gpu/drm/i915/display/intel_casf_regs.h
> > index b96950a48335..f8c3c86f2949 100644
> > --- a/drivers/gpu/drm/i915/display/intel_casf_regs.h
> > +++ b/drivers/gpu/drm/i915/display/intel_casf_regs.h
> > @@ -30,4 +30,11 @@
> >  #define   INDEX_VALUE_MASK             REG_GENMASK(4, 0)
> >  #define   INDEX_VALUE(x)               REG_FIELD_PREP(INDEX_VALUE_MASK,
> (x))
> >
> > +/* Scaler Coefficient structure */
> > +#define SIGN                           REG_BIT(15)
> > +#define EXPONENT_MASK                  REG_GENMASK(13, 12)
> > +#define EXPONENT(x)                    REG_FIELD_PREP(EXPONENT_MASK, (x))
> > +#define MANTISSA_MASK                  REG_GENMASK(11, 3)
> > +#define MANTISSA(x)                    REG_FIELD_PREP(MANTISSA_MASK, (x))
> 
> I think the macro names are way too generic, and likely to conflict with other
> headers, in the future if not now.
Will change.
> 
> Please define these as part of the register as described by the big comment at
> the top of i915_reg.h. Please do not add comments or vertical space in
> between. Please indent them. These need to be attached to the register they
> describe.
> 
> > +
> >  #endif /* __INTEL_CASF_REGS__ */
> > diff --git a/drivers/gpu/drm/i915/display/intel_display_types.h
> > b/drivers/gpu/drm/i915/display/intel_display_types.h
> > index 3a2e2bdfd356..3de4738f4080 100644
> > --- a/drivers/gpu/drm/i915/display/intel_display_types.h
> > +++ b/drivers/gpu/drm/i915/display/intel_display_types.h
> > @@ -935,7 +935,15 @@ struct intel_csc_matrix {
> >     u16 postoff[3];
> >  };
> >
> > +struct scaler_filter_coeff {
> > +   u16 sign;
> > +   u16 exp;
> > +   u16 mantissa;
> > +};
> > +
> >  struct intel_casf {
> > +#define SCALER_FILTER_NUM_TAPS 7
> > +   struct scaler_filter_coeff coeff[SCALER_FILTER_NUM_TAPS];
> >     u8 strength;
> >     u8 win_size;
> >     bool casf_enable;
> 
> --
> Jani Nikula, Intel

Reply via email to