[AMD Official Use Only - AMD Internal Distribution Only]

The flush reg is read/write. If the reads are not working on those platforms, I 
think the writes may be dropped silently.

Thanks,
Lijo
________________________________
From: Alex Deucher <alexdeuc...@gmail.com>
Sent: Wednesday, May 7, 2025 8:43:51 PM
To: Deucher, Alexander <alexander.deuc...@amd.com>; Lazar, Lijo 
<lijo.la...@amd.com>; Kuehling, Felix <felix.kuehl...@amd.com>; Koenig, 
Christian <christian.koe...@amd.com>
Cc: amd-gfx@lists.freedesktop.org <amd-gfx@lists.freedesktop.org>
Subject: Re: [PATCH 1/7] Revert "drm/amdgpu: Use generic hdp flush function"

Ping again on this series?

Alex

On Tue, May 6, 2025 at 11:17 AM Alex Deucher <alexdeuc...@gmail.com> wrote:
>
> Ping on this series?  This fixes a regression.
>
> Alex
>
> On Mon, May 5, 2025 at 9:05 AM Alex Deucher <alexander.deuc...@amd.com> wrote:
> >
> > This reverts commit 18a878fd8aef0ec21648a3782f55a79790cd4073.
> >
> > Revert this temporarily to make it easier to fix a regression
> > in the HDP handling.
> >
> > Signed-off-by: Alex Deucher <alexander.deuc...@amd.com>
> > ---
> >  drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.c | 21 ---------------------
> >  drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.h |  2 --
> >  drivers/gpu/drm/amd/amdgpu/hdp_v4_0.c   | 13 ++++++++++++-
> >  drivers/gpu/drm/amd/amdgpu/hdp_v5_0.c   | 13 ++++++++++++-
> >  drivers/gpu/drm/amd/amdgpu/hdp_v6_0.c   | 13 ++++++++++++-
> >  drivers/gpu/drm/amd/amdgpu/hdp_v7_0.c   | 13 ++++++++++++-
> >  6 files changed, 48 insertions(+), 27 deletions(-)
> >
> > diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.c 
> > b/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.c
> > index 7fd8f09c28e66..b6cf801939aa5 100644
> > --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.c
> > +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.c
> > @@ -22,7 +22,6 @@
> >   */
> >  #include "amdgpu.h"
> >  #include "amdgpu_ras.h"
> > -#include <uapi/linux/kfd_ioctl.h>
> >
> >  int amdgpu_hdp_ras_sw_init(struct amdgpu_device *adev)
> >  {
> > @@ -47,23 +46,3 @@ int amdgpu_hdp_ras_sw_init(struct amdgpu_device *adev)
> >         /* hdp ras follows amdgpu_ras_block_late_init_default for late init 
> > */
> >         return 0;
> >  }
> > -
> > -void amdgpu_hdp_generic_flush(struct amdgpu_device *adev,
> > -                             struct amdgpu_ring *ring)
> > -{
> > -       if (!ring || !ring->funcs->emit_wreg) {
> > -               WREG32((adev->rmmio_remap.reg_offset +
> > -                       KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >>
> > -                              2,
> > -                      0);
> > -               RREG32((adev->rmmio_remap.reg_offset +
> > -                       KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >>
> > -                      2);
> > -       } else {
> > -               amdgpu_ring_emit_wreg(ring,
> > -                                     (adev->rmmio_remap.reg_offset +
> > -                                      KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >>
> > -                                             2,
> > -                                     0);
> > -       }
> > -}
> > \ No newline at end of file
> > diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.h 
> > b/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.h
> > index 4cfd932b7e91e..7b8a6152dc8d9 100644
> > --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.h
> > +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.h
> > @@ -44,6 +44,4 @@ struct amdgpu_hdp {
> >  };
> >
> >  int amdgpu_hdp_ras_sw_init(struct amdgpu_device *adev);
> > -void amdgpu_hdp_generic_flush(struct amdgpu_device *adev,
> > -                             struct amdgpu_ring *ring);
> >  #endif /* __AMDGPU_HDP_H__ */
> > diff --git a/drivers/gpu/drm/amd/amdgpu/hdp_v4_0.c 
> > b/drivers/gpu/drm/amd/amdgpu/hdp_v4_0.c
> > index e6c0d86d34865..f1dc13b3ab38e 100644
> > --- a/drivers/gpu/drm/amd/amdgpu/hdp_v4_0.c
> > +++ b/drivers/gpu/drm/amd/amdgpu/hdp_v4_0.c
> > @@ -36,6 +36,17 @@
> >  #define HDP_MEM_POWER_CTRL__RC_MEM_POWER_LS_EN_MASK     0x00020000L
> >  #define mmHDP_MEM_POWER_CTRL_BASE_IDX   0
> >
> > +static void hdp_v4_0_flush_hdp(struct amdgpu_device *adev,
> > +                               struct amdgpu_ring *ring)
> > +{
> > +       if (!ring || !ring->funcs->emit_wreg) {
> > +               WREG32((adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > +               RREG32((adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2);
> > +       } else {
> > +               amdgpu_ring_emit_wreg(ring, (adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > +       }
> > +}
> > +
> >  static void hdp_v4_0_invalidate_hdp(struct amdgpu_device *adev,
> >                                     struct amdgpu_ring *ring)
> >  {
> > @@ -169,7 +180,7 @@ struct amdgpu_hdp_ras hdp_v4_0_ras = {
> >  };
> >
> >  const struct amdgpu_hdp_funcs hdp_v4_0_funcs = {
> > -       .flush_hdp = amdgpu_hdp_generic_flush,
> > +       .flush_hdp = hdp_v4_0_flush_hdp,
> >         .invalidate_hdp = hdp_v4_0_invalidate_hdp,
> >         .update_clock_gating = hdp_v4_0_update_clock_gating,
> >         .get_clock_gating_state = hdp_v4_0_get_clockgating_state,
> > diff --git a/drivers/gpu/drm/amd/amdgpu/hdp_v5_0.c 
> > b/drivers/gpu/drm/amd/amdgpu/hdp_v5_0.c
> > index 8bc001dc9f631..43195c0797480 100644
> > --- a/drivers/gpu/drm/amd/amdgpu/hdp_v5_0.c
> > +++ b/drivers/gpu/drm/amd/amdgpu/hdp_v5_0.c
> > @@ -27,6 +27,17 @@
> >  #include "hdp/hdp_5_0_0_sh_mask.h"
> >  #include <uapi/linux/kfd_ioctl.h>
> >
> > +static void hdp_v5_0_flush_hdp(struct amdgpu_device *adev,
> > +                               struct amdgpu_ring *ring)
> > +{
> > +       if (!ring || !ring->funcs->emit_wreg) {
> > +               WREG32((adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > +               RREG32((adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2);
> > +       } else {
> > +               amdgpu_ring_emit_wreg(ring, (adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > +       }
> > +}
> > +
> >  static void hdp_v5_0_invalidate_hdp(struct amdgpu_device *adev,
> >                                     struct amdgpu_ring *ring)
> >  {
> > @@ -206,7 +217,7 @@ static void hdp_v5_0_init_registers(struct 
> > amdgpu_device *adev)
> >  }
> >
> >  const struct amdgpu_hdp_funcs hdp_v5_0_funcs = {
> > -       .flush_hdp = amdgpu_hdp_generic_flush,
> > +       .flush_hdp = hdp_v5_0_flush_hdp,
> >         .invalidate_hdp = hdp_v5_0_invalidate_hdp,
> >         .update_clock_gating = hdp_v5_0_update_clock_gating,
> >         .get_clock_gating_state = hdp_v5_0_get_clockgating_state,
> > diff --git a/drivers/gpu/drm/amd/amdgpu/hdp_v6_0.c 
> > b/drivers/gpu/drm/amd/amdgpu/hdp_v6_0.c
> > index ec20daf4272c5..a88d25a06c29b 100644
> > --- a/drivers/gpu/drm/amd/amdgpu/hdp_v6_0.c
> > +++ b/drivers/gpu/drm/amd/amdgpu/hdp_v6_0.c
> > @@ -30,6 +30,17 @@
> >  #define regHDP_CLK_CNTL_V6_1   0xd5
> >  #define regHDP_CLK_CNTL_V6_1_BASE_IDX 0
> >
> > +static void hdp_v6_0_flush_hdp(struct amdgpu_device *adev,
> > +                               struct amdgpu_ring *ring)
> > +{
> > +       if (!ring || !ring->funcs->emit_wreg) {
> > +               WREG32((adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > +               RREG32((adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2);
> > +       } else {
> > +               amdgpu_ring_emit_wreg(ring, (adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > +       }
> > +}
> > +
> >  static void hdp_v6_0_update_clock_gating(struct amdgpu_device *adev,
> >                                          bool enable)
> >  {
> > @@ -138,7 +149,7 @@ static void hdp_v6_0_get_clockgating_state(struct 
> > amdgpu_device *adev,
> >  }
> >
> >  const struct amdgpu_hdp_funcs hdp_v6_0_funcs = {
> > -       .flush_hdp = amdgpu_hdp_generic_flush,
> > +       .flush_hdp = hdp_v6_0_flush_hdp,
> >         .update_clock_gating = hdp_v6_0_update_clock_gating,
> >         .get_clock_gating_state = hdp_v6_0_get_clockgating_state,
> >  };
> > diff --git a/drivers/gpu/drm/amd/amdgpu/hdp_v7_0.c 
> > b/drivers/gpu/drm/amd/amdgpu/hdp_v7_0.c
> > index ed1debc035073..49f7eb4fbd117 100644
> > --- a/drivers/gpu/drm/amd/amdgpu/hdp_v7_0.c
> > +++ b/drivers/gpu/drm/amd/amdgpu/hdp_v7_0.c
> > @@ -27,6 +27,17 @@
> >  #include "hdp/hdp_7_0_0_sh_mask.h"
> >  #include <uapi/linux/kfd_ioctl.h>
> >
> > +static void hdp_v7_0_flush_hdp(struct amdgpu_device *adev,
> > +                               struct amdgpu_ring *ring)
> > +{
> > +       if (!ring || !ring->funcs->emit_wreg) {
> > +               WREG32((adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > +               RREG32((adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2);
> > +       } else {
> > +               amdgpu_ring_emit_wreg(ring, (adev->rmmio_remap.reg_offset + 
> > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > +       }
> > +}
> > +
> >  static void hdp_v7_0_update_clock_gating(struct amdgpu_device *adev,
> >                                          bool enable)
> >  {
> > @@ -126,7 +137,7 @@ static void hdp_v7_0_get_clockgating_state(struct 
> > amdgpu_device *adev,
> >  }
> >
> >  const struct amdgpu_hdp_funcs hdp_v7_0_funcs = {
> > -       .flush_hdp = amdgpu_hdp_generic_flush,
> > +       .flush_hdp = hdp_v7_0_flush_hdp,
> >         .update_clock_gating = hdp_v7_0_update_clock_gating,
> >         .get_clock_gating_state = hdp_v7_0_get_clockgating_state,
> >  };
> > --
> > 2.49.0
> >

Reply via email to