On Wed, May 7, 2025 at 12:43 PM Lazar, Lijo <lijo.la...@amd.com> wrote:
>
> [AMD Official Use Only - AMD Internal Distribution Only]
>
>
> The flush reg is read/write. If the reads are not working on those platforms, 
> I think the writes may be dropped silently.

The problem only happens when we remap the register to the unused MMIO
space.  In that case, we end up with a PCI AER when reading the
remapped register.  Seems to happen on x86 platforms as well.  Writes
don't seem to be a problem.

Alex

>
> Thanks,
> Lijo
> ________________________________
> From: Alex Deucher <alexdeuc...@gmail.com>
> Sent: Wednesday, May 7, 2025 8:43:51 PM
> To: Deucher, Alexander <alexander.deuc...@amd.com>; Lazar, Lijo 
> <lijo.la...@amd.com>; Kuehling, Felix <felix.kuehl...@amd.com>; Koenig, 
> Christian <christian.koe...@amd.com>
> Cc: amd-gfx@lists.freedesktop.org <amd-gfx@lists.freedesktop.org>
> Subject: Re: [PATCH 1/7] Revert "drm/amdgpu: Use generic hdp flush function"
>
> Ping again on this series?
>
> Alex
>
> On Tue, May 6, 2025 at 11:17 AM Alex Deucher <alexdeuc...@gmail.com> wrote:
> >
> > Ping on this series?  This fixes a regression.
> >
> > Alex
> >
> > On Mon, May 5, 2025 at 9:05 AM Alex Deucher <alexander.deuc...@amd.com> 
> > wrote:
> > >
> > > This reverts commit 18a878fd8aef0ec21648a3782f55a79790cd4073.
> > >
> > > Revert this temporarily to make it easier to fix a regression
> > > in the HDP handling.
> > >
> > > Signed-off-by: Alex Deucher <alexander.deuc...@amd.com>
> > > ---
> > >  drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.c | 21 ---------------------
> > >  drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.h |  2 --
> > >  drivers/gpu/drm/amd/amdgpu/hdp_v4_0.c   | 13 ++++++++++++-
> > >  drivers/gpu/drm/amd/amdgpu/hdp_v5_0.c   | 13 ++++++++++++-
> > >  drivers/gpu/drm/amd/amdgpu/hdp_v6_0.c   | 13 ++++++++++++-
> > >  drivers/gpu/drm/amd/amdgpu/hdp_v7_0.c   | 13 ++++++++++++-
> > >  6 files changed, 48 insertions(+), 27 deletions(-)
> > >
> > > diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.c 
> > > b/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.c
> > > index 7fd8f09c28e66..b6cf801939aa5 100644
> > > --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.c
> > > +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.c
> > > @@ -22,7 +22,6 @@
> > >   */
> > >  #include "amdgpu.h"
> > >  #include "amdgpu_ras.h"
> > > -#include <uapi/linux/kfd_ioctl.h>
> > >
> > >  int amdgpu_hdp_ras_sw_init(struct amdgpu_device *adev)
> > >  {
> > > @@ -47,23 +46,3 @@ int amdgpu_hdp_ras_sw_init(struct amdgpu_device *adev)
> > >         /* hdp ras follows amdgpu_ras_block_late_init_default for late 
> > > init */
> > >         return 0;
> > >  }
> > > -
> > > -void amdgpu_hdp_generic_flush(struct amdgpu_device *adev,
> > > -                             struct amdgpu_ring *ring)
> > > -{
> > > -       if (!ring || !ring->funcs->emit_wreg) {
> > > -               WREG32((adev->rmmio_remap.reg_offset +
> > > -                       KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >>
> > > -                              2,
> > > -                      0);
> > > -               RREG32((adev->rmmio_remap.reg_offset +
> > > -                       KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >>
> > > -                      2);
> > > -       } else {
> > > -               amdgpu_ring_emit_wreg(ring,
> > > -                                     (adev->rmmio_remap.reg_offset +
> > > -                                      KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) 
> > > >>
> > > -                                             2,
> > > -                                     0);
> > > -       }
> > > -}
> > > \ No newline at end of file
> > > diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.h 
> > > b/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.h
> > > index 4cfd932b7e91e..7b8a6152dc8d9 100644
> > > --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.h
> > > +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_hdp.h
> > > @@ -44,6 +44,4 @@ struct amdgpu_hdp {
> > >  };
> > >
> > >  int amdgpu_hdp_ras_sw_init(struct amdgpu_device *adev);
> > > -void amdgpu_hdp_generic_flush(struct amdgpu_device *adev,
> > > -                             struct amdgpu_ring *ring);
> > >  #endif /* __AMDGPU_HDP_H__ */
> > > diff --git a/drivers/gpu/drm/amd/amdgpu/hdp_v4_0.c 
> > > b/drivers/gpu/drm/amd/amdgpu/hdp_v4_0.c
> > > index e6c0d86d34865..f1dc13b3ab38e 100644
> > > --- a/drivers/gpu/drm/amd/amdgpu/hdp_v4_0.c
> > > +++ b/drivers/gpu/drm/amd/amdgpu/hdp_v4_0.c
> > > @@ -36,6 +36,17 @@
> > >  #define HDP_MEM_POWER_CTRL__RC_MEM_POWER_LS_EN_MASK     0x00020000L
> > >  #define mmHDP_MEM_POWER_CTRL_BASE_IDX   0
> > >
> > > +static void hdp_v4_0_flush_hdp(struct amdgpu_device *adev,
> > > +                               struct amdgpu_ring *ring)
> > > +{
> > > +       if (!ring || !ring->funcs->emit_wreg) {
> > > +               WREG32((adev->rmmio_remap.reg_offset + 
> > > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > > +               RREG32((adev->rmmio_remap.reg_offset + 
> > > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2);
> > > +       } else {
> > > +               amdgpu_ring_emit_wreg(ring, (adev->rmmio_remap.reg_offset 
> > > + KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > > +       }
> > > +}
> > > +
> > >  static void hdp_v4_0_invalidate_hdp(struct amdgpu_device *adev,
> > >                                     struct amdgpu_ring *ring)
> > >  {
> > > @@ -169,7 +180,7 @@ struct amdgpu_hdp_ras hdp_v4_0_ras = {
> > >  };
> > >
> > >  const struct amdgpu_hdp_funcs hdp_v4_0_funcs = {
> > > -       .flush_hdp = amdgpu_hdp_generic_flush,
> > > +       .flush_hdp = hdp_v4_0_flush_hdp,
> > >         .invalidate_hdp = hdp_v4_0_invalidate_hdp,
> > >         .update_clock_gating = hdp_v4_0_update_clock_gating,
> > >         .get_clock_gating_state = hdp_v4_0_get_clockgating_state,
> > > diff --git a/drivers/gpu/drm/amd/amdgpu/hdp_v5_0.c 
> > > b/drivers/gpu/drm/amd/amdgpu/hdp_v5_0.c
> > > index 8bc001dc9f631..43195c0797480 100644
> > > --- a/drivers/gpu/drm/amd/amdgpu/hdp_v5_0.c
> > > +++ b/drivers/gpu/drm/amd/amdgpu/hdp_v5_0.c
> > > @@ -27,6 +27,17 @@
> > >  #include "hdp/hdp_5_0_0_sh_mask.h"
> > >  #include <uapi/linux/kfd_ioctl.h>
> > >
> > > +static void hdp_v5_0_flush_hdp(struct amdgpu_device *adev,
> > > +                               struct amdgpu_ring *ring)
> > > +{
> > > +       if (!ring || !ring->funcs->emit_wreg) {
> > > +               WREG32((adev->rmmio_remap.reg_offset + 
> > > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > > +               RREG32((adev->rmmio_remap.reg_offset + 
> > > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2);
> > > +       } else {
> > > +               amdgpu_ring_emit_wreg(ring, (adev->rmmio_remap.reg_offset 
> > > + KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > > +       }
> > > +}
> > > +
> > >  static void hdp_v5_0_invalidate_hdp(struct amdgpu_device *adev,
> > >                                     struct amdgpu_ring *ring)
> > >  {
> > > @@ -206,7 +217,7 @@ static void hdp_v5_0_init_registers(struct 
> > > amdgpu_device *adev)
> > >  }
> > >
> > >  const struct amdgpu_hdp_funcs hdp_v5_0_funcs = {
> > > -       .flush_hdp = amdgpu_hdp_generic_flush,
> > > +       .flush_hdp = hdp_v5_0_flush_hdp,
> > >         .invalidate_hdp = hdp_v5_0_invalidate_hdp,
> > >         .update_clock_gating = hdp_v5_0_update_clock_gating,
> > >         .get_clock_gating_state = hdp_v5_0_get_clockgating_state,
> > > diff --git a/drivers/gpu/drm/amd/amdgpu/hdp_v6_0.c 
> > > b/drivers/gpu/drm/amd/amdgpu/hdp_v6_0.c
> > > index ec20daf4272c5..a88d25a06c29b 100644
> > > --- a/drivers/gpu/drm/amd/amdgpu/hdp_v6_0.c
> > > +++ b/drivers/gpu/drm/amd/amdgpu/hdp_v6_0.c
> > > @@ -30,6 +30,17 @@
> > >  #define regHDP_CLK_CNTL_V6_1   0xd5
> > >  #define regHDP_CLK_CNTL_V6_1_BASE_IDX 0
> > >
> > > +static void hdp_v6_0_flush_hdp(struct amdgpu_device *adev,
> > > +                               struct amdgpu_ring *ring)
> > > +{
> > > +       if (!ring || !ring->funcs->emit_wreg) {
> > > +               WREG32((adev->rmmio_remap.reg_offset + 
> > > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > > +               RREG32((adev->rmmio_remap.reg_offset + 
> > > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2);
> > > +       } else {
> > > +               amdgpu_ring_emit_wreg(ring, (adev->rmmio_remap.reg_offset 
> > > + KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > > +       }
> > > +}
> > > +
> > >  static void hdp_v6_0_update_clock_gating(struct amdgpu_device *adev,
> > >                                          bool enable)
> > >  {
> > > @@ -138,7 +149,7 @@ static void hdp_v6_0_get_clockgating_state(struct 
> > > amdgpu_device *adev,
> > >  }
> > >
> > >  const struct amdgpu_hdp_funcs hdp_v6_0_funcs = {
> > > -       .flush_hdp = amdgpu_hdp_generic_flush,
> > > +       .flush_hdp = hdp_v6_0_flush_hdp,
> > >         .update_clock_gating = hdp_v6_0_update_clock_gating,
> > >         .get_clock_gating_state = hdp_v6_0_get_clockgating_state,
> > >  };
> > > diff --git a/drivers/gpu/drm/amd/amdgpu/hdp_v7_0.c 
> > > b/drivers/gpu/drm/amd/amdgpu/hdp_v7_0.c
> > > index ed1debc035073..49f7eb4fbd117 100644
> > > --- a/drivers/gpu/drm/amd/amdgpu/hdp_v7_0.c
> > > +++ b/drivers/gpu/drm/amd/amdgpu/hdp_v7_0.c
> > > @@ -27,6 +27,17 @@
> > >  #include "hdp/hdp_7_0_0_sh_mask.h"
> > >  #include <uapi/linux/kfd_ioctl.h>
> > >
> > > +static void hdp_v7_0_flush_hdp(struct amdgpu_device *adev,
> > > +                               struct amdgpu_ring *ring)
> > > +{
> > > +       if (!ring || !ring->funcs->emit_wreg) {
> > > +               WREG32((adev->rmmio_remap.reg_offset + 
> > > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > > +               RREG32((adev->rmmio_remap.reg_offset + 
> > > KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2);
> > > +       } else {
> > > +               amdgpu_ring_emit_wreg(ring, (adev->rmmio_remap.reg_offset 
> > > + KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0);
> > > +       }
> > > +}
> > > +
> > >  static void hdp_v7_0_update_clock_gating(struct amdgpu_device *adev,
> > >                                          bool enable)
> > >  {
> > > @@ -126,7 +137,7 @@ static void hdp_v7_0_get_clockgating_state(struct 
> > > amdgpu_device *adev,
> > >  }
> > >
> > >  const struct amdgpu_hdp_funcs hdp_v7_0_funcs = {
> > > -       .flush_hdp = amdgpu_hdp_generic_flush,
> > > +       .flush_hdp = hdp_v7_0_flush_hdp,
> > >         .update_clock_gating = hdp_v7_0_update_clock_gating,
> > >         .get_clock_gating_state = hdp_v7_0_get_clockgating_state,
> > >  };
> > > --
> > > 2.49.0
> > >

Reply via email to