cmd_buffer: Use the new emit macro for compute shader dispatch

Jason Ekstrand Mon, 18 Apr 2016 19:37:35 -0700

On Mon, Apr 18, 2016 at 5:30 PM, Ian Romanick <i...@freedesktop.org> wrote:


> On 04/18/2016 05:10 PM, Jason Ekstrand wrote:
> > ---
> >  src/intel/vulkan/genX_cmd_buffer.c | 116
> ++++++++++++++++++++-----------------
> >  1 file changed, 64 insertions(+), 52 deletions(-)
> >
> > diff --git a/src/intel/vulkan/genX_cmd_buffer.c
> b/src/intel/vulkan/genX_cmd_buffer.c
> > index 45b009b..4a75825 100644
> > --- a/src/intel/vulkan/genX_cmd_buffer.c
> > +++ b/src/intel/vulkan/genX_cmd_buffer.c
> > @@ -572,17 +572,19 @@ static void
> >  emit_lrm(struct anv_batch *batch,
> >           uint32_t reg, struct anv_bo *bo, uint32_t offset)
> >  {
> > -   anv_batch_emit(batch, GENX(MI_LOAD_REGISTER_MEM),
> > -                  .RegisterAddress = reg,
> > -                  .MemoryAddress = { bo, offset });
> > +   anv_batch_emit_blk(batch, GENX(MI_LOAD_REGISTER_MEM), lrm) {
> > +      lrm.RegisterAddress  = reg;
> > +      lrm.MemoryAddress    = (struct anv_address) { bo, offset };
> > +   }
> >  }
> >
> >  static void
> >  emit_lri(struct anv_batch *batch, uint32_t reg, uint32_t imm)
>
> In patch 8 the Gen8 emit_lri helper is removed, but this one stays.  It
> seems like either both should go or both should stay.  I also thought it
> was odd that the Gen8 emit_lri was a #define while this is a function.
> Perhaps there's something else happening here that I don't see.
>

Right.  I wanted to just move it out of genX to some place shared and use
it in gen7 and gen8.  Unfortunately, I'm not sure exactly where to do
that.  The reason I kept the genX one is because it's used some 8 times
while the gen7 and gen8 versions are used once or twice and they didn't
seem worth keeping.


> >  {
> > -   anv_batch_emit(batch, GENX(MI_LOAD_REGISTER_IMM),
> > -                  .RegisterOffset = reg,
> > -                  .DataDWord = imm);
> > +   anv_batch_emit_blk(batch, GENX(MI_LOAD_REGISTER_IMM), lri) {
> > +      lri.RegisterOffset   = reg;
> > +      lri.DataDWord        = imm;
> > +   }
> >  }
> >
> >  void genX(CmdDrawIndirect)(
> > @@ -695,18 +697,19 @@ void genX(CmdDispatch)(
> >
> >     genX(cmd_buffer_flush_compute_state)(cmd_buffer);
> >
> > -   anv_batch_emit(&cmd_buffer->batch, GENX(GPGPU_WALKER),
> > -                  .SIMDSize = prog_data->simd_size / 16,
> > -                  .ThreadDepthCounterMaximum = 0,
> > -                  .ThreadHeightCounterMaximum = 0,
> > -                  .ThreadWidthCounterMaximum =
> pipeline->cs_thread_width_max - 1,
> > -                  .ThreadGroupIDXDimension = x,
> > -                  .ThreadGroupIDYDimension = y,
> > -                  .ThreadGroupIDZDimension = z,
> > -                  .RightExecutionMask = pipeline->cs_right_mask,
> > -                  .BottomExecutionMask = 0xffffffff);
> > -
> > -   anv_batch_emit(&cmd_buffer->batch, GENX(MEDIA_STATE_FLUSH));
> > +   anv_batch_emit_blk(&cmd_buffer->batch, GENX(GPGPU_WALKER), ggw) {
> > +      ggw.SIMDSize                     = prog_data->simd_size / 16;
> > +      ggw.ThreadDepthCounterMaximum    = 0;
> > +      ggw.ThreadHeightCounterMaximum   = 0;
> > +      ggw.ThreadWidthCounterMaximum    = pipeline->cs_thread_width_max
> - 1;
> > +      ggw.ThreadGroupIDXDimension      = x;
> > +      ggw.ThreadGroupIDYDimension      = y;
> > +      ggw.ThreadGroupIDZDimension      = z;
> > +      ggw.RightExecutionMask           = pipeline->cs_right_mask;
> > +      ggw.BottomExecutionMask          = 0xffffffff;
> > +   }
> > +
> > +   anv_batch_emit_blk(&cmd_buffer->batch, GENX(MEDIA_STATE_FLUSH), msf);
> >  }
> >
> >  #define GPGPU_DISPATCHDIMX 0x2500
> > @@ -758,48 +761,53 @@ void genX(CmdDispatchIndirect)(
> >     emit_lrm(batch, MI_PREDICATE_SRC0, bo, bo_offset + 0);
> >
> >     /* predicate = (compute_dispatch_indirect_x_size == 0); */
> > -   anv_batch_emit(batch, GENX(MI_PREDICATE),
> > -                  .LoadOperation = LOAD_LOAD,
> > -                  .CombineOperation = COMBINE_SET,
> > -                  .CompareOperation = COMPARE_SRCS_EQUAL);
> > +   anv_batch_emit_blk(batch, GENX(MI_PREDICATE), mip) {
> > +      mip.LoadOperation    = LOAD_LOAD;
> > +      mip.CombineOperation = COMBINE_SET;
> > +      mip.CompareOperation = COMPARE_SRCS_EQUAL;
> > +   }
> >
> >     /* Load compute_dispatch_indirect_y_size into SRC0 */
> >     emit_lrm(batch, MI_PREDICATE_SRC0, bo, bo_offset + 4);
> >
> >     /* predicate |= (compute_dispatch_indirect_y_size == 0); */
> > -   anv_batch_emit(batch, GENX(MI_PREDICATE),
> > -                  .LoadOperation = LOAD_LOAD,
> > -                  .CombineOperation = COMBINE_OR,
> > -                  .CompareOperation = COMPARE_SRCS_EQUAL);
> > +   anv_batch_emit_blk(batch, GENX(MI_PREDICATE), mip) {
> > +      mip.LoadOperation    = LOAD_LOAD;
> > +      mip.CombineOperation = COMBINE_OR;
> > +      mip.CompareOperation = COMPARE_SRCS_EQUAL;
> > +   }
> >
> >     /* Load compute_dispatch_indirect_z_size into SRC0 */
> >     emit_lrm(batch, MI_PREDICATE_SRC0, bo, bo_offset + 8);
> >
> >     /* predicate |= (compute_dispatch_indirect_z_size == 0); */
> > -   anv_batch_emit(batch, GENX(MI_PREDICATE),
> > -                  .LoadOperation = LOAD_LOAD,
> > -                  .CombineOperation = COMBINE_OR,
> > -                  .CompareOperation = COMPARE_SRCS_EQUAL);
> > +   anv_batch_emit_blk(batch, GENX(MI_PREDICATE), mip) {
> > +      mip.LoadOperation    = LOAD_LOAD;
> > +      mip.CombineOperation = COMBINE_OR;
> > +      mip.CompareOperation = COMPARE_SRCS_EQUAL;
> > +   }
> >
> >     /* predicate = !predicate; */
> >  #define COMPARE_FALSE                           1
> > -   anv_batch_emit(batch, GENX(MI_PREDICATE),
> > -                  .LoadOperation = LOAD_LOADINV,
> > -                  .CombineOperation = COMBINE_OR,
> > -                  .CompareOperation = COMPARE_FALSE);
> > +   anv_batch_emit_blk(batch, GENX(MI_PREDICATE), mip) {
> > +      mip.LoadOperation    = LOAD_LOADINV;
> > +      mip.CombineOperation = COMBINE_OR;
> > +      mip.CompareOperation = COMPARE_FALSE;
> > +   }
> >  #endif
> >
> > -   anv_batch_emit(batch, GENX(GPGPU_WALKER),
> > -                  .IndirectParameterEnable = true,
> > -                  .PredicateEnable = GEN_GEN <= 7,
> > -                  .SIMDSize = prog_data->simd_size / 16,
> > -                  .ThreadDepthCounterMaximum = 0,
> > -                  .ThreadHeightCounterMaximum = 0,
> > -                  .ThreadWidthCounterMaximum =
> pipeline->cs_thread_width_max - 1,
> > -                  .RightExecutionMask = pipeline->cs_right_mask,
> > -                  .BottomExecutionMask = 0xffffffff);
> > -
> > -   anv_batch_emit(batch, GENX(MEDIA_STATE_FLUSH));
> > +   anv_batch_emit_blk(batch, GENX(GPGPU_WALKER), ggw) {
> > +      ggw.IndirectParameterEnable      = true;
> > +      ggw.PredicateEnable              = GEN_GEN <= 7;
> > +      ggw.SIMDSize                     = prog_data->simd_size / 16;
> > +      ggw.ThreadDepthCounterMaximum    = 0;
> > +      ggw.ThreadHeightCounterMaximum   = 0;
> > +      ggw.ThreadWidthCounterMaximum    = pipeline->cs_thread_width_max
> - 1;
> > +      ggw.RightExecutionMask           = pipeline->cs_right_mask;
> > +      ggw.BottomExecutionMask          = 0xffffffff;
> > +   }
> > +
> > +   anv_batch_emit_blk(batch, GENX(MEDIA_STATE_FLUSH), msf);
> >  }
> >
> >  static void
> > @@ -817,7 +825,7 @@ flush_pipeline_before_pipeline_select(struct
> anv_cmd_buffer *cmd_buffer,
> >      * hardware too.
> >      */
> >     if (pipeline == GPGPU)
> > -      anv_batch_emit(&cmd_buffer->batch,
> GENX(3DSTATE_CC_STATE_POINTERS));
> > +      anv_batch_emit_blk(&cmd_buffer->batch,
> GENX(3DSTATE_CC_STATE_POINTERS), t);
> >  #elif GEN_GEN <= 7
> >        /* From "BXML » GT » MI » vol1a GPU Overview » [Instruction]
> >         * PIPELINE_SELECT [DevBWR+]":
> > @@ -853,11 +861,13 @@ genX(flush_pipeline_select_3d)(struct
> anv_cmd_buffer *cmd_buffer)
> >     if (cmd_buffer->state.current_pipeline != _3D) {
> >        flush_pipeline_before_pipeline_select(cmd_buffer, _3D);
> >
> > -      anv_batch_emit(&cmd_buffer->batch, GENX(PIPELINE_SELECT),
> > +      anv_batch_emit_blk(&cmd_buffer->batch, GENX(PIPELINE_SELECT), ps)
> {
> >  #if GEN_GEN >= 9
> > -                     .MaskBits = 3,
> > +         ps.MaskBits = 3;
> >  #endif
> > -                     .PipelineSelection = _3D);
> > +         ps.PipelineSelection = _3D;
> > +      }
> > +
> >        cmd_buffer->state.current_pipeline = _3D;
> >     }
> >  }
> > @@ -868,11 +878,13 @@ genX(flush_pipeline_select_gpgpu)(struct
> anv_cmd_buffer *cmd_buffer)
> >     if (cmd_buffer->state.current_pipeline != GPGPU) {
> >        flush_pipeline_before_pipeline_select(cmd_buffer, GPGPU);
> >
> > -      anv_batch_emit(&cmd_buffer->batch, GENX(PIPELINE_SELECT),
> > +      anv_batch_emit_blk(&cmd_buffer->batch, GENX(PIPELINE_SELECT), ps)
> {
> >  #if GEN_GEN >= 9
> > -                     .MaskBits = 3,
> > +         ps.MaskBits = 3;
> >  #endif
> > -                     .PipelineSelection = GPGPU);
> > +         ps.PipelineSelection = GPGPU;
> > +      }
> > +
> >        cmd_buffer->state.current_pipeline = GPGPU;
> >     }
> >  }
> >
>
>

_______________________________________________
mesa-dev mailing list
mesa-dev@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/mesa-dev

Re: [Mesa-dev] [PATCH 07/18] anv/cmd_buffer: Use the new emit macro for compute shader dispatch

Reply via email to