On Thu, May 24, 2018 at 2:56 PM, Jason Ekstrand <ja...@jlekstrand.net> wrote: > From: Francisco Jerez <curroje...@riseup.net> > > v2 (Jason Ekstrand): > - Disallow gl_SampleId in SIMD32 on gen7 > > Reviewed-by: Jason Ekstrand <ja...@jlekstrand.net> > --- > src/intel/compiler/brw_fs.cpp | 31 ++++++++++++++++++++++--------- > 1 file changed, 22 insertions(+), 9 deletions(-) > > diff --git a/src/intel/compiler/brw_fs.cpp b/src/intel/compiler/brw_fs.cpp > index ae59716..9ffa3ca 100644 > --- a/src/intel/compiler/brw_fs.cpp > +++ b/src/intel/compiler/brw_fs.cpp > @@ -861,6 +861,11 @@ fs_inst::size_read(int arg) const > return mlen * REG_SIZE; > break; > > + case FS_OPCODE_SET_SAMPLE_ID: > + if (arg == 1) > + return 1; > + break; > + > case FS_OPCODE_UNIFORM_PULL_CONSTANT_LOAD_GEN7: > /* The payload is actually stored in src1 */ > if (arg == 1) > @@ -1284,16 +1289,20 @@ fs_visitor::emit_sampleid_setup() > * TODO: These payload bits exist on Gen7 too, but they appear to > always > * be zero, so this code fails to work. We should find out why. > */ > - fs_reg tmp(VGRF, alloc.allocate(1), BRW_REGISTER_TYPE_UW); > + const fs_reg tmp = abld.vgrf(BRW_REGISTER_TYPE_UW); > + > + for (unsigned i = 0; i < DIV_ROUND_UP(dispatch_width, 16); i++) { > + const fs_builder hbld = abld.group(MIN2(16, dispatch_width), i); > + hbld.SHR(offset(tmp, hbld, i), > + stride(retype(brw_vec1_grf(1 + i, 0), > BRW_REGISTER_TYPE_UB), > + 1, 8, 0), > + brw_imm_v(0x44440000)); > + } > > - abld.SHR(tmp, fs_reg(stride(retype(brw_vec1_grf(1, 0), > - BRW_REGISTER_TYPE_UB), 1, 8, 0)), > - brw_imm_v(0x44440000)); > abld.AND(*reg, tmp, brw_imm_w(0xf)); > } else { > - const fs_reg t1 = component(fs_reg(VGRF, alloc.allocate(1), > - BRW_REGISTER_TYPE_UD), 0); > - const fs_reg t2(VGRF, alloc.allocate(1), BRW_REGISTER_TYPE_UW); > + const fs_reg t1 = component(abld.vgrf(BRW_REGISTER_TYPE_UD), 0); > + const fs_reg t2 = abld.vgrf(BRW_REGISTER_TYPE_UW); > > /* The PS will be run in MSDISPMODE_PERSAMPLE. For example with > * 8x multisampling, subspan 0 will represent sample N (where N > @@ -1323,8 +1332,12 @@ fs_visitor::emit_sampleid_setup() > brw_imm_ud(0xc0)); > abld.exec_all().group(1, 0).SHR(t1, t1, brw_imm_d(5)); > > - /* This works for both SIMD8 and SIMD16 */ > - abld.exec_all().group(4, 0).MOV(t2, brw_imm_v(0x3210)); > + /* This works for SIMD8-SIMD16. It also works for SIMD32 but only if > we > + * can assume 4x MSAA. Disallow it on IVB+ > + */ > + if (devinfo->gen >= 7) > + limit_dispatch_width(16, "gl_SampleId is unsupported in SIMD32 on > gen7"); > + abld.exec_all().group(8, 0).MOV(t2, brw_imm_v(0x32103210));
Can we mark this with FINISHME? _______________________________________________ mesa-dev mailing list mesa-dev@lists.freedesktop.org https://lists.freedesktop.org/mailman/listinfo/mesa-dev