From: Nicolai Hähnle <nicolai.haeh...@amd.com>

---
 src/amd/common/ac_nir_to_llvm.c | 114 +++++++++++++++++++++-------------------
 1 file changed, 59 insertions(+), 55 deletions(-)

diff --git a/src/amd/common/ac_nir_to_llvm.c b/src/amd/common/ac_nir_to_llvm.c
index d2238c3..e3d1529 100644
--- a/src/amd/common/ac_nir_to_llvm.c
+++ b/src/amd/common/ac_nir_to_llvm.c
@@ -2177,46 +2177,47 @@ static LLVMValueRef visit_load_push_constant(struct nir_to_llvm_context *ctx,
        return LLVMBuildLoad(ctx->builder, ptr, "");
 }
 
 static LLVMValueRef visit_get_buffer_size(struct ac_nir_context *ctx,
                                           const nir_intrinsic_instr *instr)
 {
        LLVMValueRef desc = get_src(ctx, instr->src[0]);
 
        return get_buffer_size(ctx, desc, false);
 }
-static void visit_store_ssbo(struct nir_to_llvm_context *ctx,
+static void visit_store_ssbo(struct ac_nir_context *ctx,
                              nir_intrinsic_instr *instr)
 {
        const char *store_name;
-       LLVMValueRef src_data = get_src(ctx->nir, instr->src[0]);
-       LLVMTypeRef data_type = ctx->f32;
+       LLVMValueRef src_data = get_src(ctx, instr->src[0]);
+       LLVMTypeRef data_type = ctx->ac.f32;
        int elem_size_mult = get_elem_bits(&ctx->ac, LLVMTypeOf(src_data)) / 32;
        int components_32bit = elem_size_mult * instr->num_components;
        unsigned writemask = nir_intrinsic_write_mask(instr);
        LLVMValueRef base_data, base_offset;
        LLVMValueRef params[6];
+       LLVMValueRef i1false = LLVMConstInt(ctx->ac.i1, 0, false);
 
-       params[1] = ctx->abi.load_ssbo(&ctx->abi,
-                                      get_src(ctx->nir, instr->src[1]), true);
-       params[2] = LLVMConstInt(ctx->i32, 0, false); /* vindex */
-       params[4] = ctx->i1false;  /* glc */
-       params[5] = ctx->i1false;  /* slc */
+       params[1] = ctx->abi->load_ssbo(ctx->abi,
+                                       get_src(ctx, instr->src[1]), true);
+       params[2] = LLVMConstInt(ctx->ac.i32, 0, false); /* vindex */
+       params[4] = i1false;  /* glc */
+       params[5] = i1false;  /* slc */
 
        if (components_32bit > 1)
-               data_type = LLVMVectorType(ctx->f32, components_32bit);
+               data_type = LLVMVectorType(ctx->ac.f32, components_32bit);
 
        base_data = to_float(&ctx->ac, src_data);
        base_data = trim_vector(&ctx->ac, base_data, instr->num_components);
-       base_data = LLVMBuildBitCast(ctx->builder, base_data,
+       base_data = LLVMBuildBitCast(ctx->ac.builder, base_data,
                                     data_type, "");
-       base_offset = get_src(ctx->nir, instr->src[2]);      /* voffset */
+       base_offset = get_src(ctx, instr->src[2]);      /* voffset */
        while (writemask) {
                int start, count;
                LLVMValueRef data;
                LLVMValueRef offset;
                LLVMValueRef tmp;
                u_bit_scan_consecutive_range(&writemask, &start, &count);
 
                /* Due to an LLVM limitation, split 3-element writes
                 * into a 2-element and a 1-element write. */
                if (count == 3) {
@@ -2229,69 +2230,71 @@ static void visit_store_ssbo(struct nir_to_llvm_context *ctx,
 
                if (count > 4) {
                        writemask |= ((1u << (count - 4)) - 1u) << (start + 4);
                        count = 4;
                }
 
                if (count == 4) {
                        store_name = "llvm.amdgcn.buffer.store.v4f32";
                        data = base_data;
                } else if (count == 2) {
-                       tmp = LLVMBuildExtractElement(ctx->builder,
-                                                     base_data, LLVMConstInt(ctx->i32, start, false), "");
-                       data = LLVMBuildInsertElement(ctx->builder, LLVMGetUndef(ctx->v2f32), tmp,
-                                                     ctx->i32zero, "");
-
-                       tmp = LLVMBuildExtractElement(ctx->builder,
-                                                     base_data, LLVMConstInt(ctx->i32, start + 1, false), "");
-                       data = LLVMBuildInsertElement(ctx->builder, data, tmp,
-                                                     ctx->i32one, "");
+                       LLVMTypeRef v2f32 = LLVMVectorType(ctx->ac.f32, 2);
+
+                       tmp = LLVMBuildExtractElement(ctx->ac.builder,
+                                                     base_data, LLVMConstInt(ctx->ac.i32, start, false), "");
+                       data = LLVMBuildInsertElement(ctx->ac.builder, LLVMGetUndef(v2f32), tmp,
+                                                     ctx->ac.i32_0, "");
+
+                       tmp = LLVMBuildExtractElement(ctx->ac.builder,
+                                                     base_data, LLVMConstInt(ctx->ac.i32, start + 1, false), "");
+                       data = LLVMBuildInsertElement(ctx->ac.builder, data, tmp,
+                                                     ctx->ac.i32_1, "");
                        store_name = "llvm.amdgcn.buffer.store.v2f32";
 
                } else {
                        assert(count == 1);
                        if (get_llvm_num_components(base_data) > 1)
-                               data = LLVMBuildExtractElement(ctx->builder, base_data,
-                                                              LLVMConstInt(ctx->i32, start, false), "");
+                               data = LLVMBuildExtractElement(ctx->ac.builder, base_data,
+                                                              LLVMConstInt(ctx->ac.i32, start, false), "");
                        else
                                data = base_data;
                        store_name = "llvm.amdgcn.buffer.store.f32";
                }
 
                offset = base_offset;
                if (start != 0) {
-                       offset = LLVMBuildAdd(ctx->builder, offset, LLVMConstInt(ctx->i32, start * 4, false), "");
+                       offset = LLVMBuildAdd(ctx->ac.builder, offset, LLVMConstInt(ctx->ac.i32, start * 4, false), "");
                }
                params[0] = data;
                params[3] = offset;
                ac_build_intrinsic(&ctx->ac, store_name,
-                                  ctx->voidt, params, 6, 0);
+                                  ctx->ac.voidt, params, 6, 0);
        }
 }
 
-static LLVMValueRef visit_atomic_ssbo(struct nir_to_llvm_context *ctx,
+static LLVMValueRef visit_atomic_ssbo(struct ac_nir_context *ctx,
                                       const nir_intrinsic_instr *instr)
 {
        const char *name;
        LLVMValueRef params[6];
        int arg_count = 0;
 
        if (instr->intrinsic == nir_intrinsic_ssbo_atomic_comp_swap) {
-               params[arg_count++] = llvm_extract_elem(&ctx->ac, get_src(ctx->nir, instr->src[3]), 0);
+               params[arg_count++] = llvm_extract_elem(&ctx->ac, get_src(ctx, instr->src[3]), 0);
        }
-       params[arg_count++] = llvm_extract_elem(&ctx->ac, get_src(ctx->nir, instr->src[2]), 0);
-       params[arg_count++] = ctx->abi.load_ssbo(&ctx->abi,
-                                                get_src(ctx->nir, instr->src[0]),
+       params[arg_count++] = llvm_extract_elem(&ctx->ac, get_src(ctx, instr->src[2]), 0);
+       params[arg_count++] = ctx->abi->load_ssbo(ctx->abi,
+                                                get_src(ctx, instr->src[0]),
                                                 true);
-       params[arg_count++] = LLVMConstInt(ctx->i32, 0, false); /* vindex */
-       params[arg_count++] = get_src(ctx->nir, instr->src[1]);      /* voffset */
-       params[arg_count++] = ctx->i1false;  /* slc */
+       params[arg_count++] = LLVMConstInt(ctx->ac.i32, 0, false); /* vindex */
+       params[arg_count++] = get_src(ctx, instr->src[1]);      /* voffset */
+       params[arg_count++] = LLVMConstInt(ctx->ac.i1, 0, false);  /* slc */
 
        switch (instr->intrinsic) {
        case nir_intrinsic_ssbo_atomic_add:
                name = "llvm.amdgcn.buffer.atomic.add";
                break;
        case nir_intrinsic_ssbo_atomic_imin:
                name = "llvm.amdgcn.buffer.atomic.smin";
                break;
        case nir_intrinsic_ssbo_atomic_umin:
                name = "llvm.amdgcn.buffer.atomic.umin";
@@ -2314,83 +2317,84 @@ static LLVMValueRef visit_atomic_ssbo(struct nir_to_llvm_context *ctx,
        case nir_intrinsic_ssbo_atomic_exchange:
                name = "llvm.amdgcn.buffer.atomic.swap";
                break;
        case nir_intrinsic_ssbo_atomic_comp_swap:
                name = "llvm.amdgcn.buffer.atomic.cmpswap";
                break;
        default:
                abort();
        }
 
-       return ac_build_intrinsic(&ctx->ac, name, ctx->i32, params, arg_count, 0);
+       return ac_build_intrinsic(&ctx->ac, name, ctx->ac.i32, params, arg_count, 0);
 }
 
-static LLVMValueRef visit_load_buffer(struct nir_to_llvm_context *ctx,
+static LLVMValueRef visit_load_buffer(struct ac_nir_context *ctx,
                                       const nir_intrinsic_instr *instr)
 {
        LLVMValueRef results[2];
        int load_components;
        int num_components = instr->num_components;
        if (instr->dest.ssa.bit_size == 64)
                num_components *= 2;
 
        for (int i = 0; i < num_components; i += load_components) {
                load_components = MIN2(num_components - i, 4);
                const char *load_name;
-               LLVMTypeRef data_type = ctx->f32;
-               LLVMValueRef offset = LLVMConstInt(ctx->i32, i * 4, false);
-               offset = LLVMBuildAdd(ctx->builder, get_src(ctx->nir, instr->src[1]), offset, "");
+               LLVMTypeRef data_type = ctx->ac.f32;
+               LLVMValueRef offset = LLVMConstInt(ctx->ac.i32, i * 4, false);
+               offset = LLVMBuildAdd(ctx->ac.builder, get_src(ctx, instr->src[1]), offset, "");
 
                if (load_components == 3)
-                       data_type = LLVMVectorType(ctx->f32, 4);
+                       data_type = LLVMVectorType(ctx->ac.f32, 4);
                else if (load_components > 1)
-                       data_type = LLVMVectorType(ctx->f32, load_components);
+                       data_type = LLVMVectorType(ctx->ac.f32, load_components);
 
                if (load_components >= 3)
                        load_name = "llvm.amdgcn.buffer.load.v4f32";
                else if (load_components == 2)
                        load_name = "llvm.amdgcn.buffer.load.v2f32";
                else if (load_components == 1)
                        load_name = "llvm.amdgcn.buffer.load.f32";
                else
                        unreachable("unhandled number of components");
 
+               LLVMValueRef i1false = LLVMConstInt(ctx->ac.i1, 0, false);
                LLVMValueRef params[] = {
-                       ctx->abi.load_ssbo(&ctx->abi,
-                                          get_src(ctx->nir, instr->src[0]),
-                                          false),
-                       LLVMConstInt(ctx->i32, 0, false),
+                       ctx->abi->load_ssbo(ctx->abi,
+                                           get_src(ctx, instr->src[0]),
+                                           false),
+                       LLVMConstInt(ctx->ac.i32, 0, false),
                        offset,
-                       ctx->i1false,
-                       ctx->i1false,
+                       i1false,
+                       i1false,
                };
 
                results[i] = ac_build_intrinsic(&ctx->ac, load_name, data_type, params, 5, 0);
 
        }
 
        LLVMValueRef ret = results[0];
        if (num_components > 4 || num_components == 3) {
                LLVMValueRef masks[] = {
-                       LLVMConstInt(ctx->i32, 0, false), LLVMConstInt(ctx->i32, 1, false),
-                       LLVMConstInt(ctx->i32, 2, false), LLVMConstInt(ctx->i32, 3, false),
-                       LLVMConstInt(ctx->i32, 4, false), LLVMConstInt(ctx->i32, 5, false),
-                       LLVMConstInt(ctx->i32, 6, false), LLVMConstInt(ctx->i32, 7, false)
+                       LLVMConstInt(ctx->ac.i32, 0, false), LLVMConstInt(ctx->ac.i32, 1, false),
+                       LLVMConstInt(ctx->ac.i32, 2, false), LLVMConstInt(ctx->ac.i32, 3, false),
+                       LLVMConstInt(ctx->ac.i32, 4, false), LLVMConstInt(ctx->ac.i32, 5, false),
+                       LLVMConstInt(ctx->ac.i32, 6, false), LLVMConstInt(ctx->ac.i32, 7, false)
                };
 
                LLVMValueRef swizzle = LLVMConstVector(masks, num_components);
-               ret = LLVMBuildShuffleVector(ctx->builder, results[0],
+               ret = LLVMBuildShuffleVector(ctx->ac.builder, results[0],
                                             results[num_components > 4 ? 1 : 0], swizzle, "");
        }
 
-       return LLVMBuildBitCast(ctx->builder, ret,
-                               get_def_type(ctx->nir, &instr->dest.ssa), "");
+       return LLVMBuildBitCast(ctx->ac.builder, ret,
+                               get_def_type(ctx, &instr->dest.ssa), "");
 }
 
 static LLVMValueRef visit_load_ubo_buffer(struct ac_nir_context *ctx,
                                           const nir_intrinsic_instr *instr)
 {
        LLVMValueRef results[8], ret;
        LLVMValueRef rsrc = get_src(ctx, instr->src[0]);
        LLVMValueRef offset = get_src(ctx, instr->src[1]);
        int num_components = instr->num_components;
 
@@ -3927,36 +3931,36 @@ static void visit_intrinsic(struct ac_nir_context *ctx,
        case nir_intrinsic_load_local_invocation_index:
                result = visit_load_local_invocation_index(ctx->nctx);
                break;
        case nir_intrinsic_load_push_constant:
                result = visit_load_push_constant(ctx->nctx, instr);
                break;
        case nir_intrinsic_vulkan_resource_index:
                result = visit_vulkan_resource_index(ctx->nctx, instr);
                break;
        case nir_intrinsic_store_ssbo:
-               visit_store_ssbo(ctx->nctx, instr);
+               visit_store_ssbo(ctx, instr);
                break;
        case nir_intrinsic_load_ssbo:
-               result = visit_load_buffer(ctx->nctx, instr);
+               result = visit_load_buffer(ctx, instr);
                break;
        case nir_intrinsic_ssbo_atomic_add:
        case nir_intrinsic_ssbo_atomic_imin:
        case nir_intrinsic_ssbo_atomic_umin:
        case nir_intrinsic_ssbo_atomic_imax:
        case nir_intrinsic_ssbo_atomic_umax:
        case nir_intrinsic_ssbo_atomic_and:
        case nir_intrinsic_ssbo_atomic_or:
        case nir_intrinsic_ssbo_atomic_xor:
        case nir_intrinsic_ssbo_atomic_exchange:
        case nir_intrinsic_ssbo_atomic_comp_swap:
-               result = visit_atomic_ssbo(ctx->nctx, instr);
+               result = visit_atomic_ssbo(ctx, instr);
                break;
        case nir_intrinsic_load_ubo:
                result = visit_load_ubo_buffer(ctx, instr);
                break;
        case nir_intrinsic_get_buffer_size:
                result = visit_get_buffer_size(ctx, instr);
                break;
        case nir_intrinsic_load_var:
                result = visit_load_var(ctx, instr);
                break;
-- 
2.9.3

_______________________________________________
mesa-dev mailing list
mesa-dev@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/mesa-dev

Reply via email to