From: Connor Abbott <cwabbo...@gmail.com>

---
 src/amd/common/ac_nir_to_llvm.c | 72 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 72 insertions(+)

diff --git a/src/amd/common/ac_nir_to_llvm.c b/src/amd/common/ac_nir_to_llvm.c
index b39b873..bafe4d3 100644
--- a/src/amd/common/ac_nir_to_llvm.c
+++ b/src/amd/common/ac_nir_to_llvm.c
@@ -4142,6 +4142,78 @@ static void visit_intrinsic(struct ac_nir_context *ctx,
                                                         get_src(ctx, instr->src[0])),
                                       ctx->ac.i32, "");
                break;
+
+#define __REDUCE(op, identity, type, nir_suffix, reduce_type) /* emits two switch cases: subgroup_<op><suffix> and group_<op><suffix> */ \
+       case nir_intrinsic_subgroup_##op##nir_suffix: { \
+               LLVMValueRef src = ac_to_##type(&ctx->ac, \
+                                               get_src(ctx, instr->src[0])); \
+               LLVMTypeRef src_type = LLVMTypeOf(src); /* named so the `identity` argument can refer to it */ \
+               result = ac_build_subgroup_##reduce_type( \
+                       &ctx->ac, src, \
+                       ac_reduce_##op, identity); \
+               break; \
+       } \
+       case nir_intrinsic_group_##op##nir_suffix: { \
+               LLVMValueRef src = ac_to_##type(&ctx->ac, \
+                                               get_src(ctx, instr->src[0])); \
+               LLVMTypeRef src_type = LLVMTypeOf(src); /* named so the `identity` argument can refer to it */ \
+               LLVMValueRef wavefront_id = /* local invocation index >> 6, i.e. / 64 -- presumably the wave size; confirm */ \
+                       LLVMBuildLShr(ctx->ac.builder, \
+                                     visit_load_local_invocation_index(ctx->nctx), \
+                                     LLVMConstInt(ctx->ac.i32, 6, 0), ""); \
+               result = ac_build_group_##reduce_type( \
+                       &ctx->ac, src, \
+                       ac_reduce_##op, identity, \
+                       ctx->nctx->max_workgroup_size, \
+                       wavefront_id); \
+               break; \
+       } \
+
+#define REDUCE(name, ident, conv) /* six variants of one op: reduce, inclusive scan, exclusive scan, each plain and _nonuniform */ \
+       __REDUCE(name, ident, conv, , reduce) \
+       __REDUCE(name, ident, conv, _inclusive_scan, inclusive_scan) \
+       __REDUCE(name, ident, conv, _exclusive_scan, exclusive_scan) \
+       __REDUCE(name, ident, conv, _nonuniform, reduce_nonuniform) \
+       __REDUCE(name, ident, conv, \
+                _inclusive_scan_nonuniform, inclusive_scan_nonuniform) \
+       __REDUCE(name, ident, conv, \
+                _exclusive_scan_nonuniform, exclusive_scan_nonuniform) \
+
+       REDUCE(fadd, LLVMConstReal(src_type, 0), float)
+       REDUCE(iadd, LLVMConstInt(src_type, 0, 0), integer)
+       REDUCE(fmin, LLVMConstReal(src_type, INFINITY), float)
+       REDUCE(imin, LLVMConstInt(src_type, LLVMGetIntTypeWidth(src_type) == 64
+                                 ? INT64_MAX : INT32_MAX, 0), integer)
+       REDUCE(umin, LLVMConstInt(src_type, LLVMGetIntTypeWidth(src_type) == 64
+                                 ? UINT64_MAX : UINT32_MAX, 0), integer)
+       REDUCE(fmax, LLVMConstReal(src_type, -INFINITY), float)
+       REDUCE(imax, LLVMConstInt(src_type, LLVMGetIntTypeWidth(src_type) == 64
+                                 ? INT64_MIN : INT32_MIN, 0), integer)
+       REDUCE(umax, LLVMConstInt(src_type, 0, 0), integer)
+
+       case nir_intrinsic_quad_swizzle_amd:
+               result = ac_build_swizzle_quad(&ctx->ac,
+                                              get_src(ctx, instr->src[0]),
+                                              instr->const_index[0]);
+               break;
+
+       case nir_intrinsic_masked_swizzle_amd:
+               result = ac_build_swizzle_masked(&ctx->ac,
+                                                get_src(ctx, instr->src[0]),
+                                                instr->const_index[0]);
+               break;
+
+       case nir_intrinsic_write_invocation:
+               result = ac_build_writelane(&ctx->ac,
+                                           get_src(ctx, instr->src[0]),
+                                           get_src(ctx, instr->src[1]),
+                                           get_src(ctx, instr->src[2]));
+               break;
+
+       case nir_intrinsic_mbcnt_amd:
+               result = ac_build_mbcnt(&ctx->ac, get_src(ctx, instr->src[0]));
+               break;
+
        default:
                fprintf(stderr, "Unknown intrinsic: ");
                nir_print_instr(&instr->instr, stderr);
-- 
2.9.4

_______________________________________________
mesa-dev mailing list
mesa-dev@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/mesa-dev

Reply via email to