[Mesa-dev] [PATCH 04/14] radv/tess: drop tcs_in_layout setting completely.
From: Dave AirlieInline all calcs at shader creation. Signed-off-by: Dave Airlie --- src/amd/vulkan/radv_nir_to_llvm.c | 26 +- src/amd/vulkan/radv_pipeline.c| 12 ++-- src/amd/vulkan/radv_shader.h | 1 + 3 files changed, 24 insertions(+), 15 deletions(-) diff --git a/src/amd/vulkan/radv_nir_to_llvm.c b/src/amd/vulkan/radv_nir_to_llvm.c index 64b50cab0a1..ee32549bde6 100644 --- a/src/amd/vulkan/radv_nir_to_llvm.c +++ b/src/amd/vulkan/radv_nir_to_llvm.c @@ -65,7 +65,6 @@ struct radv_shader_context { LLVMValueRef tcs_offchip_layout; LLVMValueRef tcs_out_offsets; LLVMValueRef tcs_out_layout; - LLVMValueRef tcs_in_layout; LLVMValueRef oc_lds; LLVMValueRef merged_wave_info; LLVMValueRef tess_factor_offset; @@ -108,6 +107,7 @@ struct radv_shader_context { uint32_t tcs_patch_outputs_read; uint64_t tcs_outputs_read; uint32_t tcs_vertices_per_patch; + uint32_t tcs_num_inputs; }; enum radeon_llvm_calling_convention { @@ -162,7 +162,11 @@ static LLVMValueRef get_tcs_in_patch_stride(struct radv_shader_context *ctx) { assert (ctx->stage == MESA_SHADER_TESS_CTRL); - return ac_unpack_param(>ac, ctx->tcs_in_layout, 0, 13); + uint32_t input_vertex_size = ctx->tcs_num_inputs * 16; + uint32_t input_patch_size = ctx->options->key.tcs.input_vertices * input_vertex_size; + + input_patch_size /= 4; + return LLVMConstInt(ctx->ac.i32, input_patch_size, false); } static LLVMValueRef @@ -462,7 +466,7 @@ static void allocate_user_sgprs(struct radv_shader_context *ctx, if (previous_stage == MESA_SHADER_VERTEX) user_sgpr_info->sgpr_count += count_vs_user_sgprs(ctx); } - user_sgpr_info->sgpr_count += 4; + user_sgpr_info->sgpr_count += 3; break; case MESA_SHADER_TESS_EVAL: user_sgpr_info->sgpr_count += 1; @@ -764,8 +768,6 @@ static void create_function(struct radv_shader_context *ctx, >tcs_out_offsets); add_arg(, ARG_SGPR, ctx->ac.i32, >tcs_out_layout); - add_arg(, ARG_SGPR, ctx->ac.i32, - >tcs_in_layout); if (needs_view_index) add_arg(, ARG_SGPR, ctx->ac.i32, >abi.view_index); @@ -789,8 +791,6 @@ static void create_function(struct radv_shader_context *ctx, >tcs_out_offsets); add_arg(, ARG_SGPR, ctx->ac.i32, >tcs_out_layout); - add_arg(, ARG_SGPR, ctx->ac.i32, - >tcs_in_layout); if (needs_view_index) add_arg(, ARG_SGPR, ctx->ac.i32, >abi.view_index); @@ -999,7 +999,7 @@ static void create_function(struct radv_shader_context *ctx, case MESA_SHADER_TESS_CTRL: set_vs_specific_input_locs(ctx, stage, has_previous_stage, previous_stage, _sgpr_idx); - set_loc_shader(ctx, AC_UD_TCS_OFFCHIP_LAYOUT, _sgpr_idx, 4); + set_loc_shader(ctx, AC_UD_TCS_OFFCHIP_LAYOUT, _sgpr_idx, 3); if (ctx->abi.view_index) set_loc_shader(ctx, AC_UD_VIEW_INDEX, _sgpr_idx, 1); break; @@ -1226,7 +1226,8 @@ load_tcs_varyings(struct ac_shader_abi *abi, unsigned param = shader_io_get_unique_index(location); if (load_input) { - stride = ac_unpack_param(>ac, ctx->tcs_in_layout, 13, 8); + uint32_t input_vertex_size = (ctx->tcs_num_inputs * 16) / 4; + stride = LLVMConstInt(ctx->ac.i32, input_vertex_size, false); dw_addr = get_tcs_in_current_patch_offset(ctx); } else { if (!is_patch) { @@ -3020,6 +3021,10 @@ LLVMModuleRef ac_translate_nir_to_llvm(LLVMTargetMachineRef tm, ctx.abi.load_patch_vertices_in = load_patch_vertices_in; ctx.abi.store_tcs_outputs = store_tcs_output; ctx.tcs_vertices_per_patch = shaders[i]->info.tess.tcs_vertices_out; + if (shader_count == 1) + ctx.tcs_num_inputs = ctx.options->key.tcs.num_inputs; + else + ctx.tcs_num_inputs = util_last_bit64(shader_info->info.vs.ls_outputs_written); } else if (shaders[i]->info.stage == MESA_SHADER_TESS_EVAL) { ctx.tes_primitive_mode = shaders[i]->info.tess.primitive_mode; ctx.abi.load_tess_varyings =
[Mesa-dev] [PATCH 04/14] radv/tess: drop tcs_in_layout setting completely.
From: Dave AirlieInline all calcs at shader creation. Signed-off-by: Dave Airlie --- src/amd/common/ac_nir_to_llvm.c | 27 ++- src/amd/common/ac_nir_to_llvm.h | 1 + src/amd/vulkan/radv_pipeline.c | 12 ++-- 3 files changed, 25 insertions(+), 15 deletions(-) diff --git a/src/amd/common/ac_nir_to_llvm.c b/src/amd/common/ac_nir_to_llvm.c index ce3679abedc..923bfaabb97 100644 --- a/src/amd/common/ac_nir_to_llvm.c +++ b/src/amd/common/ac_nir_to_llvm.c @@ -84,7 +84,6 @@ struct radv_shader_context { LLVMValueRef tcs_offchip_layout; LLVMValueRef tcs_out_offsets; LLVMValueRef tcs_out_layout; - LLVMValueRef tcs_in_layout; LLVMValueRef oc_lds; LLVMValueRef merged_wave_info; LLVMValueRef tess_factor_offset; @@ -127,6 +126,7 @@ struct radv_shader_context { uint32_t tcs_patch_outputs_read; uint64_t tcs_outputs_read; uint32_t tcs_vertices_per_patch; + uint32_t tcs_num_inputs; }; static inline struct radv_shader_context * @@ -345,7 +345,11 @@ static LLVMValueRef get_tcs_in_patch_stride(struct radv_shader_context *ctx) { assert (ctx->stage == MESA_SHADER_TESS_CTRL); - return unpack_param(>ac, ctx->tcs_in_layout, 0, 13); + uint32_t input_vertex_size = ctx->tcs_num_inputs * 16; + uint32_t input_patch_size = ctx->options->key.tcs.input_vertices * input_vertex_size; + + input_patch_size /= 4; + return LLVMConstInt(ctx->ac.i32, input_patch_size, false); } static LLVMValueRef @@ -529,7 +533,7 @@ static void allocate_user_sgprs(struct radv_shader_context *ctx, if (previous_stage == MESA_SHADER_VERTEX) user_sgpr_info->sgpr_count += count_vs_user_sgprs(ctx); } - user_sgpr_info->sgpr_count += 4; + user_sgpr_info->sgpr_count += 3; break; case MESA_SHADER_TESS_EVAL: user_sgpr_info->sgpr_count += 1; @@ -802,8 +806,6 @@ static void create_function(struct radv_shader_context *ctx, >tcs_out_offsets); add_arg(, ARG_SGPR, ctx->ac.i32, >tcs_out_layout); - add_arg(, ARG_SGPR, ctx->ac.i32, - >tcs_in_layout); if (needs_view_index) add_arg(, ARG_SGPR, ctx->ac.i32, >abi.view_index); @@ -827,8 +829,6 @@ static void create_function(struct radv_shader_context *ctx, >tcs_out_offsets); add_arg(, ARG_SGPR, ctx->ac.i32, >tcs_out_layout); - add_arg(, ARG_SGPR, ctx->ac.i32, - >tcs_in_layout); if (needs_view_index) add_arg(, ARG_SGPR, ctx->ac.i32, >abi.view_index); @@ -1037,7 +1037,7 @@ static void create_function(struct radv_shader_context *ctx, case MESA_SHADER_TESS_CTRL: set_vs_specific_input_locs(ctx, stage, has_previous_stage, previous_stage, _sgpr_idx); - set_loc_shader(ctx, AC_UD_TCS_OFFCHIP_LAYOUT, _sgpr_idx, 4); + set_loc_shader(ctx, AC_UD_TCS_OFFCHIP_LAYOUT, _sgpr_idx, 3); if (ctx->abi.view_index) set_loc_shader(ctx, AC_UD_VIEW_INDEX, _sgpr_idx, 1); break; @@ -2857,7 +2857,9 @@ load_tcs_varyings(struct ac_shader_abi *abi, unsigned param = shader_io_get_unique_index(location); if (load_input) { - stride = unpack_param(>ac, ctx->tcs_in_layout, 13, 8); + uint32_t input_vertex_size = ctx->tcs_num_inputs * 16; + input_vertex_size /= 4; + stride = LLVMConstInt(ctx->ac.i32, input_vertex_size, false); dw_addr = get_tcs_in_current_patch_offset(ctx); } else { if (!is_patch) { @@ -6863,6 +6865,10 @@ LLVMModuleRef ac_translate_nir_to_llvm(LLVMTargetMachineRef tm, ctx.abi.load_patch_vertices_in = load_patch_vertices_in; ctx.abi.store_tcs_outputs = store_tcs_output; ctx.tcs_vertices_per_patch = shaders[i]->info.tess.tcs_vertices_out; + if (shader_count == 1) + ctx.tcs_num_inputs = ctx.options->key.tcs.num_inputs; + else + ctx.tcs_num_inputs = util_last_bit64(shader_info->info.vs.ls_outputs_written); } else if (shaders[i]->info.stage == MESA_SHADER_TESS_EVAL) { ctx.tes_primitive_mode = shaders[i]->info.tess.primitive_mode;