Re: [Mesa-dev] [PATCH 4/4] radv: rework how the number of VGPRs is computed
r-b for the series On Wed, Jun 26, 2019 at 3:07 PM Samuel Pitoiset wrote: > > Just a cleanup, it shouldn't change anything. > > Signed-off-by: Samuel Pitoiset > --- > src/amd/vulkan/radv_nir_to_llvm.c | 22 > src/amd/vulkan/radv_shader.c | 34 --- > src/amd/vulkan/radv_shader.h | 1 - > 3 files changed, 31 insertions(+), 26 deletions(-) > > diff --git a/src/amd/vulkan/radv_nir_to_llvm.c > b/src/amd/vulkan/radv_nir_to_llvm.c > index d6f286fe4ec..211fc4aec47 100644 > --- a/src/amd/vulkan/radv_nir_to_llvm.c > +++ b/src/amd/vulkan/radv_nir_to_llvm.c > @@ -2191,14 +2191,6 @@ handle_vs_input_decl(struct radv_shader_context *ctx, > buffer_index = > LLVMBuildUDiv(ctx->ac.builder, buffer_index, > > LLVMConstInt(ctx->ac.i32, divisor, 0), ""); > } > - > - if (ctx->options->key.vs.as_ls) { > - ctx->shader_info->vs.vgpr_comp_cnt = > - MAX2(2, > ctx->shader_info->vs.vgpr_comp_cnt); > - } else { > - ctx->shader_info->vs.vgpr_comp_cnt = > - MAX2(1, > ctx->shader_info->vs.vgpr_comp_cnt); > - } > } else { > buffer_index = ctx->ac.i32_0; > } > @@ -3044,8 +3036,6 @@ handle_vs_outputs_post(struct radv_shader_context *ctx, > LLVMValueRef values[4]; > > values[0] = ctx->vs_prim_id; > - ctx->shader_info->vs.vgpr_comp_cnt = MAX2(2, > - > ctx->shader_info->vs.vgpr_comp_cnt); > for (unsigned j = 1; j < 4; j++) > values[j] = ctx->ac.f32_0; > > @@ -3751,15 +3741,6 @@ LLVMModuleRef ac_translate_nir_to_llvm(struct > ac_llvm_compiler *ac_llvm, > ctx.tcs_vertices_per_patch = > shaders[i]->info.tess.tcs_vertices_out; > ctx.tcs_num_patches = > ctx.options->key.tes.num_patches; > } else if (shaders[i]->info.stage == MESA_SHADER_VERTEX) { > - if (shader_info->info.vs.needs_instance_id) { > - if (ctx.options->key.vs.as_ls) { > - ctx.shader_info->vs.vgpr_comp_cnt = > - MAX2(2, > ctx.shader_info->vs.vgpr_comp_cnt); > - } else { > - ctx.shader_info->vs.vgpr_comp_cnt = > - MAX2(1, > ctx.shader_info->vs.vgpr_comp_cnt); > - } > - } > ctx.abi.load_base_vertex = radv_load_base_vertex; > } else if (shaders[i]->info.stage == MESA_SHADER_FRAGMENT) { > shader_info->fs.can_discard = > shaders[i]->info.fs.uses_discard; > @@ -3994,9 +3975,6 @@ ac_fill_shader_info(struct radv_shader_variant_info > *shader_info, struct nir_sha > case MESA_SHADER_VERTEX: > shader_info->vs.as_es = options->key.vs.as_es; > shader_info->vs.as_ls = options->key.vs.as_ls; > -/* in LS mode we need at least 1, invocation id needs 2, > handled elsewhere */ > -if (options->key.vs.as_ls) > -shader_info->vs.vgpr_comp_cnt = MAX2(1, > shader_info->vs.vgpr_comp_cnt); > break; > default: > break; > diff --git a/src/amd/vulkan/radv_shader.c b/src/amd/vulkan/radv_shader.c > index 5205dc1bfc5..0ec0d67e3b6 100644 > --- a/src/amd/vulkan/radv_shader.c > +++ b/src/amd/vulkan/radv_shader.c > @@ -507,13 +507,40 @@ radv_fill_shader_variant(struct radv_device *device, > break; > case MESA_SHADER_TESS_CTRL: > if (device->physical_device->rad_info.chip_class >= GFX9) { > - vgpr_comp_cnt = variant->info.vs.vgpr_comp_cnt; > + /* We need at least 2 components for LS. > +* VGPR0-3: (VertexID, RelAutoindex, InstanceID / > StepRate0, InstanceID). > +* StepRate0 is set to 1. so that VGPR3 doesn't have > to be loaded. > +*/ > + vgpr_comp_cnt = info->vs.needs_instance_id ? 2 : 1; > } else { > variant->rsrc2 |= S_00B12C_OC_LDS_EN(1); > } > break; > case MESA_SHADER_VERTEX: > - vgpr_comp_cnt = variant->info.vs.vgpr_comp_cnt; > + if (variant->info.vs.as_ls) { > +
[Mesa-dev] [PATCH 4/4] radv: rework how the number of VGPRs is computed
Just a cleanup, it shouldn't change anything. Signed-off-by: Samuel Pitoiset --- src/amd/vulkan/radv_nir_to_llvm.c | 22 src/amd/vulkan/radv_shader.c | 34 --- src/amd/vulkan/radv_shader.h | 1 - 3 files changed, 31 insertions(+), 26 deletions(-) diff --git a/src/amd/vulkan/radv_nir_to_llvm.c b/src/amd/vulkan/radv_nir_to_llvm.c index d6f286fe4ec..211fc4aec47 100644 --- a/src/amd/vulkan/radv_nir_to_llvm.c +++ b/src/amd/vulkan/radv_nir_to_llvm.c @@ -2191,14 +2191,6 @@ handle_vs_input_decl(struct radv_shader_context *ctx, buffer_index = LLVMBuildUDiv(ctx->ac.builder, buffer_index, LLVMConstInt(ctx->ac.i32, divisor, 0), ""); } - - if (ctx->options->key.vs.as_ls) { - ctx->shader_info->vs.vgpr_comp_cnt = - MAX2(2, ctx->shader_info->vs.vgpr_comp_cnt); - } else { - ctx->shader_info->vs.vgpr_comp_cnt = - MAX2(1, ctx->shader_info->vs.vgpr_comp_cnt); - } } else { buffer_index = ctx->ac.i32_0; } @@ -3044,8 +3036,6 @@ handle_vs_outputs_post(struct radv_shader_context *ctx, LLVMValueRef values[4]; values[0] = ctx->vs_prim_id; - ctx->shader_info->vs.vgpr_comp_cnt = MAX2(2, - ctx->shader_info->vs.vgpr_comp_cnt); for (unsigned j = 1; j < 4; j++) values[j] = ctx->ac.f32_0; @@ -3751,15 +3741,6 @@ LLVMModuleRef ac_translate_nir_to_llvm(struct ac_llvm_compiler *ac_llvm, ctx.tcs_vertices_per_patch = shaders[i]->info.tess.tcs_vertices_out; ctx.tcs_num_patches = ctx.options->key.tes.num_patches; } else if (shaders[i]->info.stage == MESA_SHADER_VERTEX) { - if (shader_info->info.vs.needs_instance_id) { - if (ctx.options->key.vs.as_ls) { - ctx.shader_info->vs.vgpr_comp_cnt = - MAX2(2, ctx.shader_info->vs.vgpr_comp_cnt); - } else { - ctx.shader_info->vs.vgpr_comp_cnt = - MAX2(1, ctx.shader_info->vs.vgpr_comp_cnt); - } - } ctx.abi.load_base_vertex = radv_load_base_vertex; } else if (shaders[i]->info.stage == MESA_SHADER_FRAGMENT) { shader_info->fs.can_discard = shaders[i]->info.fs.uses_discard; @@ -3994,9 +3975,6 @@ ac_fill_shader_info(struct radv_shader_variant_info *shader_info, struct nir_sha case MESA_SHADER_VERTEX: shader_info->vs.as_es = options->key.vs.as_es; shader_info->vs.as_ls = options->key.vs.as_ls; -/* in LS mode we need at least 1, invocation id needs 2, handled elsewhere */ -if (options->key.vs.as_ls) -shader_info->vs.vgpr_comp_cnt = MAX2(1, shader_info->vs.vgpr_comp_cnt); break; default: break; diff --git a/src/amd/vulkan/radv_shader.c b/src/amd/vulkan/radv_shader.c index 5205dc1bfc5..0ec0d67e3b6 100644 --- a/src/amd/vulkan/radv_shader.c +++ b/src/amd/vulkan/radv_shader.c @@ -507,13 +507,40 @@ radv_fill_shader_variant(struct radv_device *device, break; case MESA_SHADER_TESS_CTRL: if (device->physical_device->rad_info.chip_class >= GFX9) { - vgpr_comp_cnt = variant->info.vs.vgpr_comp_cnt; + /* We need at least 2 components for LS. +* VGPR0-3: (VertexID, RelAutoindex, InstanceID / StepRate0, InstanceID). +* StepRate0 is set to 1. so that VGPR3 doesn't have to be loaded. +*/ + vgpr_comp_cnt = info->vs.needs_instance_id ? 2 : 1; } else { variant->rsrc2 |= S_00B12C_OC_LDS_EN(1); } break; case MESA_SHADER_VERTEX: - vgpr_comp_cnt = variant->info.vs.vgpr_comp_cnt; + if (variant->info.vs.as_ls) { + assert(device->physical_device->rad_info.chip_class <= GFX8); + /* We need at least 2 components for LS. +* VGPR0-3: (VertexID, RelAutoindex, InstanceID / StepRate0, InstanceID). +* StepRate0 is set to 1.