Signed-off-by: Bas Nieuwenhuizen <[email protected]>
---
docs/GL3.txt | 4 ++--
docs/relnotes/11.3.0.html | 1 +
src/gallium/drivers/radeon/r600_pipe_common.c | 21 ++++++++++++++++-----
src/gallium/drivers/radeonsi/si_pipe.c | 3 ++-
4 files changed, 21 insertions(+), 8 deletions(-)
diff --git a/docs/GL3.txt b/docs/GL3.txt
index 6bfbd09..6ea8d5c 100644
--- a/docs/GL3.txt
+++ b/docs/GL3.txt
@@ -167,7 +167,7 @@ GL 4.3, GLSL 4.30:
GL_ARB_arrays_of_arrays DONE (all drivers that
support GLSL 1.30)
GL_ARB_ES3_compatibility DONE (all drivers that
support GLSL 3.30)
GL_ARB_clear_buffer_object DONE (all drivers)
- GL_ARB_compute_shader DONE (i965)
+ GL_ARB_compute_shader DONE (i965, radeonsi)
GL_ARB_copy_image DONE (i965, nv50,
nvc0, r600, radeonsi)
GL_KHR_debug DONE (all drivers)
GL_ARB_explicit_uniform_location DONE (all drivers that
support GLSL)
@@ -225,7 +225,7 @@ GL 4.5, GLSL 4.50:
These are the extensions cherry-picked to make GLES 3.1
GLES3.1, GLSL ES 3.1
GL_ARB_arrays_of_arrays DONE (all drivers that
support GLSL 1.30)
- GL_ARB_compute_shader DONE (i965)
+ GL_ARB_compute_shader DONE (i965, radeonsi)
GL_ARB_draw_indirect DONE (i965, nvc0,
r600, radeonsi, llvmpipe, softpipe)
GL_ARB_explicit_uniform_location DONE (all drivers that
support GLSL)
GL_ARB_framebuffer_no_attachments DONE (i965)
diff --git a/docs/relnotes/11.3.0.html b/docs/relnotes/11.3.0.html
index c4e3f36..8624924 100644
--- a/docs/relnotes/11.3.0.html
+++ b/docs/relnotes/11.3.0.html
@@ -44,6 +44,7 @@ Note: some of the new features are only available with
certain drivers.
</p>
<ul>
+<li>GL_ARB_compute_shader on radeonsi</li>
<li>GL_ARB_internalformat_query2 on all drivers</li>
<li>GL_ARB_shader_atomic_counters on radeonsi</li>
<li>GL_ARB_shader_atomic_counter_ops on nvc0, radeonsi</li>
diff --git a/src/gallium/drivers/radeon/r600_pipe_common.c
b/src/gallium/drivers/radeon/r600_pipe_common.c
index 32bd6e4..1ab69e8 100644
--- a/src/gallium/drivers/radeon/r600_pipe_common.c
+++ b/src/gallium/drivers/radeon/r600_pipe_common.c
@@ -654,23 +654,34 @@ static int r600_get_compute_param(struct pipe_screen
*screen,
uint64_t *grid_size = ret;
grid_size[0] = 65535;
grid_size[1] = 65535;
- grid_size[2] = 1;
+ grid_size[2] = 65536;
}
return 3 * sizeof(uint64_t) ;
case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:
if (ret) {
uint64_t *block_size = ret;
- block_size[0] = 256;
- block_size[1] = 256;
- block_size[2] = 256;
+ if (rscreen->family > CHIP_ARUBA && HAVE_LLVM >= 0x309
&&
+ ir_type == PIPE_SHADER_IR_TGSI) {
+ block_size[0] = 2048;
+ block_size[1] = 2048;
+ block_size[2] = 2048;
+ } else {
+ block_size[0] = 256;
+ block_size[1] = 256;
+ block_size[2] = 256;
+ }
}
return 3 * sizeof(uint64_t);
case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
if (ret) {
uint64_t *max_threads_per_block = ret;
- *max_threads_per_block = 256;
+ if (rscreen->family > CHIP_ARUBA && HAVE_LLVM >= 0x309
&&
+ ir_type == PIPE_SHADER_IR_TGSI)
+ *max_threads_per_block = 2048;
+ else
+ *max_threads_per_block = 256;
}
return sizeof(uint64_t);
diff --git a/src/gallium/drivers/radeonsi/si_pipe.c
b/src/gallium/drivers/radeonsi/si_pipe.c
index 4f837ef..f9e3e8c 100644
--- a/src/gallium/drivers/radeonsi/si_pipe.c
+++ b/src/gallium/drivers/radeonsi/si_pipe.c
@@ -462,7 +462,8 @@ static int si_get_shader_param(struct pipe_screen* pscreen,
unsigned shader, enu
return PIPE_SHADER_IR_NATIVE;
case PIPE_SHADER_CAP_SUPPORTED_IRS:
- return 0;
+ return (HAVE_LLVM >= 0x309 ? 1 << PIPE_SHADER_IR_TGSI :
0) |
+ (1 << PIPE_SHADER_IR_NATIVE);
case PIPE_SHADER_CAP_DOUBLES:
return HAVE_LLVM >= 0x0307;
--
2.7.4
_______________________________________________
mesa-dev mailing list
[email protected]
https://lists.freedesktop.org/mailman/listinfo/mesa-dev