Mesa (main): llvmpipe: clean-up llvmpipe_get_query_result()

GitLab Mirror Tue, 04 Apr 2023 21:06:28 -0700

Module: Mesa
Branch: main
Commit: 6eaf2e7c16df7291bd8fc0a96b5522dd96cfa1a0
URL:    
http://cgit.freedesktop.org/mesa/mesa/commit/?id=6eaf2e7c16df7291bd8fc0a96b5522dd96cfa1a0


Author: Brian Paul <[email protected]>
Date:   Mon Apr  3 20:53:00 2023 -0600

llvmpipe: clean-up llvmpipe_get_query_result()

Get rid of the uint64 result pointer which was used by some query
types.  Handle each switch case with self-contained code.  Remove
unneeded casts.  Use MIN2/MAX2 macros.

Signed-off-by: Brian Paul <[email protected]>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/22281>

---

 src/gallium/drivers/llvmpipe/lp_query.c | 117 ++++++++++++++++++--------------
 1 file changed, 67 insertions(+), 50 deletions(-)

diff --git a/src/gallium/drivers/llvmpipe/lp_query.c 
b/src/gallium/drivers/llvmpipe/lp_query.c
index e9b5abf34bb..00005f0e309 100644
--- a/src/gallium/drivers/llvmpipe/lp_query.c
+++ b/src/gallium/drivers/llvmpipe/lp_query.c
@@ -93,12 +93,11 @@ static bool
 llvmpipe_get_query_result(struct pipe_context *pipe,
                           struct pipe_query *q,
                           bool wait,
-                          union pipe_query_result *vresult)
+                          union pipe_query_result *result)
 {
-   struct llvmpipe_screen *screen = llvmpipe_screen(pipe->screen);
-   unsigned num_threads = MAX2(1, screen->num_threads);
+   const struct llvmpipe_screen *screen = llvmpipe_screen(pipe->screen);
+   const unsigned num_threads = MAX2(1, screen->num_threads);
    struct llvmpipe_query *pq = llvmpipe_query(q);
-   uint64_t *result = (uint64_t *)vresult;
 
    if (pq->fence) {
       /* only have a fence if there was a scene */
@@ -113,84 +112,102 @@ llvmpipe_get_query_result(struct pipe_context *pipe,
       }
    }
 
-   /* Sum the results from each of the threads:
+   /* Always initialize the first 64-bit result word to zero since some
+    * callers don't consider whether the result is actually a 1-byte or 4-byte
+    * quantity.
     */
-   *result = 0;
+   result->u64 = 0;
 
+   /* Combine the per-thread results */
    switch (pq->type) {
    case PIPE_QUERY_OCCLUSION_COUNTER:
-      for (unsigned i = 0; i < num_threads; i++) {
-         *result += pq->end[i];
+      {
+         uint64_t sum = 0;
+         for (unsigned i = 0; i < num_threads; i++) {
+            sum += pq->end[i];
+         }
+         result->u64 = sum;
       }
       break;
    case PIPE_QUERY_OCCLUSION_PREDICATE:
    case PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE:
+      result->b = false;
       for (unsigned i = 0; i < num_threads; i++) {
          /* safer (still not guaranteed) when there's an overflow */
-         vresult->b = vresult->b || pq->end[i];
+         if (pq->end[i] > 0) {
+            result->b = true;
+            break;
+         }
       }
       break;
    case PIPE_QUERY_TIMESTAMP:
-      for (unsigned i = 0; i < num_threads; i++) {
-         if (pq->end[i] > *result) {
-            *result = pq->end[i];
+      {
+         uint64_t max_time = 0;
+         for (unsigned i = 0; i < num_threads; i++) {
+            max_time = MAX2(max_time, pq->end[i]);
          }
+         result->u64 = max_time;
       }
       break;
-   case PIPE_QUERY_TIME_ELAPSED: {
-      uint64_t start = (uint64_t)-1, end = 0;
-      for (unsigned i = 0; i < num_threads; i++) {
-         if (pq->start[i] && pq->start[i] < start)
-            start = pq->start[i];
-         if (pq->end[i] && pq->end[i] > end)
-            end = pq->end[i];
+   case PIPE_QUERY_TIME_ELAPSED:
+      {
+         uint64_t start = UINT64_MAX, end = 0;
+         for (unsigned i = 0; i < num_threads; i++) {
+            if (pq->start[i]) {
+               start = MIN2(start, pq->start[i]);
+            }
+            if (pq->end[i]) {
+               end = MAX2(end, pq->end[i]);
+            }
+         }
+         result->u64 = end - start;
       }
-      *result = end - start;
       break;
-   }
-   case PIPE_QUERY_TIMESTAMP_DISJOINT: {
-      struct pipe_query_data_timestamp_disjoint *td =
-         (struct pipe_query_data_timestamp_disjoint *)vresult;
+   case PIPE_QUERY_TIMESTAMP_DISJOINT:
       /* os_get_time_nano return nanoseconds */
-      td->frequency = UINT64_C(1000000000);
-      td->disjoint = false;
-   }
+      result->timestamp_disjoint.frequency = UINT64_C(1000000000);
+      result->timestamp_disjoint.disjoint = false;
       break;
    case PIPE_QUERY_GPU_FINISHED:
-      vresult->b = true;
+      result->b = true;
       break;
    case PIPE_QUERY_PRIMITIVES_GENERATED:
-      *result = pq->num_primitives_generated[0];
+      result->u64 = pq->num_primitives_generated[0];
       break;
    case PIPE_QUERY_PRIMITIVES_EMITTED:
-      *result = pq->num_primitives_written[0];
+      result->u64 = pq->num_primitives_written[0];
       break;
    case PIPE_QUERY_SO_OVERFLOW_ANY_PREDICATE:
-      vresult->b = false;
-      for (unsigned s = 0; s < PIPE_MAX_VERTEX_STREAMS; s++)
-         vresult->b |= pq->num_primitives_generated[s] > 
pq->num_primitives_written[s];
+      result->b = false;
+      for (unsigned s = 0; s < PIPE_MAX_VERTEX_STREAMS; s++) {
+         if (pq->num_primitives_generated[s] > pq->num_primitives_written[s]) {
+            result->b = true;
+            break;
+         }
+      }
       break;
    case PIPE_QUERY_SO_OVERFLOW_PREDICATE:
-      vresult->b = pq->num_primitives_generated[0] > 
pq->num_primitives_written[0];
+      result->b = pq->num_primitives_generated[0] > 
pq->num_primitives_written[0];
       break;
-   case PIPE_QUERY_SO_STATISTICS: {
-      struct pipe_query_data_so_statistics *stats =
-         (struct pipe_query_data_so_statistics *)vresult;
-      stats->num_primitives_written = pq->num_primitives_written[0];
-      stats->primitives_storage_needed = pq->num_primitives_generated[0];
-   }
+   case PIPE_QUERY_SO_STATISTICS:
+      result->so_statistics.num_primitives_written = 
pq->num_primitives_written[0];
+      result->so_statistics.primitives_storage_needed = 
pq->num_primitives_generated[0];
       break;
-   case PIPE_QUERY_PIPELINE_STATISTICS: {
-      struct pipe_query_data_pipeline_statistics *stats =
-         (struct pipe_query_data_pipeline_statistics *)vresult;
-      /* only ps_invocations come from binned query */
-      pq->stats.ps_invocations = 0;
-      for (unsigned i = 0; i < num_threads; i++) {
-         pq->stats.ps_invocations += pq->end[i];
+   case PIPE_QUERY_PIPELINE_STATISTICS:
+      {
+         /* only ps_invocations are per-bin/thread */
+         uint64_t sum = 0;
+         for (unsigned i = 0; i < num_threads; i++) {
+            sum += pq->end[i];
+         }
+         /* The FS/PS operates on a block of pixels at a time.  The counter is
+          * incremented per block so we multiply by pixels per block here.
+          * This will not be a pixel-exact result.
+          */
+         pq->stats.ps_invocations =
+            sum * LP_RASTER_BLOCK_SIZE * LP_RASTER_BLOCK_SIZE;
+         result->pipeline_statistics = pq->stats;
       }
-      pq->stats.ps_invocations *= LP_RASTER_BLOCK_SIZE * LP_RASTER_BLOCK_SIZE;
-      *stats = pq->stats;
-   }
       break;
    default:
       assert(0);

Mesa (main): llvmpipe: clean-up llvmpipe_get_query_result()

Reply via email to