Hi!

On 2020-06-29T13:16:51-0700, Julian Brown <jul...@codesourcery.com> wrote:
> This patch turns off the middle-end worker-partitioning support if the
> number of workers for an outlined offload function is one.  In that case,
> we do not need to perform the broadcasting/neutering code transformation.

ACK, thanks.

> --- a/gcc/omp-offload.c
> +++ b/gcc/omp-offload.c
> @@ -2165,7 +2165,20 @@ public:
>    /* opt_pass methods: */
>    virtual bool gate (function *)
>    {
> -    return flag_openacc && targetm.goacc.worker_partitioning;
> +    if (!flag_openacc || !targetm.goacc.worker_partitioning)
> +      return false;
> +
> +    tree attr = oacc_get_fn_attrib (current_function_decl);
> +
> +    if (!attr)
> +      /* Not an offloaded function.  */
> +      return false;

This last check implies that code in
'gcc/omp-oacc-neuter-broadcast.cc:execute_omp_oacc_neuter_broadcast'
ought to be simplified which currently does:

    tree attr = oacc_get_fn_attrib (current_function_decl);
    if (attr)

..., which now is always-true.

> +
> +    int worker_dim
> +      = oacc_get_fn_dim_size (current_function_decl, GOMP_DIM_WORKER);
> +
> +    /* No worker partitioning if we know the number of workers is 1.  */
> +    return worker_dim != 1;
>    };

Pushed to master branch commit 82792cc407d7a7ab99f37e8501d19be2e6164e50
"openacc: Turn off worker partitioning if num_workers==1", see attached.


Grüße
 Thomas


-----------------
Siemens Electronic Design Automation GmbH; Anschrift: Arnulfstraße 201, 80634 
München; Gesellschaft mit beschränkter Haftung; Geschäftsführer: Thomas 
Heurung, Frank Thürauf; Sitz der Gesellschaft: München; Registergericht 
München, HRB 106955
>From 82792cc407d7a7ab99f37e8501d19be2e6164e50 Mon Sep 17 00:00:00 2001
From: Julian Brown <jul...@codesourcery.com>
Date: Mon, 29 Jun 2020 13:16:51 -0700
Subject: [PATCH] openacc: Turn off worker partitioning if num_workers==1

This patch turns off the middle-end worker-partitioning support if the
number of workers for an outlined offload function is one.  In that case,
we do not need to perform the broadcasting/neutering code transformation.

	gcc/
	* omp-oacc-neuter-broadcast.cc
	(pass_omp_oacc_neuter_broadcast::gate): Disable if num_workers is
	1.
	(execute_omp_oacc_neuter_broadcast): Adjust.

Co-Authored-By: Thomas Schwinge <tho...@codesourcery.com>
---
 gcc/omp-oacc-neuter-broadcast.cc | 47 +++++++++++++++++++++-----------
 1 file changed, 31 insertions(+), 16 deletions(-)

diff --git a/gcc/omp-oacc-neuter-broadcast.cc b/gcc/omp-oacc-neuter-broadcast.cc
index d48627a6940..3fe92248c4e 100644
--- a/gcc/omp-oacc-neuter-broadcast.cc
+++ b/gcc/omp-oacc-neuter-broadcast.cc
@@ -1378,18 +1378,17 @@ execute_omp_oacc_neuter_broadcast ()
 
   /* If this is a routine, calculate MASK as if the outer levels are already
      partitioned.  */
-  tree attr = oacc_get_fn_attrib (current_function_decl);
-  if (attr)
-    {
-      tree dims = TREE_VALUE (attr);
-      unsigned ix;
-      for (ix = 0; ix != GOMP_DIM_MAX; ix++, dims = TREE_CHAIN (dims))
-	{
-	  tree allowed = TREE_PURPOSE (dims);
-	  if (allowed && integer_zerop (allowed))
-	    mask |= GOMP_DIM_MASK (ix);
-	}
-    }
+  {
+    tree attr = oacc_get_fn_attrib (current_function_decl);
+    tree dims = TREE_VALUE (attr);
+    unsigned ix;
+    for (ix = 0; ix != GOMP_DIM_MAX; ix++, dims = TREE_CHAIN (dims))
+      {
+	tree allowed = TREE_PURPOSE (dims);
+	if (allowed && integer_zerop (allowed))
+	  mask |= GOMP_DIM_MASK (ix);
+      }
+  }
 
   parallel_g *par = omp_sese_discover_pars (&bb_stmt_map);
   populate_single_mode_bitmaps (par, worker_single, vector_single, mask, 0);
@@ -1506,11 +1505,27 @@ public:
   {}
 
   /* opt_pass methods: */
-  virtual bool gate (function *)
+  virtual bool gate (function *fun)
   {
-    return (flag_openacc
-	    && targetm.goacc.create_worker_broadcast_record);
-  };
+    if (!flag_openacc)
+      return false;
+
+    if (!targetm.goacc.create_worker_broadcast_record)
+      return false;
+
+    /* Only relevant for OpenACC offloaded functions.  */
+    tree attr = oacc_get_fn_attrib (fun->decl);
+    if (!attr)
+      return false;
+
+    /* Not relevant for 'num_workers(1)'.  */
+    int worker_dim
+      = oacc_get_fn_dim_size (fun->decl, GOMP_DIM_WORKER);
+    if (worker_dim == 1)
+      return false;
+
+    return true;
+  }
 
   virtual unsigned int execute (function *)
     {
-- 
2.33.0

Reply via email to