Hello Everyone,
        Attached, please find a patch that will add regression test cases for 
elemental function implementation in C. 

Here are the Changelog entries:
=======================================================================
gcc/testsuite/ChangeLog
2012-09-05  Balaji V. Iyer  <balaji.v.i...@intel.com>

        * gcc.dg/cilk-plus/elem_fn_tests/32bit/test1.c: New test.
        * gcc.dg/cilk-plus/elem_fn_tests/32bit/test10.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/32bit/test11.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/32bit/test12.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/32bit/test7.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/32bit/test8.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/32bit/test9.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/ctrl_flow.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/ctrl_flow2.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/switch_stmt.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test1.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test13.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test14.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test15.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test16.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test17.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test18.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test2.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test3.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test4.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test5.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/64bit/test6.c: Likewise.
        * gcc.dg/cilk-plus/elem_fn_tests/elem_fn.exp: New script.

==================================================================================

Thanking You,

Yours Sincerely,

Balaji V. Iyer.
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test1.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test1.c
new file mode 100644
index 0000000..a33ea3b
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test1.c
@@ -0,0 +1,30 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will insert the clone for the function ef_add inside the function
+ * main (the non-masked version).
+ */
+
+#include <stdlib.h>
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (pentium_4), uniform 
(x,y)))) My_Type ef_add (My_Type x, My_Type y);
+
+My_Type vhx2[10];
+int
+main (int argc, char **argv)
+{
+  My_Type vhx[10];
+  int ii = 9;
+
+  if (argc == 1) 
+    for (ii = 0; ii < 10; ii++) 
+      vhx[ii] = argc;
+
+  for (ii = 0; ii < 10; ii++)
+    vhx2[ii] = ef_add(vhx[ii], vhx[ii]);
+ 
+  for (ii = 0; ii < 10; ii++)
+    if (vhx2[ii] != (argc + argc))
+      abort ();
+  return 0;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test10.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test10.c
new file mode 100644
index 0000000..477369e
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test10.c
@@ -0,0 +1,12 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will create 2 clones of the function below,
+ * for the pentium4 with sse3 processor.
+ */
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (pentium_4_sse3), linear(y), 
uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test11.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test11.c
new file mode 100644
index 0000000..197064b
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test11.c
@@ -0,0 +1,12 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will create 1 clones of the function below, just mask 
+ * for the pentium4 processor.
+ */
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), mask, processor (pentium_4_sse3), 
linear(y), uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test12.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test12.c
new file mode 100644
index 0000000..1c78356
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test12.c
@@ -0,0 +1,12 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will create 1 clones of the function below, just no mask 
+ * for the pentium4 with sse3 processor.
+ */
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), nomask, processor (pentium_4_sse3), 
linear(y), uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test7.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test7.c
new file mode 100644
index 0000000..6720a8c
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test7.c
@@ -0,0 +1,12 @@
+
+/* { dg-final { scan-assembler "simdsimd"  } } */
+/* This test will create 1 clone of the function below, just one for mask
+ * for the pentium4 processor.
+ */
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), mask, processor (pentium_4), 
linear(y), uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test8.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test8.c
new file mode 100644
index 0000000..7f40220
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test8.c
@@ -0,0 +1,12 @@
+
+/* { dg-final { scan-assembler "simdsimd"  } } */
+/* This test will create 1 clone of the function below, just one for nomask
+ * for the pentium4 processor.
+ */
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), nomask, processor (pentium_4), 
linear(y), uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test9.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test9.c
new file mode 100644
index 0000000..0a5caf8
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/32bit/test9.c
@@ -0,0 +1,12 @@
+
+/* { dg-final { scan-assembler "simdsimd"  } } */
+/* This test will create 2 clones of the function below,
+ * for the pentium4 processor.
+ */
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (pentium_4), linear(y), 
uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/ctrl_flow.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/ctrl_flow.c
new file mode 100644
index 0000000..8df372a
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/ctrl_flow.c
@@ -0,0 +1,15 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+/* This test will create 2 clones of the function below, one for mask and one 
+   without the mask
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (core_i7_sse4_2), uniform 
(x,y))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  if (x > 0)
+    return x + y;
+  else
+    return (x-y);
+}
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/ctrl_flow2.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/ctrl_flow2.c
new file mode 100644
index 0000000..30e710f
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/ctrl_flow2.c
@@ -0,0 +1,22 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will create 2 clones of the function below, one for mask and one 
+   without the mask
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (core_i7_sse4_2), uniform 
(x,y))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  if (x > 0) {
+    if (y > 0) {
+      return x + y;
+    }
+    else
+      return (x-y);
+  }
+  else
+    return 0;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/switch_stmt.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/switch_stmt.c
new file mode 100644
index 0000000..0d9db6f
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/switch_stmt.c
@@ -0,0 +1,25 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+/* This test will create 2 clones of the function below, one for mask and one 
+   without the mask
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (core_i7_sse4_2), uniform 
(x,y))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  switch ((int)x) {
+    case 0:
+    case 1:
+      x = x + 1;
+      return x+y;
+    case 2:
+      y = y + 2;
+      return x-y;
+    default:
+      return 0;
+  }
+  return 0;
+
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test1.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test1.c
new file mode 100644
index 0000000..576821a
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test1.c
@@ -0,0 +1,30 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will insert the clone for the function ef_add inside the function
+ * main (the non-masked version).
+ */
+
+#include <stdlib.h>
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (core_i7_sse4_2), uniform 
(x,y)))) My_Type ef_add (My_Type x, My_Type y);
+
+My_Type vhx2[10];
+int
+main (int argc, char **argv)
+{
+  My_Type vhx[10];
+  int ii = 9;
+
+  if (argc == 1) 
+    for (ii = 0; ii < 10; ii++) 
+      vhx[ii] = argc;
+
+  for (ii = 0; ii < 10; ii++)
+    vhx2[ii] = ef_add(vhx[ii], vhx[ii]);
+ 
+  for (ii = 0; ii < 10; ii++)
+    if (vhx2[ii] != (argc + argc))
+      abort ();
+  return 0;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test13.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test13.c
new file mode 100644
index 0000000..18c8844
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test13.c
@@ -0,0 +1,13 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+/* This test will create 2 clones of the function below,
+ * for the pentium4 with sse3 processor.
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (core2_duo_sse3), linear(y), 
uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test14.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test14.c
new file mode 100644
index 0000000..f154d49
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test14.c
@@ -0,0 +1,14 @@
+
+/* { dg-final { scan-assembler "simdsimd"  } } */
+/* This test will create 1 clones of the function below, just the mask
+ * for the pentium4 with sse3 processor.
+ */
+
+#define My_Type float
+__attribute__ ((vector(mask, vectorlength(4), processor (core2_duo_sse3), 
linear(y), uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test15.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test15.c
new file mode 100644
index 0000000..8a458fc
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test15.c
@@ -0,0 +1,14 @@
+
+/* { dg-final { scan-assembler "simdsimd"  } } */
+/* This test will create 1 clones of the function below, just the mask
+ * for the pentium4 with sse3 processor.
+ */
+
+#define My_Type float
+__attribute__ ((vector(nomask, vectorlength(4), processor (core2_duo_sse3), 
linear(y), uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test16.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test16.c
new file mode 100644
index 0000000..fcfc5c0
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test16.c
@@ -0,0 +1,14 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will create 2 clones of the function below,
+ * for the pentium4 with sse3 processor.
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (core_2_duo_sse_4_1), 
linear(y), uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test17.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test17.c
new file mode 100644
index 0000000..847c219
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test17.c
@@ -0,0 +1,14 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will create 2 clones of the function below,
+ * for the core2_duo with sse 4.1 processor.
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (core_2_duo_sse_4_1), 
linear(y), uniform (x), nomask)))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test18.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test18.c
new file mode 100644
index 0000000..daa1546
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test18.c
@@ -0,0 +1,14 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will create 1 clones of the function below, just mask
+ * for the core2_duo with sse 4.1 processor.
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (core_2_duo_sse_4_1), 
linear(y), mask, uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test2.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test2.c
new file mode 100644
index 0000000..a515c53
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test2.c
@@ -0,0 +1,14 @@
+
+/* { dg-final { scan-assembler "simdsimd"  } } */
+/* This test will create 2 clones of the function below, one for mask and one 
+   without the mask
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), processor (core_i7_sse4_2), uniform 
(x,y))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test3.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test3.c
new file mode 100644
index 0000000..d9e3fe1
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test3.c
@@ -0,0 +1,13 @@
+
+/* { dg-final { scan-assembler "simdsimd"  } } */
+/* This test will create 1 clone of the function below, just one for mask
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), mask, processor (core_i7_sse4_2), 
uniform (x,y))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test4.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test4.c
new file mode 100644
index 0000000..9aa36cc
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test4.c
@@ -0,0 +1,13 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will create 1 clone of the function below, just one for nomask
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), nomask, processor (core_i7_sse4_2), 
uniform (x,y))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test5.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test5.c
new file mode 100644
index 0000000..6688980
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test5.c
@@ -0,0 +1,14 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will create 1 clone of the function below, just one for nomask and
+   do a linear for y variable
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), nomask, processor (core_i7_sse4_2), 
uniform (x), linear(y))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test6.c 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test6.c
new file mode 100644
index 0000000..4ec317f
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/64bit/test6.c
@@ -0,0 +1,13 @@
+/* { dg-final { scan-assembler "simdsimd"  } } */
+
+/* This test will create 1 clone of the function below, just one for mask
+ */
+
+#define My_Type float
+__attribute__ ((vector(vectorlength(4), mask, processor (core_i7_sse4_2), 
linear(y), uniform (x))))
+My_Type ef_add (My_Type x, My_Type y) 
+
+{
+  return x + y;
+}
+
diff --git gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/elem_fn.exp 
gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/elem_fn.exp
new file mode 100644
index 0000000..50a27ba
--- /dev/null
+++ gcc/testsuite/gcc.dg/cilk-plus/elem_fn_tests/elem_fn.exp
@@ -0,0 +1,50 @@
+# Copyright (C) 2012
+# Free Software Foundation, Inc.
+
+# Contributed by Balaji V. Iyer  <balaji.v.i...@intel.com>
+#                Intel Corporation. 
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 3 of the License, or
+# (at your option) any later version.
+# 
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+# 
+# You should have received a copy of the GNU General Public License
+# along with GCC; see the file COPYING3.  If not see
+# <http://www.gnu.org/licenses/>.
+
+
+# Exit immediately if this isn't a x86 target.
+if { ![istarget i?86*-*-*] && ![istarget x86_64-*-*] } then {
+  return
+}
+
+# Load support procs.
+load_lib gcc-dg.exp
+set tests_32bit [lsort [glob -nocomplain $srcdir/$subdir/32bit/*.\[cS\]]]
+set tests_64bit [lsort [glob -nocomplain $srcdir/$subdir/64bit/*.\[cS\]]]
+
+if { [istarget i?86*-*-*] } then {
+
+# Main loop.
+dg-runtest $tests_32bit " -O3 -ftree-vectorize -fcilkplus" " "
+# All done.
+dg-finish
+}
+
+# For 64 bit architectures, we can run both 32 bit and 64 bit tests. 
+if { [istarget x86_64-*-*] } then {
+
+# Main loop.
+dg-runtest $tests_32bit "-m32 -O3 -ftree-vectorize -fcilkplus" " "
+# All done.
+dg-finish
+# Main loop.
+dg-runtest $tests_64bit " -O3 -ftree-vectorize -fcilkplus" " "
+# All done.
+dg-finish
+}

Reply via email to