Re: [AArch64/ARM 1/3] Add execution + assembler tests of AArch64 TRN Intrinsics

2014-04-24 Thread Marcus Shawcroft
On 28 March 2014 15:31, Alan Lawrence alan.lawre...@arm.com wrote:
 This adds DejaGNU tests of the existing AArch64 vuzp_* intrinsics, both
 checking
 the assembler output and the runtime results. Test bodies are in separate
 files
 ready to reuse for ARM in the third patch.

 Putting these in a new subdirectory with the ZIP Intrinsics tests, using
 simd.exp added there (will commit ZIP tests first).

 All tests passing on aarch64-none-elf and aarch64_be-none-elf.

 testsuite/ChangeLog:
 2012-03-28  Alan Lawrence  alan.lawre...@arm.com

 * gcc.target/aarch64/simd/vtrnf32_1.c: New file.
 * gcc.target/aarch64/simd/vtrnf32.x: New file.
 * gcc.target/aarch64/simd/vtrnp16_1.c: New file.
 * gcc.target/aarch64/simd/vtrnp16.x: New file.
 * gcc.target/aarch64/simd/vtrnp8_1.c: New file.
 * gcc.target/aarch64/simd/vtrnp8.x: New file.
 * gcc.target/aarch64/simd/vtrnqf32_1.c: New file.
 * gcc.target/aarch64/simd/vtrnqf32.x: New file.
 * gcc.target/aarch64/simd/vtrnqp16_1.c: New file.
 * gcc.target/aarch64/simd/vtrnqp16.x: New file.
 * gcc.target/aarch64/simd/vtrnqp8_1.c: New file.
 * gcc.target/aarch64/simd/vtrnqp8.x: New file.
 * gcc.target/aarch64/simd/vtrnqs16_1.c: New file.
 * gcc.target/aarch64/simd/vtrnqs16.x: New file.
 * gcc.target/aarch64/simd/vtrnqs32_1.c: New file.
 * gcc.target/aarch64/simd/vtrnqs32.x: New file.
 * gcc.target/aarch64/simd/vtrnqs8_1.c: New file.
 * gcc.target/aarch64/simd/vtrnqs8.x: New file.
 * gcc.target/aarch64/simd/vtrnqu16_1.c: New file.
 * gcc.target/aarch64/simd/vtrnqu16.x: New file.
 * gcc.target/aarch64/simd/vtrnqu32_1.c: New file.
 * gcc.target/aarch64/simd/vtrnqu32.x: New file.
 * gcc.target/aarch64/simd/vtrnqu8_1.c: New file.
 * gcc.target/aarch64/simd/vtrnqu8.x: New file.
 * gcc.target/aarch64/simd/vtrns16_1.c: New file.
 * gcc.target/aarch64/simd/vtrns16.x: New file.
 * gcc.target/aarch64/simd/vtrns32_1.c: New file.
 * gcc.target/aarch64/simd/vtrns32.x: New file.
 * gcc.target/aarch64/simd/vtrns8_1.c: New file.
 * gcc.target/aarch64/simd/vtrns8.x: New file.
 * gcc.target/aarch64/simd/vtrnu16_1.c: New file.
 * gcc.target/aarch64/simd/vtrnu16.x: New file.
 * gcc.target/aarch64/simd/vtrnu32_1.c: New file.
 * gcc.target/aarch64/simd/vtrnu32.x: New file.
 * gcc.target/aarch64/simd/vtrnu8_1.c: New file.
 * gcc.target/aarch64/simd/vtrnu8.x: New file.

OK /Marcus


[AArch64/ARM 1/3] Add execution + assembler tests of AArch64 TRN Intrinsics

2014-03-28 Thread Alan Lawrence

This adds DejaGNU tests of the existing AArch64 vuzp_* intrinsics, both checking
the assembler output and the runtime results. Test bodies are in separate files
ready to reuse for ARM in the third patch.

Putting these in a new subdirectory with the ZIP Intrinsics tests, using 
simd.exp added there (will commit ZIP tests first).


All tests passing on aarch64-none-elf and aarch64_be-none-elf.

testsuite/ChangeLog:
2012-03-28  Alan Lawrence  alan.lawre...@arm.com

* gcc.target/aarch64/simd/vtrnf32_1.c: New file.
* gcc.target/aarch64/simd/vtrnf32.x: New file.
* gcc.target/aarch64/simd/vtrnp16_1.c: New file.
* gcc.target/aarch64/simd/vtrnp16.x: New file.
* gcc.target/aarch64/simd/vtrnp8_1.c: New file.
* gcc.target/aarch64/simd/vtrnp8.x: New file.
* gcc.target/aarch64/simd/vtrnqf32_1.c: New file.
* gcc.target/aarch64/simd/vtrnqf32.x: New file.
* gcc.target/aarch64/simd/vtrnqp16_1.c: New file.
* gcc.target/aarch64/simd/vtrnqp16.x: New file.
* gcc.target/aarch64/simd/vtrnqp8_1.c: New file.
* gcc.target/aarch64/simd/vtrnqp8.x: New file.
* gcc.target/aarch64/simd/vtrnqs16_1.c: New file.
* gcc.target/aarch64/simd/vtrnqs16.x: New file.
* gcc.target/aarch64/simd/vtrnqs32_1.c: New file.
* gcc.target/aarch64/simd/vtrnqs32.x: New file.
* gcc.target/aarch64/simd/vtrnqs8_1.c: New file.
* gcc.target/aarch64/simd/vtrnqs8.x: New file.
* gcc.target/aarch64/simd/vtrnqu16_1.c: New file.
* gcc.target/aarch64/simd/vtrnqu16.x: New file.
* gcc.target/aarch64/simd/vtrnqu32_1.c: New file.
* gcc.target/aarch64/simd/vtrnqu32.x: New file.
* gcc.target/aarch64/simd/vtrnqu8_1.c: New file.
* gcc.target/aarch64/simd/vtrnqu8.x: New file.
* gcc.target/aarch64/simd/vtrns16_1.c: New file.
* gcc.target/aarch64/simd/vtrns16.x: New file.
* gcc.target/aarch64/simd/vtrns32_1.c: New file.
* gcc.target/aarch64/simd/vtrns32.x: New file.
* gcc.target/aarch64/simd/vtrns8_1.c: New file.
* gcc.target/aarch64/simd/vtrns8.x: New file.
* gcc.target/aarch64/simd/vtrnu16_1.c: New file.
* gcc.target/aarch64/simd/vtrnu16.x: New file.
* gcc.target/aarch64/simd/vtrnu32_1.c: New file.
* gcc.target/aarch64/simd/vtrnu32.x: New file.
* gcc.target/aarch64/simd/vtrnu8_1.c: New file.
* gcc.target/aarch64/simd/vtrnu8.x: New file.diff --git a/gcc/testsuite/gcc.target/aarch64/simd/vtrnf32.x b/gcc/testsuite/gcc.target/aarch64/simd/vtrnf32.x
new file mode 100644
index 000..7b03e6b
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/simd/vtrnf32.x
@@ -0,0 +1,27 @@
+extern void abort (void);
+
+float32x2x2_t
+test_vtrnf32 (float32x2_t _a, float32x2_t _b)
+{
+  return vtrn_f32 (_a, _b);
+}
+
+int
+main (int argc, char **argv)
+{
+  int i;
+  float32_t first[] = {1, 2};
+  float32_t second[] = {3, 4};
+  float32x2x2_t result = test_vtrnf32 (vld1_f32 (first), vld1_f32 (second));
+  float32x2_t res1 = result.val[0], res2 = result.val[1];
+  float32_t exp1[] = {1, 3};
+  float32_t exp2[] = {2, 4};
+  float32x2_t expected1 = vld1_f32 (exp1);
+  float32x2_t expected2 = vld1_f32 (exp2);
+
+  for (i = 0; i  2; i++)
+if ((res1[i] != expected1[i]) || (res2[i] != expected2[i]))
+  abort ();
+
+  return 0;
+}
diff --git a/gcc/testsuite/gcc.target/aarch64/simd/vtrnf32_1.c b/gcc/testsuite/gcc.target/aarch64/simd/vtrnf32_1.c
new file mode 100644
index 000..24c30a3
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/simd/vtrnf32_1.c
@@ -0,0 +1,11 @@
+/* Test the `vtrn_f32' AArch64 SIMD intrinsic.  */
+
+/* { dg-do run } */
+/* { dg-options -save-temps -fno-inline } */
+
+#include arm_neon.h
+#include vtrnf32.x
+
+/* { dg-final { scan-assembler-times trn1\[ \t\]+v\[0-9\]+\.2s, ?v\[0-9\]+\.2s, ?v\[0-9\]+\.2s!?\(?:\[ \t\]+@\[a-zA-Z0-9 \]+\)?\n 1 } } */
+/* { dg-final { scan-assembler-times trn2\[ \t\]+v\[0-9\]+\.2s, ?v\[0-9\]+\.2s, ?v\[0-9\]+\.2s!?\(?:\[ \t\]+@\[a-zA-Z0-9 \]+\)?\n 1 } } */
+/* { dg-final { cleanup-saved-temps } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/simd/vtrnp16.x b/gcc/testsuite/gcc.target/aarch64/simd/vtrnp16.x
new file mode 100644
index 000..5feabe4
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/simd/vtrnp16.x
@@ -0,0 +1,27 @@
+extern void abort (void);
+
+poly16x4x2_t
+test_vtrnp16 (poly16x4_t _a, poly16x4_t _b)
+{
+  return vtrn_p16 (_a, _b);
+}
+
+int
+main (int argc, char **argv)
+{
+  int i;
+  poly16_t first[] = {1, 2, 3, 4};
+  poly16_t second[] = {5, 6, 7, 8};
+  poly16x4x2_t result = test_vtrnp16 (vld1_p16 (first), vld1_p16 (second));
+  poly16x4_t res1 = result.val[0], res2 = result.val[1];
+  poly16_t exp1[] = {1, 5, 3, 7};
+  poly16_t exp2[] = {2, 6, 4, 8};
+  poly16x4_t expected1 = vld1_p16 (exp1);
+  poly16x4_t expected2 = vld1_p16 (exp2);
+
+  for (i = 0; i  4; i++)
+if ((res1[i] != expected1[i]) || (res2[i] != expected2[i]))
+