---
gcc/ChangeLog:
* common/config/i386/cpuinfo.h (get_available_features):
* common/config/i386/i386-common.cc (OPTION_MASK_ISA2_AVX10_V2_AUX_SET):
(OPTION_MASK_ISA2_AVX10_V2_AUX_UNSET):
(ix86_handle_option):
* common/config/i386/i386-cpuinfo.h (enum processor_features):
* common/config/i386/i386-isas.h:
* config.gcc:
* config/i386/cpuid.h (bit_AVX10_V2_AUX):
* config/i386/i386-builtin-types.def (V16QI):
* config/i386/i386-builtin.def (BDESC):
* config/i386/i386-c.cc (ix86_target_macros_internal):
* config/i386/i386-expand.cc (ix86_expand_args_builtin):
* config/i386/i386-isa.def (AVX10_V2_AUX):
* config/i386/i386-options.cc (ix86_valid_target_attribute_inner_p):
* config/i386/i386.opt:
* config/i386/immintrin.h:
* config/i386/sse.md (vcvt<convertps2fp8><mode>):
(vcvt<convertps2fp8><mode>_mask):
(*vcvt<convertps2fp8><mode>_mask):
* doc/invoke.texi:
* config/i386/avx10_v2_auxintrin.h: New file.
gcc/testsuite/ChangeLog:
* lib/target-supports.exp:
* gcc.target/i386/avx10_2-v2-aux-convert-1.c: New test.
gcc/common/config/i386/cpuinfo.h | 4 +
gcc/common/config/i386/i386-common.cc | 19 +-
gcc/common/config/i386/i386-cpuinfo.h | 1 +
gcc/common/config/i386/i386-isas.h | 2 +
gcc/config.gcc | 2 +-
gcc/config/i386/avx10_v2_auxintrin.h | 409 ++++++++++++++++++
gcc/config/i386/cpuid.h | 4 +
gcc/config/i386/i386-builtin-types.def | 5 +
gcc/config/i386/i386-builtin.def | 14 +
gcc/config/i386/i386-c.cc | 2 +
gcc/config/i386/i386-expand.cc | 3 +
gcc/config/i386/i386-isa.def | 1 +
gcc/config/i386/i386-options.cc | 4 +-
gcc/config/i386/i386.opt | 4 +
gcc/config/i386/immintrin.h | 2 +
gcc/config/i386/sse.md | 61 +++
gcc/doc/invoke.texi | 7 +-
.../i386/avx10_2-v2-aux-convert-1.c | 88 ++++
gcc/testsuite/lib/target-supports.exp | 11 +
19 files changed, 639 insertions(+), 4 deletions(-)
create mode 100644 gcc/config/i386/avx10_v2_auxintrin.h
create mode 100644 gcc/testsuite/gcc.target/i386/avx10_2-v2-aux-convert-1.c
diff --git a/gcc/common/config/i386/cpuinfo.h b/gcc/common/config/i386/cpuinfo.h
index f59090c8cde..6310e7294da 100644
--- a/gcc/common/config/i386/cpuinfo.h
+++ b/gcc/common/config/i386/cpuinfo.h
@@ -1139,6 +1139,10 @@ get_available_features (struct __processor_model
*cpu_model,
set_feature (FEATURE_AVX10_1);
break;
}
+ /* CPUID.(EAX=24H, ECX=1) for AVX10_V2_AUX features. */
+ __cpuid_count (0x24, 1, eax, ebx, ecx, edx);
+ if (ecx & bit_AVX10_V2_AUX)
+ set_feature (FEATURE_AVX10_V2_AUX);
}
/* Check cpuid level of extended features. */
diff --git a/gcc/common/config/i386/i386-common.cc
b/gcc/common/config/i386/i386-common.cc
index 607581b0f09..a57f7887b58 100644
--- a/gcc/common/config/i386/i386-common.cc
+++ b/gcc/common/config/i386/i386-common.cc
@@ -140,7 +140,8 @@ along with GCC; see the file COPYING3. If not see
#define OPTION_MASK_ISA2_AMX_MOVRS_SET \
(OPTION_MASK_ISA2_AMX_TILE_SET | OPTION_MASK_ISA2_AMX_MOVRS)
#define OPTION_MASK_ISA2_AVX512BMM_SET OPTION_MASK_ISA2_AVX512BMM
-
+#define OPTION_MASK_ISA2_AVX10_V2_AUX_SET \
+ (OPTION_MASK_ISA2_AVX10_1_SET | OPTION_MASK_ISA2_AVX10_V2_AUX)
/* SSE4 includes both SSE4.1 and SSE4.2. -msse4 should be the same
as -msse4.2. */
#define OPTION_MASK_ISA_SSE4_SET OPTION_MASK_ISA_SSE4_2_SET
@@ -334,6 +335,7 @@ along with GCC; see the file COPYING3. If not see
#define OPTION_MASK_ISA2_MOVRS_UNSET OPTION_MASK_ISA2_MOVRS
#define OPTION_MASK_ISA2_AMX_MOVRS_UNSET OPTION_MASK_ISA2_AMX_MOVRS
#define OPTION_MASK_ISA2_AVX512BMM_UNSET OPTION_MASK_ISA2_AVX512BMM
+#define OPTION_MASK_ISA2_AVX10_V2_AUX_UNSET OPTION_MASK_ISA2_AVX10_V2_AUX
/* SSE4 includes both SSE4.1 and SSE4.2. -mno-sse4 should the same
as -mno-sse4.1. */
@@ -1417,6 +1419,21 @@ ix86_handle_option (struct gcc_options *opts,
opts->x_ix86_isa_flags2_explicit |= OPTION_MASK_ISA2_AVX10_2_UNSET;
}
return true;
+
+ case OPT_mavx10_v2_aux:
+ if (value)
+ {
+ opts->x_ix86_isa_flags2 |= OPTION_MASK_ISA2_AVX10_V2_AUX_SET;
+ opts->x_ix86_isa_flags2_explicit |= OPTION_MASK_ISA2_AVX10_V2_AUX_SET;
+ opts->x_ix86_isa_flags |= OPTION_MASK_ISA_AVX10_1_SET;
+ opts->x_ix86_isa_flags_explicit |= OPTION_MASK_ISA_AVX10_1_SET;
+ }
+ else
+ {
+ opts->x_ix86_isa_flags2 &= ~OPTION_MASK_ISA2_AVX10_V2_AUX_UNSET;
+ opts->x_ix86_isa_flags2_explicit |=
OPTION_MASK_ISA2_AVX10_V2_AUX_UNSET;
+ }
+ return true;
case OPT_mamx_avx512:
if (value)
diff --git a/gcc/common/config/i386/i386-cpuinfo.h
b/gcc/common/config/i386/i386-cpuinfo.h
index f9c644c6def..9291e3187d5 100644
--- a/gcc/common/config/i386/i386-cpuinfo.h
+++ b/gcc/common/config/i386/i386-cpuinfo.h
@@ -284,6 +284,7 @@ enum processor_features
FEATURE_MOVRS,
FEATURE_AMX_MOVRS,
FEATURE_AVX512BMM,
+ FEATURE_AVX10_V2_AUX,
CPU_FEATURE_MAX
};
diff --git a/gcc/common/config/i386/i386-isas.h
b/gcc/common/config/i386/i386-isas.h
index 62973b15f0f..5959a3a17df 100644
--- a/gcc/common/config/i386/i386-isas.h
+++ b/gcc/common/config/i386/i386-isas.h
@@ -192,4 +192,6 @@ ISA_NAMES_TABLE_START
ISA_NAMES_TABLE_ENTRY("movrs", FEATURE_MOVRS, P_NONE, "-mmovrs")
ISA_NAMES_TABLE_ENTRY("amx-movrs", FEATURE_AMX_MOVRS, P_NONE, "-mamx-movrs")
ISA_NAMES_TABLE_ENTRY("avx512bmm", FEATURE_AVX512BMM, P_NONE, "-mavx512bmm")
+ ISA_NAMES_TABLE_ENTRY("avx10-v2-aux", FEATURE_AVX10_V2_AUX, P_NONE,
+ "-mavx10-v2-aux")
ISA_NAMES_TABLE_END
diff --git a/gcc/config.gcc b/gcc/config.gcc
index fb4cdc0a475..c21e263fc2f 100644
--- a/gcc/config.gcc
+++ b/gcc/config.gcc
@@ -472,7 +472,7 @@ i[34567]86-*-* | x86_64-*-*)
avx10_2minmaxintrin.h avx10_2copyintrin.h
amxavx512intrin.h amxtf32intrin.h amxfp8intrin.h
movrsintrin.h amxmovrsintrin.h avx512bmmintrin.h
- avx512bmmvlintrin.h"
+ avx512bmmvlintrin.h avx10_v2_auxintrin.h"
;;
ia64-*-*)
extra_headers=ia64intrin.h
diff --git a/gcc/config/i386/avx10_v2_auxintrin.h
b/gcc/config/i386/avx10_v2_auxintrin.h
new file mode 100644
index 00000000000..3ca4d0b1166
--- /dev/null
+++ b/gcc/config/i386/avx10_v2_auxintrin.h
@@ -0,0 +1,409 @@
+/* Copyright (C) 2024-2026 Free Software Foundation, Inc.
+ This file is part of GCC.
+ GCC is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License as published by
+ the Free Software Foundation; either version 3, or (at your option)
+ any later version.
+ GCC is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ GNU General Public License for more details.
+ Under Section 7 of GPL version 3, you are granted additional
+ permissions described in the GCC Runtime Library Exception, version
+ 3.1, as published by the Free Software Foundation.
+ You should have received a copy of the GNU General Public License and
+ a copy of the GCC Runtime Library Exception along with this program;
+ see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
+ <http://www.gnu.org/licenses/>. */
+
+#if !defined _IMMINTRIN_H_INCLUDED
+#error "Never use <avx10_2_v2_auxintrin.h> directly; include <immintrin.h>
instead."
+
+#endif
+
+#ifndef _AVX10_V2_AUXINTRIN_H_INCLUDED
+#define _AVX10_V2_AUXINTRIN_H_INCLUDED
+
+#if !defined(__AVX10_V2_AUX__)
+#pragma GCC push_options
+#pragma GCC target("avx10-v2-aux")
+#define __DISABLE_AVX10_V2_AUX__
+#endif /* __AVX10_V2_AUX__ */
+
+// VCVTPS2BF8 - 128-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_cvtps_bf8 (__m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8128_mask ((__v4sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask8) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_mask_cvtps_bf8 (__m128i __W, __mmask8 __U, __m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8128_mask ((__v4sf) __A,
+ (__v16qi) __W,
+ (__mmask8) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_maskz_cvtps_bf8 (__mmask8 __U, __m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8128_mask ((__v4sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask8) __U);
+}
+
+// VCVTPS2BF8 - 256-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_cvtps_bf8 (__m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8256_mask ((__v8sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask8) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_mask_cvtps_bf8 (__m128i __W, __mmask8 __U, __m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8256_mask ((__v8sf) __A,
+ (__v16qi) __W,
+ (__mmask8) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_maskz_cvtps_bf8 (__mmask8 __U, __m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8256_mask ((__v8sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask8) __U);
+}
+
+// VCVTPS2BF8 - 512-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_cvtps_bf8 (__m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8512_mask ((__v16sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask16) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_mask_cvtps_bf8 (__m128i __W, __mmask16 __U, __m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8512_mask ((__v16sf) __A,
+ (__v16qi) __W,
+ (__mmask16) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_maskz_cvtps_bf8 (__mmask16 __U, __m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8512_mask ((__v16sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask16) __U);
+}
+
+// VCVTPS2BF8S - 128-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_cvts_ps_bf8 (__m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8s128_mask ((__v4sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask8) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_mask_cvts_ps_bf8 (__m128i __W, __mmask8 __U, __m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8s128_mask ((__v4sf) __A,
+ (__v16qi) __W,
+ (__mmask8) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_maskz_cvts_ps_bf8 (__mmask8 __U, __m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8s128_mask ((__v4sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask8) __U);
+}
+
+// VCVTPS2BF8S - 256-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_cvts_ps_bf8 (__m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8s256_mask ((__v8sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask8) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_mask_cvts_ps_bf8 (__m128i __W, __mmask8 __U, __m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8s256_mask ((__v8sf) __A,
+ (__v16qi) __W,
+ (__mmask8) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_maskz_cvts_ps_bf8 (__mmask8 __U, __m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8s256_mask ((__v8sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask8) __U);
+}
+
+// VCVTPS2BF8S - 512-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_cvts_ps_bf8 (__m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8s512_mask ((__v16sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask16) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_mask_cvts_ps_bf8 (__m128i __W, __mmask16 __U, __m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8s512_mask ((__v16sf) __A,
+ (__v16qi) __W,
+ (__mmask16) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_maskz_cvts_ps_bf8 (__mmask16 __U, __m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2bf8s512_mask ((__v16sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask16) __U);
+}
+
+// VCVTPS2HF8 - 128-bit
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_cvtps_hf8 (__m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8128_mask ((__v4sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask8) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_mask_cvtps_hf8 (__m128i __W, __mmask8 __U, __m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8128_mask ((__v4sf) __A,
+ (__v16qi) __W,
+ (__mmask8) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_maskz_cvtps_hf8 (__mmask8 __U, __m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8128_mask ((__v4sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask8) __U);
+}
+
+// VCVTPS2HF8 - 256-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_cvtps_hf8 (__m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8256_mask ((__v8sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask8) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_mask_cvtps_hf8 (__m128i __W, __mmask8 __U, __m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8256_mask ((__v8sf) __A,
+ (__v16qi) __W,
+ (__mmask8) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_maskz_cvtps_hf8 (__mmask8 __U, __m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8256_mask ((__v8sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask8) __U);
+}
+
+// VCVTPS2HF8 - 512-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_cvtps_hf8 (__m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8512_mask ((__v16sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask16) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_mask_cvtps_hf8 (__m128i __W, __mmask16 __U, __m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8512_mask ((__v16sf) __A,
+ (__v16qi) __W,
+ (__mmask16) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_maskz_cvtps_hf8 (__mmask16 __U, __m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8512_mask ((__v16sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask16) __U);
+}
+
+// VCVTPS2HF8S - 128-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_cvts_ps_hf8 (__m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8s128_mask ((__v4sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask8) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_mask_cvts_ps_hf8 (__m128i __W, __mmask8 __U, __m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8s128_mask ((__v4sf) __A,
+ (__v16qi) __W,
+ (__mmask8) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_maskz_cvts_ps_hf8 (__mmask8 __U, __m128 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8s128_mask ((__v4sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask8) __U);
+}
+
+// VCVTPS2HF8S - 256-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_cvts_ps_hf8 (__m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8s256_mask ((__v8sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask8) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_mask_cvts_ps_hf8 (__m128i __W, __mmask8 __U, __m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8s256_mask ((__v8sf) __A,
+ (__v16qi) __W,
+ (__mmask8) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_maskz_cvts_ps_hf8 (__mmask8 __U, __m256 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8s256_mask ((__v8sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask8) __U);
+}
+
+// VCVTPS2HF8S - 512-bit
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_cvts_ps_hf8 (__m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8s512_mask ((__v16sf) __A,
+ (__v16qi)
+ _mm_undefined_si128 (),
+ (__mmask16) -1);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_mask_cvts_ps_hf8 (__m128i __W, __mmask16 __U, __m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8s512_mask ((__v16sf) __A,
+ (__v16qi) __W,
+ (__mmask16) __U);
+}
+
+extern __inline __m128i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_maskz_cvts_ps_hf8 (__mmask16 __U, __m512 __A)
+{
+ return (__m128i) __builtin_ia32_vcvtps2hf8s512_mask ((__v16sf) __A,
+ (__v16qi)
+ _mm_setzero_si128 (),
+ (__mmask16) __U);
+}
+
+#ifdef __DISABLE_AVX10_V2_AUX__
+#undef __DISABLE_AVX10_V2_AUX__
+#pragma GCC pop_options
+#endif /* __DISABLE_AVX10_V2_AUX__ */
+
+#endif /* _AVX10_V2_AUXINTRIN_H_INCLUDED */
diff --git a/gcc/config/i386/cpuid.h b/gcc/config/i386/cpuid.h
index c48556afa6e..4d03bedcc83 100644
--- a/gcc/config/i386/cpuid.h
+++ b/gcc/config/i386/cpuid.h
@@ -170,6 +170,10 @@
/* Sub leaf (%eax == 0x21) */
#define bit_AVX512BMM ( 1<<23 )
+/* AVX10 sub leaf (%eax == 0x24, %ecx == 1) */
+/* %ecx */
+#define bit_AVX10_V2_AUX (1 << 3)
+
/* AMX sub leaf (%eax == 0x1e, %ecx == 1) */
/* %eax */
#define bit_AMX_FP8 (1 << 4)
diff --git a/gcc/config/i386/i386-builtin-types.def
b/gcc/config/i386/i386-builtin-types.def
index 64bde021d11..f35bdcd2056 100644
--- a/gcc/config/i386/i386-builtin-types.def
+++ b/gcc/config/i386/i386-builtin-types.def
@@ -1474,6 +1474,11 @@ DEF_FUNCTION_TYPE (V8DI, V8SF, V8DI, UQI)
DEF_FUNCTION_TYPE (V8DI, V8DF, V8DI, UQI)
DEF_FUNCTION_TYPE (V8SI, V8DF, V8SI, UQI)
+# AVX10_V2_AUX builtins
+DEF_FUNCTION_TYPE (V16QI, V4SF, V16QI, UQI)
+DEF_FUNCTION_TYPE (V16QI, V8SF, V16QI, UQI)
+DEF_FUNCTION_TYPE (V16QI, V16SF, V16QI, UHI)
+
# SM4 builtins
DEF_FUNCTION_TYPE (V16SI, V16SI, V16SI)
diff --git a/gcc/config/i386/i386-builtin.def b/gcc/config/i386/i386-builtin.def
index 30e728ab15d..40afda1c366 100644
--- a/gcc/config/i386/i386-builtin.def
+++ b/gcc/config/i386/i386-builtin.def
@@ -3369,6 +3369,20 @@ BDESC (0, OPTION_MASK_ISA2_AVX10_2,
CODE_FOR_avx10_2_minmaxpv2df_mask, "__builti
BDESC (0, OPTION_MASK_ISA2_AVX10_2, CODE_FOR_avx10_2_minmaxpv8hf_mask,
"__builtin_ia32_minmaxph128_mask", IX86_BUILTIN_MINMAXPH128_MASK, UNKNOWN,
(int) V8HF_FTYPE_V8HF_V8HF_INT_V8HF_UQI)
BDESC (0, OPTION_MASK_ISA2_AVX10_2, CODE_FOR_avx10_2_minmaxpv4sf_mask,
"__builtin_ia32_minmaxps128_mask", IX86_BUILTIN_MINMAXPS128_MASK, UNKNOWN,
(int) V4SF_FTYPE_V4SF_V4SF_INT_V4SF_UQI)
+/* AVX10_V2_AUX */
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2bf8v4sf_mask,
"__builtin_ia32_vcvtps2bf8128_mask", IX86_BUILTIN_VCVTPS2BF8128_MASK, UNKNOWN,
(int) V16QI_FTYPE_V4SF_V16QI_UQI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2bf8v8sf_mask,
"__builtin_ia32_vcvtps2bf8256_mask", IX86_BUILTIN_VCVTPS2BF8256_MASK, UNKNOWN,
(int) V16QI_FTYPE_V8SF_V16QI_UQI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2bf8v16sf_mask,
"__builtin_ia32_vcvtps2bf8512_mask", IX86_BUILTIN_VCVTPS2BF8512_MASK, UNKNOWN,
(int) V16QI_FTYPE_V16SF_V16QI_UHI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2bf8sv4sf_mask,
"__builtin_ia32_vcvtps2bf8s128_mask", IX86_BUILTIN_VCVTPS2BF8S128_MASK,
UNKNOWN, (int) V16QI_FTYPE_V4SF_V16QI_UQI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2bf8sv8sf_mask,
"__builtin_ia32_vcvtps2bf8s256_mask", IX86_BUILTIN_VCVTPS2BF8S256_MASK,
UNKNOWN, (int) V16QI_FTYPE_V8SF_V16QI_UQI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2bf8sv16sf_mask,
"__builtin_ia32_vcvtps2bf8s512_mask", IX86_BUILTIN_VCVTPS2BF8S512_MASK,
UNKNOWN, (int) V16QI_FTYPE_V16SF_V16QI_UHI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2hf8v4sf_mask,
"__builtin_ia32_vcvtps2hf8128_mask", IX86_BUILTIN_VCVTPS2HF8128_MASK, UNKNOWN,
(int) V16QI_FTYPE_V4SF_V16QI_UQI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2hf8v8sf_mask,
"__builtin_ia32_vcvtps2hf8256_mask", IX86_BUILTIN_VCVTPS2HF8256_MASK, UNKNOWN,
(int) V16QI_FTYPE_V8SF_V16QI_UQI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2hf8v16sf_mask,
"__builtin_ia32_vcvtps2hf8512_mask", IX86_BUILTIN_VCVTPS2HF8512_MASK, UNKNOWN,
(int) V16QI_FTYPE_V16SF_V16QI_UHI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2hf8sv4sf_mask,
"__builtin_ia32_vcvtps2hf8s128_mask", IX86_BUILTIN_VCVTPS2HF8S128_MASK,
UNKNOWN, (int) V16QI_FTYPE_V4SF_V16QI_UQI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2hf8sv8sf_mask,
"__builtin_ia32_vcvtps2hf8s256_mask", IX86_BUILTIN_VCVTPS2HF8S256_MASK,
UNKNOWN, (int) V16QI_FTYPE_V8SF_V16QI_UQI)
+BDESC (0, OPTION_MASK_ISA2_AVX10_V2_AUX, CODE_FOR_vcvtps2hf8sv16sf_mask,
"__builtin_ia32_vcvtps2hf8s512_mask", IX86_BUILTIN_VCVTPS2HF8S512_MASK,
UNKNOWN, (int) V16QI_FTYPE_V16SF_V16QI_UHI)
+
/* Builtins with rounding support. */
BDESC_END (ARGS, ROUND_ARGS)
diff --git a/gcc/config/i386/i386-c.cc b/gcc/config/i386/i386-c.cc
index 00cfeafac12..d8688f43563 100644
--- a/gcc/config/i386/i386-c.cc
+++ b/gcc/config/i386/i386-c.cc
@@ -792,6 +792,8 @@ ix86_target_macros_internal (HOST_WIDE_INT isa_flag,
def_or_undef (parse_in, "__AMX_MOVRS__");
if (isa_flag2 & OPTION_MASK_ISA2_AVX512BMM)
def_or_undef (parse_in, "__AVX512BMM__");
+ if (isa_flag2 & OPTION_MASK_ISA2_AVX10_V2_AUX)
+ def_or_undef (parse_in, "__AVX10_V2_AUX__");
if (TARGET_IAMCU)
{
def_or_undef (parse_in, "__iamcu");
diff --git a/gcc/config/i386/i386-expand.cc b/gcc/config/i386/i386-expand.cc
index 99b6343106a..2bd26ce5d81 100644
--- a/gcc/config/i386/i386-expand.cc
+++ b/gcc/config/i386/i386-expand.cc
@@ -12898,6 +12898,9 @@ ix86_expand_args_builtin (const struct
builtin_description *d,
case V8DI_FTYPE_V8SF_V8DI_UQI:
case V8DI_FTYPE_V8DF_V8DI_UQI:
case V8SI_FTYPE_V8DF_V8SI_UQI:
+ case V16QI_FTYPE_V4SF_V16QI_UQI:
+ case V16QI_FTYPE_V8SF_V16QI_UQI:
+ case V16QI_FTYPE_V16SF_V16QI_UHI:
nargs = 3;
break;
case V32QI_FTYPE_V32QI_V32QI_INT:
diff --git a/gcc/config/i386/i386-isa.def b/gcc/config/i386/i386-isa.def
index 7a9cdd84c4c..cd2a436295e 100644
--- a/gcc/config/i386/i386-isa.def
+++ b/gcc/config/i386/i386-isa.def
@@ -126,3 +126,4 @@ DEF_PTA(AMX_FP8)
DEF_PTA(MOVRS)
DEF_PTA(AMX_MOVRS)
DEF_PTA(AVX512BMM)
+DEF_PTA(AVX10_V2_AUX)
diff --git a/gcc/config/i386/i386-options.cc b/gcc/config/i386/i386-options.cc
index f7282dbe36f..f780c3202ee 100644
--- a/gcc/config/i386/i386-options.cc
+++ b/gcc/config/i386/i386-options.cc
@@ -275,7 +275,8 @@ static struct ix86_target_opts isa2_opts[] =
{ "-mamx-fp8", OPTION_MASK_ISA2_AMX_FP8 },
{ "-mmovrs", OPTION_MASK_ISA2_MOVRS },
{ "-mamx-movrs", OPTION_MASK_ISA2_AMX_MOVRS },
- { "-mavx512bmm", OPTION_MASK_ISA2_AVX512BMM }
+ { "-mavx512bmm", OPTION_MASK_ISA2_AVX512BMM },
+ { "-mavx10-v2-aux", OPTION_MASK_ISA2_AVX10_V2_AUX }
};
static struct ix86_target_opts isa_opts[] =
{
@@ -1141,6 +1142,7 @@ ix86_valid_target_attribute_inner_p (tree fndecl, tree
args, char *p_strings[],
IX86_ATTR_ISA ("movrs", OPT_mmovrs),
IX86_ATTR_ISA ("amx-movrs", OPT_mamx_movrs),
IX86_ATTR_ISA ("avx512bmm", OPT_mavx512bmm),
+ IX86_ATTR_ISA ("avx10-v2-aux", OPT_mavx10_v2_aux),
/* enum options */
IX86_ATTR_ENUM ("fpmath=", OPT_mfpmath_),
diff --git a/gcc/config/i386/i386.opt b/gcc/config/i386/i386.opt
index ff08188c761..6f6fc081448 100644
--- a/gcc/config/i386/i386.opt
+++ b/gcc/config/i386/i386.opt
@@ -1389,3 +1389,7 @@ Support AMX-MOVRS built-in functions and code generation.
mavx512bmm
Target Mask(ISA2_AVX512BMM) Var(ix86_isa_flags2) Save
Support AVX512BMM built-in functions and code generation.
+
+mavx10-v2-aux
+Target Mask(ISA2_AVX10_V2_AUX) Var(ix86_isa_flags2) Save
+Support AVX10_V2_AUX built-in functions and code generation.
diff --git a/gcc/config/i386/immintrin.h b/gcc/config/i386/immintrin.h
index 41b4be26a11..9811f7a0bae 100644
--- a/gcc/config/i386/immintrin.h
+++ b/gcc/config/i386/immintrin.h
@@ -148,6 +148,8 @@
#include <avx10_2convertintrin.h>
+#include <avx10_v2_auxintrin.h>
+
#include <avx10_2bf16intrin.h>
#include <avx10_2satcvtintrin.h>
diff --git a/gcc/config/i386/sse.md b/gcc/config/i386/sse.md
index bb150f6b5f9..c5c3b48e63e 100644
--- a/gcc/config/i386/sse.md
+++ b/gcc/config/i386/sse.md
@@ -258,6 +258,12 @@
;; For MOVRS support
UNSPEC_VMOVRS
+
+ ;; For AVX10_V2_AUX support
+ UNSPEC_VCVTPS2BF8
+ UNSPEC_VCVTPS2BF8S
+ UNSPEC_VCVTPS2HF8
+ UNSPEC_VCVTPS2HF8S
])
(define_c_enum "unspecv" [
@@ -33795,3 +33801,58 @@
"vbitrevb\t{%1, %0|%0, %1}"
[(set_attr "prefix" "evex")
(set_attr "mode" "<sseinsnmode>")])
+
+;; AVX10_V2_AUX instructions
+
+;; FP32 to FP8 single-source converts (VCVTPS2BF8, VCVTPS2BF8S,
+;; VCVTPS2HF8, VCVTPS2HF8S)
+
+(define_int_iterator UNSPEC_CONVERTPS2FP8
+ [UNSPEC_VCVTPS2BF8 UNSPEC_VCVTPS2BF8S
+ UNSPEC_VCVTPS2HF8 UNSPEC_VCVTPS2HF8S])
+
+(define_int_attr convertps2fp8
+ [(UNSPEC_VCVTPS2BF8 "ps2bf8")
+ (UNSPEC_VCVTPS2BF8S "ps2bf8s")
+ (UNSPEC_VCVTPS2HF8 "ps2hf8")
+ (UNSPEC_VCVTPS2HF8S "ps2hf8s")])
+
+(define_insn "vcvt<convertps2fp8><mode>"
+ [(set (match_operand:V16QI 0 "register_operand" "=v")
+ (unspec:V16QI
+ [(match_operand:VF1_AVX512VL 1 "nonimmediate_operand" "vm")]
+ UNSPEC_CONVERTPS2FP8))]
+ "TARGET_AVX10_V2_AUX"
+ "vcvt<convertps2fp8>\t{%1, %0|%0, %1}"
+ [(set_attr "prefix" "evex")
+ (set_attr "mode" "<sseinsnmode>")])
+
+(define_expand "vcvt<convertps2fp8><mode>_mask"
+ [(set (match_operand:V16QI 0 "register_operand")
+ (vec_merge:V16QI
+ (unspec:V16QI
+ [(match_operand:VF1_AVX512VL 1 "nonimmediate_operand")]
+ UNSPEC_CONVERTPS2FP8)
+ (match_operand:V16QI 2 "nonimm_or_0_operand")
+ (match_operand:<avx512fmaskmode> 3 "register_or_constm1_operand")))]
+ "TARGET_AVX10_V2_AUX"
+{
+ if (CONST_INT_P (operands[3]))
+ {
+ emit_insn (gen_vcvt<convertps2fp8><mode> (operands[0], operands[1]));
+ DONE;
+ }
+})
+
+(define_insn "*vcvt<convertps2fp8><mode>_mask"
+ [(set (match_operand:V16QI 0 "register_operand" "=v")
+ (vec_merge:V16QI
+ (unspec:V16QI
+ [(match_operand:VF1_AVX512VL 1 "nonimmediate_operand" "vm")]
+ UNSPEC_CONVERTPS2FP8)
+ (match_operand:V16QI 2 "nonimm_or_0_operand" "0C")
+ (match_operand:<avx512fmaskmode> 3 "register_operand" "Yk")))]
+ "TARGET_AVX10_V2_AUX"
+ "vcvt<convertps2fp8>\t{%1, %0%{%3%}%N2|%0%{%3%}%N2, %1}"
+ [(set_attr "prefix" "evex")
+ (set_attr "mode" "<sseinsnmode>")])
diff --git a/gcc/doc/invoke.texi b/gcc/doc/invoke.texi
index 8da5f03ccbd..a8685896897 100644
--- a/gcc/doc/invoke.texi
+++ b/gcc/doc/invoke.texi
@@ -1551,7 +1551,7 @@ See RS/6000 and PowerPC Options.
-mavxneconvert -mcmpccxadd -mamx-fp16 -mprefetchi -mraoint
-mamx-complex -mavxvnniint16 -msm3 -msha512 -msm4 -mapxf
-musermsr -mavx10.1 -mavx10.2 -mamx-avx512 -mamx-tf32 -mmovrs
--mamx-movrs -mavx512bmm -mcldemote -mms-bitfields
+-mamx-movrs -mavx512bmm -mavx10-v2-aux -mcldemote -mms-bitfields
-mno-align-stringops -minline-all-stringops
-minline-stringops-dynamically -mstringop-strategy=@var{alg}
-mkl -mwidekl
@@ -36192,6 +36192,11 @@ Support MOVRS built-in functions and code generation.
@opindex mno-amx-movrs
@item -mamx-movrs
Support AMX-MOVRS built-in functions and code generation.
+
+@opindex mavx10-v2-aux
+@opindex mno-avx10-v2-aux
+@item -mavx10-v2-aux
+Support AVX10_V2_AUX built-in functions and code generation.
@end table
These additional options are available for the x86 processor family.
diff --git a/gcc/testsuite/gcc.target/i386/avx10_2-v2-aux-convert-1.c
b/gcc/testsuite/gcc.target/i386/avx10_2-v2-aux-convert-1.c
new file mode 100644
index 00000000000..7ee543c9682
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx10_2-v2-aux-convert-1.c
@@ -0,0 +1,88 @@
+/* { dg-do compile } */
+/* { dg-options "-mavx10-v2-aux -O2" } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8s\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8s\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8s\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8s\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8s\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8s\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8s\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8s\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2bf8s\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8s\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8s\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8s\[
\\t\]+\[^\{\n\]*%xmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8s\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8s\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8s\[
\\t\]+\[^\{\n\]*%ymm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8s\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8s\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}(?:\n|\[
\\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vcvtps2hf8s\[
\\t\]+\[^\{\n\]*%zmm\[0-9\]+\[^\n\r]*%xmm\[0-9\]+\{%k\[1-7\]\}\{z\}(?:\n|\[
\\t\]+#)" 1 } } */
+
+#include <immintrin.h>
+
+__m128i test_mm_cvtps_bf8 (__m128 a) { return _mm_cvtps_bf8 (a); }
+__m128i test_mm_mask_cvtps_bf8 (__m128i w, __mmask8 u, __m128 a) { return
_mm_mask_cvtps_bf8 (w, u, a); }
+__m128i test_mm_maskz_cvtps_bf8 (__mmask8 u, __m128 a) { return
_mm_maskz_cvtps_bf8 (u, a); }
+
+__m128i test_mm256_cvtps_bf8 (__m256 a) { return _mm256_cvtps_bf8 (a); }
+__m128i test_mm256_mask_cvtps_bf8 (__m128i w, __mmask8 u, __m256 a) { return
_mm256_mask_cvtps_bf8 (w, u, a); }
+__m128i test_mm256_maskz_cvtps_bf8 (__mmask8 u, __m256 a) { return
_mm256_maskz_cvtps_bf8 (u, a); }
+
+__m128i test_mm512_cvtps_bf8 (__m512 a) { return _mm512_cvtps_bf8 (a); }
+__m128i test_mm512_mask_cvtps_bf8 (__m128i w, __mmask16 u, __m512 a) { return
_mm512_mask_cvtps_bf8 (w, u, a); }
+__m128i test_mm512_maskz_cvtps_bf8 (__mmask16 u, __m512 a) { return
_mm512_maskz_cvtps_bf8 (u, a); }
+
+__m128i test_mm_cvts_ps_bf8 (__m128 a) { return _mm_cvts_ps_bf8 (a); }
+__m128i test_mm_mask_cvts_ps_bf8 (__m128i w, __mmask8 u, __m128 a) { return
_mm_mask_cvts_ps_bf8 (w, u, a); }
+__m128i test_mm_maskz_cvts_ps_bf8 (__mmask8 u, __m128 a) { return
_mm_maskz_cvts_ps_bf8 (u, a); }
+
+__m128i test_mm256_cvts_ps_bf8 (__m256 a) { return _mm256_cvts_ps_bf8 (a); }
+__m128i test_mm256_mask_cvts_ps_bf8 (__m128i w, __mmask8 u, __m256 a) { return
_mm256_mask_cvts_ps_bf8 (w, u, a); }
+__m128i test_mm256_maskz_cvts_ps_bf8 (__mmask8 u, __m256 a) { return
_mm256_maskz_cvts_ps_bf8 (u, a); }
+
+__m128i test_mm512_cvts_ps_bf8 (__m512 a) { return _mm512_cvts_ps_bf8 (a); }
+__m128i test_mm512_mask_cvts_ps_bf8 (__m128i w, __mmask16 u, __m512 a) {
return _mm512_mask_cvts_ps_bf8 (w, u, a); }
+__m128i test_mm512_maskz_cvts_ps_bf8 (__mmask16 u, __m512 a) { return
_mm512_maskz_cvts_ps_bf8 (u, a); }
+
+__m128i test_mm_cvtps_hf8 (__m128 a) { return _mm_cvtps_hf8 (a); }
+__m128i test_mm_mask_cvtps_hf8 (__m128i w, __mmask8 u, __m128 a) { return
_mm_mask_cvtps_hf8 (w, u, a); }
+__m128i test_mm_maskz_cvtps_hf8 (__mmask8 u, __m128 a) { return
_mm_maskz_cvtps_hf8 (u, a); }
+
+__m128i test_mm256_cvtps_hf8 (__m256 a) { return _mm256_cvtps_hf8 (a); }
+__m128i test_mm256_mask_cvtps_hf8 (__m128i w, __mmask8 u, __m256 a) { return
_mm256_mask_cvtps_hf8 (w, u, a); }
+__m128i test_mm256_maskz_cvtps_hf8 (__mmask8 u, __m256 a) { return
_mm256_maskz_cvtps_hf8 (u, a); }
+
+__m128i test_mm512_cvtps_hf8 (__m512 a) { return _mm512_cvtps_hf8 (a); }
+__m128i test_mm512_mask_cvtps_hf8 (__m128i w, __mmask16 u, __m512 a) { return
_mm512_mask_cvtps_hf8 (w, u, a); }
+__m128i test_mm512_maskz_cvtps_hf8 (__mmask16 u, __m512 a) { return
_mm512_maskz_cvtps_hf8 (u, a); }
+
+__m128i test_mm_cvts_ps_hf8 (__m128 a) { return _mm_cvts_ps_hf8 (a); }
+__m128i test_mm_mask_cvts_ps_hf8 (__m128i w, __mmask8 u, __m128 a) { return
_mm_mask_cvts_ps_hf8 (w, u, a); }
+__m128i test_mm_maskz_cvts_ps_hf8 (__mmask8 u, __m128 a) { return
_mm_maskz_cvts_ps_hf8 (u, a); }
+
+__m128i test_mm256_cvts_ps_hf8 (__m256 a) { return _mm256_cvts_ps_hf8 (a); }
+__m128i test_mm256_mask_cvts_ps_hf8 (__m128i w, __mmask8 u, __m256 a) { return
_mm256_mask_cvts_ps_hf8 (w, u, a); }
+__m128i test_mm256_maskz_cvts_ps_hf8 (__mmask8 u, __m256 a) { return
_mm256_maskz_cvts_ps_hf8 (u, a); }
+
+__m128i test_mm512_cvts_ps_hf8 (__m512 a) { return _mm512_cvts_ps_hf8 (a); }
+__m128i test_mm512_mask_cvts_ps_hf8 (__m128i w, __mmask16 u, __m512 a) {
return _mm512_mask_cvts_ps_hf8 (w, u, a); }
+__m128i test_mm512_maskz_cvts_ps_hf8 (__mmask16 u, __m512 a) { return
_mm512_maskz_cvts_ps_hf8 (u, a); }
diff --git a/gcc/testsuite/lib/target-supports.exp
b/gcc/testsuite/lib/target-supports.exp
index c6ebbed4f4b..d79729f6086 100644
--- a/gcc/testsuite/lib/target-supports.exp
+++ b/gcc/testsuite/lib/target-supports.exp
@@ -11522,6 +11522,17 @@ proc check_effective_target_avx10_2 { } {
} "" ]
}
+# Return 1 if avx10-v2-aux instructions can be compiled.
+proc check_effective_target_avx10_v2_aux { } {
+ return [check_no_compiler_messages avx10_v2_aux object {
+ void
+ foo ()
+ {
+ __asm__ volatile ("vcvtps2bf8\t{%%xmm1, %%xmm0|%%xmm0, %%xmm1}");
+ }
+ } "-mavx10-v2-aux" ]
+}
+
# Return 1 if amx-avx512 instructions can be compiled.
proc check_effective_target_amx_avx512 { } {
return [check_no_compiler_messages amx_avx512 object {
--
2.34.1