Author: Momchil Velikov
Date: 2026-05-11T10:45:28+01:00
New Revision: b7f564781acbb6f373bd24752fd6b3977f376723

URL: 
https://github.com/llvm/llvm-project/commit/b7f564781acbb6f373bd24752fd6b3977f376723
DIFF: 
https://github.com/llvm/llvm-project/commit/b7f564781acbb6f373bd24752fd6b3977f376723.diff

LOG: [Clang] Fix incorrect type for `__mfp8` in `extractelement` codegen 
(#192977)

The codegen for extracting an element from an FP8 vector was emitting a
simple `extractelement` with `i8` type for the extracted element. The
`__mfp8` type is represented as `<1 x i8>` in LLVM IR. This codegen
created inconsistency in Clang - some `__mfp8` expressions would
correspond to LLVM IR values with `<1 x i8>` type and some to `i8` type.

It also caused an assertion failure when the extracted element was
passed as a function argument.

This patch fixes the issue by inserting the extracted element
into a `<1 x i8>`.

Added: 
    clang/test/CodeGen/AArch64/fp8-extract.c

Modified: 
    clang/lib/CodeGen/CGExprScalar.cpp
    clang/test/CodeGen/arm-mfp8.c

Removed: 
    


################################################################################
diff  --git a/clang/lib/CodeGen/CGExprScalar.cpp 
b/clang/lib/CodeGen/CGExprScalar.cpp
index d60f1b37be50e..c8a8ec7b6d928 100644
--- a/clang/lib/CodeGen/CGExprScalar.cpp
+++ b/clang/lib/CodeGen/CGExprScalar.cpp
@@ -2213,7 +2213,15 @@ Value 
*ScalarExprEmitter::VisitArraySubscriptExpr(ArraySubscriptExpr *E) {
   if (CGF.SanOpts.has(SanitizerKind::ArrayBounds))
     CGF.EmitBoundsCheck(E, E->getBase(), Idx, IdxTy, /*Accessed*/true);
 
-  return Builder.CreateExtractElement(Base, Idx, "vecext");
+  Value *Ret = Builder.CreateExtractElement(Base, Idx, "vecext");
+
+  // Even being a scalar the `__mfp8` type corresponds to `<1 x i8>` in LLVM 
IR.
+  if (E->getType()->isMFloat8Type())
+    Ret = Builder.CreateInsertElement(
+        llvm::PoisonValue::get(llvm::FixedVectorType::get(CGF.Int8Ty, 1)), Ret,
+        uint64_t(0), "mfp8ext");
+
+  return Ret;
 }
 
 Value *ScalarExprEmitter::VisitMatrixSingleSubscriptExpr(

diff  --git a/clang/test/CodeGen/AArch64/fp8-extract.c 
b/clang/test/CodeGen/AArch64/fp8-extract.c
new file mode 100644
index 0000000000000..7fa93c6f15305
--- /dev/null
+++ b/clang/test/CodeGen/AArch64/fp8-extract.c
@@ -0,0 +1,52 @@
+// NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py 
UTC_ARGS: --version 6
+// RUN: %clang_cc1        -triple aarch64-none-linux-gnu -target-feature +neon 
-disable-O0-optnone -Werror -Wall -emit-llvm -o - %s | opt -S -p 
mem2reg,instcombine | FileCheck %s
+// RUN: %clang_cc1 -x c++ -triple aarch64-none-linux-gnu -target-feature +neon 
-disable-O0-optnone -Werror -Wall -emit-llvm -o - %s | opt -S -p 
mem2reg,instcombine | FileCheck %s -check-prefix CHECK-CXX
+
+// RUN: %clang_cc1        -triple aarch64-none-linux-gnu -target-feature +neon 
-disable-O0-optnone -Werror -Wall -S -o /dev/null %s
+
+// REQUIRES: aarch64-registered-target
+
+#include <arm_neon.h>
+
+// Test for a n internal compiler error when extracting an element from an FP8
+// vector and passing it to a function.
+
+// CHECK-LABEL: define dso_local void @test_var(
+// CHECK-SAME: <16 x i8> [[V:%.*]], i32 noundef [[I:%.*]]) #[[ATTR0:[0-9]+]] {
+// CHECK-NEXT:  [[ENTRY:.*:]]
+// CHECK-NEXT:    [[VECEXT:%.*]] = extractelement <16 x i8> [[V]], i32 [[I]]
+// CHECK-NEXT:    [[MFP8CAST:%.*]] = insertelement <1 x i8> poison, i8 
[[VECEXT]], i64 0
+// CHECK-NEXT:    call void @g(<1 x i8> [[MFP8CAST]]) #[[ATTR2:[0-9]+]]
+// CHECK-NEXT:    ret void
+//
+// CHECK-CXX-LABEL: define dso_local void @_Z8test_var14__Mfloat8x16_ti(
+// CHECK-CXX-SAME: <16 x i8> [[V:%.*]], i32 noundef [[I:%.*]]) 
#[[ATTR0:[0-9]+]] {
+// CHECK-CXX-NEXT:  [[ENTRY:.*:]]
+// CHECK-CXX-NEXT:    [[VECEXT:%.*]] = extractelement <16 x i8> [[V]], i32 
[[I]]
+// CHECK-CXX-NEXT:    [[MFP8CAST:%.*]] = insertelement <1 x i8> poison, i8 
[[VECEXT]], i64 0
+// CHECK-CXX-NEXT:    call void @_Z1gu6__mfp8(<1 x i8> [[MFP8CAST]]) 
#[[ATTR2:[0-9]+]]
+// CHECK-CXX-NEXT:    ret void
+//
+void test_var(__Mfloat8x16_t v, int i) {
+  void g(__mfp8);
+  g(v[i]);
+}
+
+// CHECK-LABEL: define dso_local void @test_cst(
+// CHECK-SAME: <16 x i8> [[V:%.*]]) #[[ATTR0]] {
+// CHECK-NEXT:  [[ENTRY:.*:]]
+// CHECK-NEXT:    [[MFP8CAST:%.*]] = shufflevector <16 x i8> [[V]], <16 x i8> 
poison, <1 x i32> <i32 3>
+// CHECK-NEXT:    call void @g(<1 x i8> [[MFP8CAST]]) #[[ATTR2]]
+// CHECK-NEXT:    ret void
+//
+// CHECK-CXX-LABEL: define dso_local void @_Z8test_cst14__Mfloat8x16_t(
+// CHECK-CXX-SAME: <16 x i8> [[V:%.*]]) #[[ATTR0]] {
+// CHECK-CXX-NEXT:  [[ENTRY:.*:]]
+// CHECK-CXX-NEXT:    [[MFP8CAST:%.*]] = shufflevector <16 x i8> [[V]], <16 x 
i8> poison, <1 x i32> <i32 3>
+// CHECK-CXX-NEXT:    call void @_Z1gu6__mfp8(<1 x i8> [[MFP8CAST]]) #[[ATTR2]]
+// CHECK-CXX-NEXT:    ret void
+//
+void test_cst(__Mfloat8x16_t v) {
+  void g(__mfp8);
+  g(v[3]);
+}

diff  --git a/clang/test/CodeGen/arm-mfp8.c b/clang/test/CodeGen/arm-mfp8.c
index 9385b537f18b3..82df375a45686 100644
--- a/clang/test/CodeGen/arm-mfp8.c
+++ b/clang/test/CodeGen/arm-mfp8.c
@@ -64,20 +64,16 @@ __mfp8 func1n(__mfp8 mfp8) {
 // CHECK-C-LABEL: define dso_local <1 x i8> @test_extract_element(
 // CHECK-C-SAME: <16 x i8> [[X:%.*]], i32 noundef [[I:%.*]]) #[[ATTR0]] {
 // CHECK-C-NEXT:  [[ENTRY:.*:]]
-// CHECK-C-NEXT:    [[RETVAL:%.*]] = alloca <1 x i8>, align 1
 // CHECK-C-NEXT:    [[VECEXT:%.*]] = extractelement <16 x i8> [[X]], i32 [[I]]
-// CHECK-C-NEXT:    store i8 [[VECEXT]], ptr [[RETVAL]], align 1
-// CHECK-C-NEXT:    [[TMP0:%.*]] = load <1 x i8>, ptr [[RETVAL]], align 1
-// CHECK-C-NEXT:    ret <1 x i8> [[TMP0]]
+// CHECK-C-NEXT:    [[MFP8CAST:%.*]] = insertelement <1 x i8> poison, i8 
[[VECEXT]], i64 0
+// CHECK-C-NEXT:    ret <1 x i8> [[MFP8CAST]]
 //
 // CHECK-CXX-LABEL: define dso_local <1 x i8> 
@_Z20test_extract_element14__Mfloat8x16_ti(
 // CHECK-CXX-SAME: <16 x i8> [[X:%.*]], i32 noundef [[I:%.*]]) #[[ATTR0]] {
 // CHECK-CXX-NEXT:  [[ENTRY:.*:]]
-// CHECK-CXX-NEXT:    [[RETVAL:%.*]] = alloca <1 x i8>, align 1
 // CHECK-CXX-NEXT:    [[VECEXT:%.*]] = extractelement <16 x i8> [[X]], i32 
[[I]]
-// CHECK-CXX-NEXT:    store i8 [[VECEXT]], ptr [[RETVAL]], align 1
-// CHECK-CXX-NEXT:    [[TMP0:%.*]] = load <1 x i8>, ptr [[RETVAL]], align 1
-// CHECK-CXX-NEXT:    ret <1 x i8> [[TMP0]]
+// CHECK-CXX-NEXT:    [[MFP8CAST:%.*]] = insertelement <1 x i8> poison, i8 
[[VECEXT]], i64 0
+// CHECK-CXX-NEXT:    ret <1 x i8> [[MFP8CAST]]
 //
 mfloat8_t test_extract_element(mfloat8x16_t x, int i) {
   return x[i];


        
_______________________________________________
cfe-commits mailing list
[email protected]
https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits

Reply via email to