C23 adds a memalignment function to determine the alignment of a pointer.
Given how simple it is (convert pointer to an integer then return (p & -p)),
GCC should support expanding it inline.
This patch implements __builtin_memalignment which expands to p & -p
gcc/ChangeLog:
PR middle-end/122117
* builtin-types.def (BT_FN_SIZE_CONST_PTR): New function type.
* builtins.def (BUILT_IN_MEMALIGNMENT): New C23 builtin.
* builtins.cc (fold_builtin_memalignment): New function to fold
__builtin_memalignment to (size_t)ptr & -(size_t)ptr.
(fold_builtin_1): Handle BUILT_IN_MEMALIGNMENT.
(is_inexpensive_builtin): Add BUILT_IN_MEMALIGNMENT.
gcc/testsuite/ChangeLog:
* gcc.dg/builtin-memalignment.c: New test.
---
gcc/builtin-types.def | 1 +
gcc/builtins.cc | 26 +++++
gcc/builtins.def | 1 +
gcc/testsuite/gcc.dg/builtin-memalignment.c | 114 ++++++++++++++++++++
4 files changed, 142 insertions(+)
create mode 100644 gcc/testsuite/gcc.dg/builtin-memalignment.c
diff --git a/gcc/builtin-types.def b/gcc/builtin-types.def
index 9583d30dfc0..eecb30fd12d 100644
--- a/gcc/builtin-types.def
+++ b/gcc/builtin-types.def
@@ -360,6 +360,7 @@ DEF_FUNCTION_TYPE_1 (BT_FN_LONGLONG_FLOAT32X, BT_LONGLONG,
BT_FLOAT32X)
DEF_FUNCTION_TYPE_1 (BT_FN_LONGLONG_FLOAT64X, BT_LONGLONG, BT_FLOAT64X)
DEF_FUNCTION_TYPE_1 (BT_FN_LONGLONG_FLOAT128X, BT_LONGLONG, BT_FLOAT128X)
DEF_FUNCTION_TYPE_1 (BT_FN_VOID_PTR, BT_VOID, BT_PTR)
+DEF_FUNCTION_TYPE_1 (BT_FN_SIZE_CONST_PTR, BT_SIZE, BT_CONST_PTR)
DEF_FUNCTION_TYPE_1 (BT_FN_SIZE_CONST_STRING, BT_SIZE, BT_CONST_STRING)
DEF_FUNCTION_TYPE_1 (BT_FN_INT_CONST_STRING, BT_INT, BT_CONST_STRING)
DEF_FUNCTION_TYPE_1 (BT_FN_PTR_PTR, BT_PTR, BT_PTR)
diff --git a/gcc/builtins.cc b/gcc/builtins.cc
index fb294ce58cd..5390b36c0f2 100644
--- a/gcc/builtins.cc
+++ b/gcc/builtins.cc
@@ -172,6 +172,7 @@ static tree fold_builtin_abs (location_t, tree, tree);
static tree fold_builtin_unordered_cmp (location_t, tree, tree, tree, enum
tree_code,
enum tree_code);
static tree fold_builtin_iseqsig (location_t, tree, tree);
+static tree fold_builtin_memalignment (location_t, tree);
static tree fold_builtin_varargs (location_t, tree, tree*, int);
static tree fold_builtin_strpbrk (location_t, tree, tree, tree, tree);
@@ -10115,6 +10116,27 @@ fold_builtin_iseqsig (location_t loc, tree arg0, tree
arg1)
return fold_build2_loc (loc, TRUTH_AND_EXPR, integer_type_node, cmp1, cmp2);
}
+/* Fold a call to __builtin_memalignment(). ARG is the pointer argument.
+ The code is folded to: (size_t)ARG & -(size_t)ARG */
+
+static tree
+fold_builtin_memalignment (location_t loc, tree arg)
+{
+ tree ptr_as_size, negated, result;
+
+ /* Convert pointer to size_t. */
+ ptr_as_size = fold_convert_loc (loc, size_type_node, arg);
+
+ /* Negate: -(size_t)ARG */
+ negated = fold_build1_loc (loc, NEGATE_EXPR, size_type_node, ptr_as_size);
+
+ /* Compute: (size_t)ARG & -(size_t)ARG */
+ result = fold_build2_loc (loc, BIT_AND_EXPR, size_type_node,
+ ptr_as_size, negated);
+
+ return result;
+}
+
/* Fold __builtin_{,s,u}{add,sub,mul}{,l,ll}_overflow, either into normal
arithmetics if it can never overflow, or into internal functions that
return both result of arithmetics and overflowed boolean flag in
@@ -10784,6 +10806,9 @@ fold_builtin_1 (location_t loc, tree expr, tree fndecl,
tree arg0)
case BUILT_IN_POPCOUNTG:
return fold_builtin_bit_query (loc, fcode, arg0, NULL_TREE);
+ case BUILT_IN_MEMALIGNMENT:
+ return fold_builtin_memalignment (loc, arg0);
+
default:
break;
}
@@ -12395,6 +12420,7 @@ is_inexpensive_builtin (tree decl)
case BUILT_IN_PARITYLL:
case BUILT_IN_PARITYIMAX:
case BUILT_IN_PARITY:
+ case BUILT_IN_MEMALIGNMENT:
case BUILT_IN_LABS:
case BUILT_IN_LLABS:
case BUILT_IN_PREFETCH:
diff --git a/gcc/builtins.def b/gcc/builtins.def
index 00cfb6a2057..036c79cbd8d 100644
--- a/gcc/builtins.def
+++ b/gcc/builtins.def
@@ -1023,6 +1023,7 @@ DEF_GCC_BUILTIN (BUILT_IN_BSWAP16, "bswap16",
BT_FN_UINT16_UINT16, ATTR_C
DEF_GCC_BUILTIN (BUILT_IN_BSWAP32, "bswap32", BT_FN_UINT32_UINT32,
ATTR_CONST_NOTHROW_LEAF_LIST)
DEF_GCC_BUILTIN (BUILT_IN_BSWAP64, "bswap64", BT_FN_UINT64_UINT64,
ATTR_CONST_NOTHROW_LEAF_LIST)
DEF_GCC_BUILTIN (BUILT_IN_BSWAP128, "bswap128", BT_FN_UINT128_UINT128,
ATTR_CONST_NOTHROW_LEAF_LIST)
+DEF_C23_BUILTIN (BUILT_IN_MEMALIGNMENT, "memalignment",
BT_FN_SIZE_CONST_PTR, ATTR_CONST_NOTHROW_LEAF_LIST)
DEF_EXT_LIB_BUILTIN (BUILT_IN_CLEAR_CACHE, "__clear_cache",
BT_FN_VOID_PTR_PTR, ATTR_NOTHROW_LEAF_LIST)
/* [trans-mem]: Adjust BUILT_IN_TM_CALLOC if BUILT_IN_CALLOC is changed. */
diff --git a/gcc/testsuite/gcc.dg/builtin-memalignment.c
b/gcc/testsuite/gcc.dg/builtin-memalignment.c
new file mode 100644
index 00000000000..993089a52b6
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/builtin-memalignment.c
@@ -0,0 +1,114 @@
+/* { dg-do run } */
+/* { dg-options "-O2 -fdump-tree-optimized" } */
+
+#include <stddef.h>
+#include <stdint.h>
+
+extern void abort (void);
+
+void test_alignment (void *ptr, size_t expected)
+{
+ size_t result = __builtin_memalignment (ptr);
+ if (result != expected)
+ abort ();
+}
+
+/* Verify that constant folding happens */
+void test_constant_p (void)
+{
+ /* These should be compile-time constants */
+ if (!__builtin_constant_p (__builtin_memalignment ((void *)((uintptr_t)16))))
+ abort ();
+ if (!__builtin_constant_p (__builtin_memalignment ((void *)((uintptr_t)24))))
+ abort ();
+ if (!__builtin_constant_p (__builtin_memalignment ((void *)0)))
+ abort ();
+}
+
+int main (void)
+{
+ /* Test with null pointer - alignment should be 0 */
+ test_alignment ((void *)0, 0);
+
+ /* Test powers of 2 alignments */
+ test_alignment ((void *)((uintptr_t)1), 1);
+ test_alignment ((void *)((uintptr_t)2), 2);
+ test_alignment ((void *)((uintptr_t)4), 4);
+ test_alignment ((void *)((uintptr_t)8), 8);
+ test_alignment ((void *)((uintptr_t)16), 16);
+ test_alignment ((void *)((uintptr_t)32), 32);
+ test_alignment ((void *)((uintptr_t)64), 64);
+ test_alignment ((void *)((uintptr_t)128), 128);
+ test_alignment ((void *)((uintptr_t)256), 256);
+
+ /* Test non-power-of-2 addresses */
+ test_alignment ((void *)((uintptr_t)3), 1); /* 0b11 -> alignment 1 */
+ test_alignment ((void *)((uintptr_t)5), 1); /* 0b101 -> alignment 1 */
+ test_alignment ((void *)((uintptr_t)6), 2); /* 0b110 -> alignment 2 */
+ test_alignment ((void *)((uintptr_t)12), 4); /* 0b1100 -> alignment 4 */
+ test_alignment ((void *)((uintptr_t)24), 8); /* 0b11000 -> alignment 8 */
+ test_alignment ((void *)((uintptr_t)48), 16); /* 0b110000 -> alignment 16 */
+
+ /* Verify constant folding happens */
+ test_constant_p ();
+
+ /* Test with variables having different alignments */
+ char c __attribute__((aligned(1)));
+ short s __attribute__((aligned(2)));
+ int i __attribute__((aligned(4)));
+ long long ll __attribute__((aligned(8)));
+ char a16 __attribute__((aligned(16)));
+ char a32 __attribute__((aligned(32)));
+ char a64 __attribute__((aligned(64)));
+
+ size_t align_c = __builtin_memalignment(&c);
+ size_t align_s = __builtin_memalignment(&s);
+ size_t align_i = __builtin_memalignment(&i);
+ size_t align_ll = __builtin_memalignment(&ll);
+ size_t align_a16 = __builtin_memalignment(&a16);
+ size_t align_a32 = __builtin_memalignment(&a32);
+ size_t align_a64 = __builtin_memalignment(&a64);
+
+ /* The alignment should be at least what we requested */
+ if (align_c < 1)
+ abort();
+ if (align_s < 2)
+ abort();
+ if (align_i < 4)
+ abort();
+ if (align_ll < 8)
+ abort();
+ if (align_a16 < 16)
+ abort();
+ if (align_a32 < 32)
+ abort();
+ if (align_a64 < 64)
+ abort();
+
+ /* Test array elements */
+ int array[16] __attribute__((aligned(64)));
+
+ /* First element should have the array's alignment */
+ if (__builtin_memalignment(&array[0]) < 64)
+ abort();
+
+ /* Other elements depend on their offset */
+ /* array[1] is at offset 4, so alignment is 4 */
+ if (__builtin_memalignment(&array[1]) != 4)
+ abort();
+
+ /* array[2] is at offset 8, so alignment is 8 */
+ if (__builtin_memalignment(&array[2]) != 8)
+ abort();
+
+ /* array[4] is at offset 16, so alignment is 16 */
+ if (__builtin_memalignment(&array[4]) != 16)
+ abort();
+
+ return 0;
+}
+
+/* { dg-final { scan-tree-dump-not "__builtin_memalignment" "optimized" } } */
+/* { dg-final { scan-tree-dump "return 16;" "optimized" } } */
+/* { dg-final { scan-tree-dump "return 8;" "optimized" } } */
+/* { dg-final { scan-tree-dump "return 0;" "optimized" } } */
--
2.47.3