================ @@ -0,0 +1,723 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 +; RUN: llc -mtriple=aarch64 -verify-machineinstrs --mattr=+cpa -aarch64-use-featcpa-codegen=true -O0 -global-isel=1 -global-isel-abort=1 %s -o - 2>&1 | FileCheck %s --check-prefixes=CHECK-CPA-O0 +; RUN: llc -mtriple=aarch64 -verify-machineinstrs --mattr=+cpa -aarch64-use-featcpa-codegen=true -O3 -global-isel=1 -global-isel-abort=1 %s -o - 2>&1 | FileCheck %s --check-prefixes=CHECK-CPA-O3 +; RUN: llc -mtriple=aarch64 -verify-machineinstrs --mattr=-cpa -O0 -global-isel=1 -global-isel-abort=1 %s -o - 2>&1 | FileCheck %s --check-prefixes=CHECK-NOCPA-O0 +; RUN: llc -mtriple=aarch64 -verify-machineinstrs --mattr=-cpa -O3 -global-isel=1 -global-isel-abort=1 %s -o - 2>&1 | FileCheck %s --check-prefixes=CHECK-NOCPA-O3 + +%struct.my_type = type { i64, i64 } +%struct.my_type2 = type { i64, i64, i64, i64, i64, i64 } + +@array = external dso_local global [10 x %struct.my_type], align 8 +@array2 = external dso_local global [10 x %struct.my_type2], align 8 + +define void @addpt1(i64 %index, i64 %arg) { +; CHECK-CPA-O0-LABEL: addpt1: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: adrp x8, array +; CHECK-CPA-O0-NEXT: add x8, x8, :lo12:array +; CHECK-CPA-O0-NEXT: addpt x8, x8, x0, lsl #4 +; CHECK-CPA-O0-NEXT: str x1, [x8, #8] +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: addpt1: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: adrp x8, array +; CHECK-CPA-O3-NEXT: add x8, x8, :lo12:array +; CHECK-CPA-O3-NEXT: addpt x8, x8, x0, lsl #4 +; CHECK-CPA-O3-NEXT: str x1, [x8, #8] +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: addpt1: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: adrp x8, array +; CHECK-NOCPA-O0-NEXT: add x8, x8, :lo12:array +; CHECK-NOCPA-O0-NEXT: add x8, x8, x0, lsl #4 +; CHECK-NOCPA-O0-NEXT: str x1, [x8, #8] +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: addpt1: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: adrp x8, array +; CHECK-NOCPA-O3-NEXT: add x8, x8, :lo12:array +; CHECK-NOCPA-O3-NEXT: add x8, x8, x0, lsl #4 +; CHECK-NOCPA-O3-NEXT: str x1, [x8, #8] +; CHECK-NOCPA-O3-NEXT: ret +entry: + %e2 = getelementptr inbounds %struct.my_type, ptr @array, i64 %index, i32 1 + store i64 %arg, ptr %e2, align 8 + ret void +} + +define void @maddpt1(i32 %pos, ptr %val) { +; CHECK-CPA-O0-LABEL: maddpt1: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: // implicit-def: $x8 +; CHECK-CPA-O0-NEXT: mov w8, w0 +; CHECK-CPA-O0-NEXT: sxtw x8, w8 +; CHECK-CPA-O0-NEXT: mov w9, #48 // =0x30 +; CHECK-CPA-O0-NEXT: // kill: def $x9 killed $w9 +; CHECK-CPA-O0-NEXT: adrp x10, array2 +; CHECK-CPA-O0-NEXT: add x10, x10, :lo12:array2 +; CHECK-CPA-O0-NEXT: maddpt x0, x8, x9, x10 +; CHECK-CPA-O0-NEXT: mov w8, #48 // =0x30 +; CHECK-CPA-O0-NEXT: mov w2, w8 +; CHECK-CPA-O0-NEXT: b memcpy +; +; CHECK-CPA-O3-LABEL: maddpt1: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: // kill: def $w0 killed $w0 def $x0 +; CHECK-CPA-O3-NEXT: sxtw x9, w0 +; CHECK-CPA-O3-NEXT: mov w8, #48 // =0x30 +; CHECK-CPA-O3-NEXT: ldr q0, [x1] +; CHECK-CPA-O3-NEXT: adrp x10, array2 +; CHECK-CPA-O3-NEXT: add x10, x10, :lo12:array2 +; CHECK-CPA-O3-NEXT: maddpt x8, x9, x8, x10 +; CHECK-CPA-O3-NEXT: str q0, [x8] +; CHECK-CPA-O3-NEXT: ldr q0, [x1, #16] +; CHECK-CPA-O3-NEXT: str q0, [x8, #16] +; CHECK-CPA-O3-NEXT: ldr q0, [x1, #32] +; CHECK-CPA-O3-NEXT: str q0, [x8, #32] +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: maddpt1: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: adrp x9, array2 +; CHECK-NOCPA-O0-NEXT: add x9, x9, :lo12:array2 +; CHECK-NOCPA-O0-NEXT: mov w8, #48 // =0x30 +; CHECK-NOCPA-O0-NEXT: smaddl x0, w0, w8, x9 +; CHECK-NOCPA-O0-NEXT: mov w8, #48 // =0x30 +; CHECK-NOCPA-O0-NEXT: mov w2, w8 +; CHECK-NOCPA-O0-NEXT: b memcpy +; +; CHECK-NOCPA-O3-LABEL: maddpt1: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: mov w8, #48 // =0x30 +; CHECK-NOCPA-O3-NEXT: adrp x9, array2 +; CHECK-NOCPA-O3-NEXT: add x9, x9, :lo12:array2 +; CHECK-NOCPA-O3-NEXT: smaddl x8, w0, w8, x9 +; CHECK-NOCPA-O3-NEXT: ldr q0, [x1] +; CHECK-NOCPA-O3-NEXT: str q0, [x8] +; CHECK-NOCPA-O3-NEXT: ldr q0, [x1, #16] +; CHECK-NOCPA-O3-NEXT: str q0, [x8, #16] +; CHECK-NOCPA-O3-NEXT: ldr q0, [x1, #32] +; CHECK-NOCPA-O3-NEXT: str q0, [x8, #32] +; CHECK-NOCPA-O3-NEXT: ret +entry: + %idxprom = sext i32 %pos to i64 + %arrayidx = getelementptr inbounds [10 x %struct.my_type2], ptr @array2, i64 0, i64 %idxprom + tail call void @llvm.memcpy.p0.p0.i64(ptr align 8 dereferenceable(48) %arrayidx, ptr align 8 dereferenceable(48) %val, i64 48, i1 false) + ret void +} + +define void @msubpt1(i32 %index, i32 %elem) { +; CHECK-CPA-O0-LABEL: msubpt1: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: // implicit-def: $x8 +; CHECK-CPA-O0-NEXT: mov w8, w0 +; CHECK-CPA-O0-NEXT: sxtw x10, w8 +; CHECK-CPA-O0-NEXT: mov w8, #48 // =0x30 +; CHECK-CPA-O0-NEXT: mov w9, w8 +; CHECK-CPA-O0-NEXT: mov w8, #288 // =0x120 +; CHECK-CPA-O0-NEXT: mov w11, w8 +; CHECK-CPA-O0-NEXT: adrp x8, array2 +; CHECK-CPA-O0-NEXT: add x8, x8, :lo12:array2 +; CHECK-CPA-O0-NEXT: addpt x11, x8, x11 +; CHECK-CPA-O0-NEXT: msubpt x0, x9, x10, x11 +; CHECK-CPA-O0-NEXT: mov w9, #48 // =0x30 +; CHECK-CPA-O0-NEXT: mov w2, w9 +; CHECK-CPA-O0-NEXT: mov w9, #96 // =0x60 +; CHECK-CPA-O0-NEXT: // kill: def $x9 killed $w9 +; CHECK-CPA-O0-NEXT: addpt x1, x8, x9 +; CHECK-CPA-O0-NEXT: b memcpy +; +; CHECK-CPA-O3-LABEL: msubpt1: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: // kill: def $w0 killed $w0 def $x0 +; CHECK-CPA-O3-NEXT: sxtw x9, w0 +; CHECK-CPA-O3-NEXT: adrp x10, array2+96 +; CHECK-CPA-O3-NEXT: add x10, x10, :lo12:array2+96 +; CHECK-CPA-O3-NEXT: mov w8, #48 // =0x30 +; CHECK-CPA-O3-NEXT: ldr q0, [x10] +; CHECK-CPA-O3-NEXT: msubpt x8, x8, x9, x10 +; CHECK-CPA-O3-NEXT: str q0, [x8, #192] +; CHECK-CPA-O3-NEXT: ldr q0, [x10, #16] +; CHECK-CPA-O3-NEXT: str q0, [x8, #208] +; CHECK-CPA-O3-NEXT: ldr q0, [x10, #32] +; CHECK-CPA-O3-NEXT: str q0, [x8, #224] +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: msubpt1: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: // implicit-def: $x8 +; CHECK-NOCPA-O0-NEXT: mov w8, w0 +; CHECK-NOCPA-O0-NEXT: sxtw x8, w8 +; CHECK-NOCPA-O0-NEXT: mov w9, #48 // =0x30 +; CHECK-NOCPA-O0-NEXT: // kill: def $x9 killed $w9 +; CHECK-NOCPA-O0-NEXT: mneg x10, x8, x9 +; CHECK-NOCPA-O0-NEXT: adrp x8, array2 +; CHECK-NOCPA-O0-NEXT: add x8, x8, :lo12:array2 +; CHECK-NOCPA-O0-NEXT: add x9, x8, #288 +; CHECK-NOCPA-O0-NEXT: add x0, x9, x10 +; CHECK-NOCPA-O0-NEXT: mov w9, #48 // =0x30 +; CHECK-NOCPA-O0-NEXT: mov w2, w9 +; CHECK-NOCPA-O0-NEXT: add x1, x8, #96 +; CHECK-NOCPA-O0-NEXT: b memcpy +; +; CHECK-NOCPA-O3-LABEL: msubpt1: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: // kill: def $w0 killed $w0 def $x0 +; CHECK-NOCPA-O3-NEXT: sxtw x8, w0 +; CHECK-NOCPA-O3-NEXT: mov w9, #48 // =0x30 +; CHECK-NOCPA-O3-NEXT: mneg x8, x8, x9 +; CHECK-NOCPA-O3-NEXT: adrp x9, array2+96 +; CHECK-NOCPA-O3-NEXT: add x9, x9, :lo12:array2+96 +; CHECK-NOCPA-O3-NEXT: ldr q0, [x9] +; CHECK-NOCPA-O3-NEXT: add x8, x9, x8 +; CHECK-NOCPA-O3-NEXT: str q0, [x8, #192] +; CHECK-NOCPA-O3-NEXT: ldr q0, [x9, #16] +; CHECK-NOCPA-O3-NEXT: str q0, [x8, #208] +; CHECK-NOCPA-O3-NEXT: ldr q0, [x9, #32] +; CHECK-NOCPA-O3-NEXT: str q0, [x8, #224] +; CHECK-NOCPA-O3-NEXT: ret +entry: + %idx.ext = sext i32 %index to i64 + %idx.neg = sub nsw i64 0, %idx.ext + %add.ptr = getelementptr inbounds %struct.my_type2, ptr getelementptr inbounds ([10 x %struct.my_type2], ptr @array2, i64 0, i64 6), i64 %idx.neg + tail call void @llvm.memcpy.p0.p0.i64(ptr align 8 dereferenceable(48) %add.ptr, ptr align 8 dereferenceable(48) getelementptr inbounds ([10 x %struct.my_type2], ptr @array2, i64 0, i64 2), i64 48, i1 false), !tbaa.struct !6 + ret void +} + +define void @subpt1(i32 %index, i32 %elem) { +; CHECK-CPA-O0-LABEL: subpt1: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: mov w8, #-16 // =0xfffffff0 +; CHECK-CPA-O0-NEXT: smull x9, w0, w8 +; CHECK-CPA-O0-NEXT: adrp x8, array +; CHECK-CPA-O0-NEXT: add x8, x8, :lo12:array +; CHECK-CPA-O0-NEXT: ldr q0, [x8, #32] +; CHECK-CPA-O0-NEXT: mov w10, #96 // =0x60 +; CHECK-CPA-O0-NEXT: // kill: def $x10 killed $w10 +; CHECK-CPA-O0-NEXT: addpt x8, x8, x10 +; CHECK-CPA-O0-NEXT: str q0, [x8, x9, lsl #4] +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: subpt1: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: mov w8, #-16 // =0xfffffff0 +; CHECK-CPA-O3-NEXT: adrp x9, array+32 +; CHECK-CPA-O3-NEXT: add x9, x9, :lo12:array+32 +; CHECK-CPA-O3-NEXT: smull x8, w0, w8 +; CHECK-CPA-O3-NEXT: ldr q0, [x9] +; CHECK-CPA-O3-NEXT: addpt x8, x9, x8, lsl #4 +; CHECK-CPA-O3-NEXT: str q0, [x8, #64] +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: subpt1: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: mov w8, #-16 // =0xfffffff0 +; CHECK-NOCPA-O0-NEXT: smull x9, w0, w8 +; CHECK-NOCPA-O0-NEXT: adrp x8, array +; CHECK-NOCPA-O0-NEXT: add x8, x8, :lo12:array +; CHECK-NOCPA-O0-NEXT: ldr q0, [x8, #32] +; CHECK-NOCPA-O0-NEXT: add x8, x8, #96 +; CHECK-NOCPA-O0-NEXT: str q0, [x8, x9, lsl #4] +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: subpt1: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: mov w8, #-16 // =0xfffffff0 +; CHECK-NOCPA-O3-NEXT: adrp x9, array+32 +; CHECK-NOCPA-O3-NEXT: add x9, x9, :lo12:array+32 +; CHECK-NOCPA-O3-NEXT: smull x8, w0, w8 +; CHECK-NOCPA-O3-NEXT: ldr q0, [x9] +; CHECK-NOCPA-O3-NEXT: add x8, x9, x8, lsl #4 +; CHECK-NOCPA-O3-NEXT: str q0, [x8, #64] +; CHECK-NOCPA-O3-NEXT: ret +entry: + %conv = sext i32 %index to i64 + %mul.neg = mul nsw i64 %conv, -16 + %add.ptr = getelementptr inbounds %struct.my_type, ptr getelementptr inbounds ([10 x %struct.my_type], ptr @array, i64 0, i64 6), i64 %mul.neg + tail call void @llvm.memcpy.p0.p0.i64(ptr noundef nonnull align 8 dereferenceable(16) %add.ptr, ptr noundef nonnull align 8 dereferenceable(16) getelementptr inbounds ([10 x %struct.my_type], ptr @array, i64 0, i64 2), i64 16, i1 false), !tbaa.struct !6 + ret void +} + +define void @subpt2(i32 %index, i32 %elem) { +; CHECK-CPA-O0-LABEL: subpt2: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: mov x8, xzr +; CHECK-CPA-O0-NEXT: subs x9, x8, w0, sxtw +; CHECK-CPA-O0-NEXT: adrp x8, array +; CHECK-CPA-O0-NEXT: add x8, x8, :lo12:array +; CHECK-CPA-O0-NEXT: ldr q0, [x8, #32] +; CHECK-CPA-O0-NEXT: mov w10, #96 // =0x60 +; CHECK-CPA-O0-NEXT: // kill: def $x10 killed $w10 +; CHECK-CPA-O0-NEXT: addpt x8, x8, x10 +; CHECK-CPA-O0-NEXT: str q0, [x8, x9, lsl #4] +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: subpt2: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: mov x8, xzr +; CHECK-CPA-O3-NEXT: adrp x9, array+32 +; CHECK-CPA-O3-NEXT: add x9, x9, :lo12:array+32 +; CHECK-CPA-O3-NEXT: sub x8, x8, w0, sxtw +; CHECK-CPA-O3-NEXT: ldr q0, [x9] +; CHECK-CPA-O3-NEXT: addpt x8, x9, x8, lsl #4 +; CHECK-CPA-O3-NEXT: str q0, [x8, #64] +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: subpt2: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: mov x8, xzr +; CHECK-NOCPA-O0-NEXT: subs x9, x8, w0, sxtw +; CHECK-NOCPA-O0-NEXT: adrp x8, array +; CHECK-NOCPA-O0-NEXT: add x8, x8, :lo12:array +; CHECK-NOCPA-O0-NEXT: ldr q0, [x8, #32] +; CHECK-NOCPA-O0-NEXT: add x8, x8, #96 +; CHECK-NOCPA-O0-NEXT: str q0, [x8, x9, lsl #4] +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: subpt2: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: mov x8, xzr +; CHECK-NOCPA-O3-NEXT: adrp x9, array+32 +; CHECK-NOCPA-O3-NEXT: add x9, x9, :lo12:array+32 +; CHECK-NOCPA-O3-NEXT: sub x8, x8, w0, sxtw +; CHECK-NOCPA-O3-NEXT: ldr q0, [x9] +; CHECK-NOCPA-O3-NEXT: add x8, x9, x8, lsl #4 +; CHECK-NOCPA-O3-NEXT: str q0, [x8, #64] +; CHECK-NOCPA-O3-NEXT: ret +entry: + %idx.ext = sext i32 %index to i64 + %idx.neg = sub nsw i64 0, %idx.ext + %add.ptr = getelementptr inbounds %struct.my_type, ptr getelementptr inbounds ([10 x %struct.my_type], ptr @array, i64 0, i64 6), i64 %idx.neg + tail call void @llvm.memcpy.p0.p0.i64(ptr noundef nonnull align 8 dereferenceable(16) %add.ptr, ptr noundef nonnull align 8 dereferenceable(16) getelementptr inbounds ([10 x %struct.my_type], ptr @array, i64 0, i64 2), i64 16, i1 false), !tbaa.struct !11 + ret void +} + +define ptr @subpt3(ptr %ptr, i32 %index) { +; CHECK-CPA-O0-LABEL: subpt3: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: mov x8, #-8 // =0xfffffffffffffff8 +; CHECK-CPA-O0-NEXT: addpt x0, x0, x8 +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: subpt3: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: mov x8, #-8 // =0xfffffffffffffff8 +; CHECK-CPA-O3-NEXT: addpt x0, x0, x8 +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: subpt3: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: subs x0, x0, #8 +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: subpt3: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: sub x0, x0, #8 +; CHECK-NOCPA-O3-NEXT: ret +entry: + %incdec.ptr.i.i.i = getelementptr inbounds i64, ptr %ptr, i64 -1 + ret ptr %incdec.ptr.i.i.i +} + +define i64 @subi64(i64 %ptr, i32 %index) { +; CHECK-CPA-O0-LABEL: subi64: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: subs x0, x0, #1 +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: subi64: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: sub x0, x0, #1 +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: subi64: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: subs x0, x0, #1 +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: subi64: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: sub x0, x0, #1 +; CHECK-NOCPA-O3-NEXT: ret +entry: + %incdec.ptr.i.i.i = add i64 %ptr, -1 + ret i64 %incdec.ptr.i.i.i +} + +define i32 @subi32(i32 %ptr, i32 %index) { +; CHECK-CPA-O0-LABEL: subi32: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: subs w0, w0, #1 +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: subi32: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: sub w0, w0, #1 +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: subi32: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: subs w0, w0, #1 +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: subi32: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: sub w0, w0, #1 +; CHECK-NOCPA-O3-NEXT: ret +entry: + %incdec.ptr.i.i.i = add i32 %ptr, -1 + ret i32 %incdec.ptr.i.i.i +} + +define i16 @subi16(i16 %ptr, i32 %index) { +; CHECK-CPA-O0-LABEL: subi16: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: subs w0, w0, #1 +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: subi16: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: sub w0, w0, #1 +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: subi16: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: subs w0, w0, #1 +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: subi16: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: sub w0, w0, #1 +; CHECK-NOCPA-O3-NEXT: ret +entry: + %incdec.ptr.i.i.i = add i16 %ptr, -1 + ret i16 %incdec.ptr.i.i.i +} + +define i64 @addi64(i64 %ptr, i32 %index) { +; CHECK-CPA-O0-LABEL: addi64: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: add x0, x0, #1 +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: addi64: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: add x0, x0, #1 +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: addi64: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: add x0, x0, #1 +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: addi64: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: add x0, x0, #1 +; CHECK-NOCPA-O3-NEXT: ret +entry: + %incdec.ptr.i.i.i = add i64 %ptr, 1 + ret i64 %incdec.ptr.i.i.i +} + +define i32 @addi32(i32 %ptr, i32 %index) { +; CHECK-CPA-O0-LABEL: addi32: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: add w0, w0, #1 +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: addi32: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: add w0, w0, #1 +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: addi32: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: add w0, w0, #1 +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: addi32: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: add w0, w0, #1 +; CHECK-NOCPA-O3-NEXT: ret +entry: + %incdec.ptr.i.i.i = add i32 %ptr, 1 + ret i32 %incdec.ptr.i.i.i +} + +define i16 @addi16(i16 %ptr, i32 %index) { +; CHECK-CPA-O0-LABEL: addi16: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: add w0, w0, #1 +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: addi16: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: add w0, w0, #1 +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: addi16: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: add w0, w0, #1 +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: addi16: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: add w0, w0, #1 +; CHECK-NOCPA-O3-NEXT: ret +entry: + %incdec.ptr.i.i.i = add i16 %ptr, 1 + ret i16 %incdec.ptr.i.i.i +} + +define i64 @arith1(i64 noundef %0, i64 noundef %1, i64 noundef %2) { +; CHECK-CPA-O0-LABEL: arith1: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: sub sp, sp, #32 +; CHECK-CPA-O0-NEXT: .cfi_def_cfa_offset 32 +; CHECK-CPA-O0-NEXT: str x0, [sp, #24] +; CHECK-CPA-O0-NEXT: str x1, [sp, #16] +; CHECK-CPA-O0-NEXT: str x2, [sp, #8] +; CHECK-CPA-O0-NEXT: ldr x8, [sp, #24] +; CHECK-CPA-O0-NEXT: ldr x9, [sp, #16] +; CHECK-CPA-O0-NEXT: ldr x10, [sp, #8] +; CHECK-CPA-O0-NEXT: mul x9, x9, x10 +; CHECK-CPA-O0-NEXT: add x0, x8, x9 +; CHECK-CPA-O0-NEXT: add sp, sp, #32 +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: arith1: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: sub sp, sp, #32 +; CHECK-CPA-O3-NEXT: .cfi_def_cfa_offset 32 +; CHECK-CPA-O3-NEXT: stp x2, x1, [sp, #8] +; CHECK-CPA-O3-NEXT: str x0, [sp, #24] +; CHECK-CPA-O3-NEXT: madd x0, x1, x2, x0 +; CHECK-CPA-O3-NEXT: add sp, sp, #32 +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: arith1: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: sub sp, sp, #32 +; CHECK-NOCPA-O0-NEXT: .cfi_def_cfa_offset 32 +; CHECK-NOCPA-O0-NEXT: str x0, [sp, #24] +; CHECK-NOCPA-O0-NEXT: str x1, [sp, #16] +; CHECK-NOCPA-O0-NEXT: str x2, [sp, #8] +; CHECK-NOCPA-O0-NEXT: ldr x8, [sp, #24] +; CHECK-NOCPA-O0-NEXT: ldr x9, [sp, #16] +; CHECK-NOCPA-O0-NEXT: ldr x10, [sp, #8] +; CHECK-NOCPA-O0-NEXT: mul x9, x9, x10 +; CHECK-NOCPA-O0-NEXT: add x0, x8, x9 +; CHECK-NOCPA-O0-NEXT: add sp, sp, #32 +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: arith1: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: sub sp, sp, #32 +; CHECK-NOCPA-O3-NEXT: .cfi_def_cfa_offset 32 +; CHECK-NOCPA-O3-NEXT: stp x2, x1, [sp, #8] +; CHECK-NOCPA-O3-NEXT: str x0, [sp, #24] +; CHECK-NOCPA-O3-NEXT: madd x0, x1, x2, x0 +; CHECK-NOCPA-O3-NEXT: add sp, sp, #32 +; CHECK-NOCPA-O3-NEXT: ret +entry: + %4 = alloca i64, align 8 + %5 = alloca i64, align 8 + %6 = alloca i64, align 8 + store i64 %0, ptr %4, align 8 + store i64 %1, ptr %5, align 8 + store i64 %2, ptr %6, align 8 + %7 = load i64, ptr %4, align 8 + %8 = load i64, ptr %5, align 8 + %9 = load i64, ptr %6, align 8 + %10 = mul nsw i64 %8, %9 + %11 = add nsw i64 %7, %10 + ret i64 %11 +} + +define i64 @arith2(ptr noundef %0, i64 noundef %1, i64 noundef %2, i32 noundef %3) { +; CHECK-CPA-O0-LABEL: arith2: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: sub sp, sp, #32 +; CHECK-CPA-O0-NEXT: .cfi_def_cfa_offset 32 +; CHECK-CPA-O0-NEXT: str x0, [sp, #24] +; CHECK-CPA-O0-NEXT: str x1, [sp, #16] +; CHECK-CPA-O0-NEXT: str x2, [sp, #8] +; CHECK-CPA-O0-NEXT: str w3, [sp, #4] +; CHECK-CPA-O0-NEXT: ldr x10, [sp, #24] +; CHECK-CPA-O0-NEXT: ldrsw x8, [sp, #4] +; CHECK-CPA-O0-NEXT: mov w9, #48 // =0x30 +; CHECK-CPA-O0-NEXT: // kill: def $x9 killed $w9 +; CHECK-CPA-O0-NEXT: maddpt x8, x8, x9, x10 +; CHECK-CPA-O0-NEXT: ldr x8, [x8, #24] +; CHECK-CPA-O0-NEXT: ldr x10, [sp, #16] +; CHECK-CPA-O0-NEXT: ldr x9, [sp, #8] +; CHECK-CPA-O0-NEXT: mul x10, x10, x9 +; CHECK-CPA-O0-NEXT: add x8, x8, x10 +; CHECK-CPA-O0-NEXT: subs x0, x8, x9 +; CHECK-CPA-O0-NEXT: add sp, sp, #32 +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: arith2: +; CHECK-CPA-O3: // %bb.0: // %entry +; CHECK-CPA-O3-NEXT: sub sp, sp, #32 +; CHECK-CPA-O3-NEXT: .cfi_def_cfa_offset 32 +; CHECK-CPA-O3-NEXT: str w3, [sp, #4] +; CHECK-CPA-O3-NEXT: mov w10, #48 // =0x30 +; CHECK-CPA-O3-NEXT: ldrsw x9, [sp, #4] +; CHECK-CPA-O3-NEXT: stp x1, x0, [sp, #16] +; CHECK-CPA-O3-NEXT: maddpt x8, x9, x10, x0 +; CHECK-CPA-O3-NEXT: str x2, [sp, #8] +; CHECK-CPA-O3-NEXT: ldr x8, [x8, #24] +; CHECK-CPA-O3-NEXT: madd x8, x1, x2, x8 +; CHECK-CPA-O3-NEXT: sub x0, x8, x2 +; CHECK-CPA-O3-NEXT: add sp, sp, #32 +; CHECK-CPA-O3-NEXT: ret +; +; CHECK-NOCPA-O0-LABEL: arith2: +; CHECK-NOCPA-O0: // %bb.0: // %entry +; CHECK-NOCPA-O0-NEXT: sub sp, sp, #32 +; CHECK-NOCPA-O0-NEXT: .cfi_def_cfa_offset 32 +; CHECK-NOCPA-O0-NEXT: str x0, [sp, #24] +; CHECK-NOCPA-O0-NEXT: str x1, [sp, #16] +; CHECK-NOCPA-O0-NEXT: str x2, [sp, #8] +; CHECK-NOCPA-O0-NEXT: str w3, [sp, #4] +; CHECK-NOCPA-O0-NEXT: ldr x8, [sp, #24] +; CHECK-NOCPA-O0-NEXT: ldrsw x9, [sp, #4] +; CHECK-NOCPA-O0-NEXT: mov w10, #48 // =0x30 +; CHECK-NOCPA-O0-NEXT: // kill: def $x10 killed $w10 +; CHECK-NOCPA-O0-NEXT: mul x9, x9, x10 +; CHECK-NOCPA-O0-NEXT: add x8, x8, x9 +; CHECK-NOCPA-O0-NEXT: ldr x8, [x8, #24] +; CHECK-NOCPA-O0-NEXT: ldr x10, [sp, #16] +; CHECK-NOCPA-O0-NEXT: ldr x9, [sp, #8] +; CHECK-NOCPA-O0-NEXT: mul x10, x10, x9 +; CHECK-NOCPA-O0-NEXT: add x8, x8, x10 +; CHECK-NOCPA-O0-NEXT: subs x0, x8, x9 +; CHECK-NOCPA-O0-NEXT: add sp, sp, #32 +; CHECK-NOCPA-O0-NEXT: ret +; +; CHECK-NOCPA-O3-LABEL: arith2: +; CHECK-NOCPA-O3: // %bb.0: // %entry +; CHECK-NOCPA-O3-NEXT: sub sp, sp, #32 +; CHECK-NOCPA-O3-NEXT: .cfi_def_cfa_offset 32 +; CHECK-NOCPA-O3-NEXT: str w3, [sp, #4] +; CHECK-NOCPA-O3-NEXT: mov w9, #48 // =0x30 +; CHECK-NOCPA-O3-NEXT: ldrsw x8, [sp, #4] +; CHECK-NOCPA-O3-NEXT: stp x1, x0, [sp, #16] +; CHECK-NOCPA-O3-NEXT: str x2, [sp, #8] +; CHECK-NOCPA-O3-NEXT: madd x8, x8, x9, x0 +; CHECK-NOCPA-O3-NEXT: ldr x8, [x8, #24] +; CHECK-NOCPA-O3-NEXT: madd x8, x1, x2, x8 +; CHECK-NOCPA-O3-NEXT: sub x0, x8, x2 +; CHECK-NOCPA-O3-NEXT: add sp, sp, #32 +; CHECK-NOCPA-O3-NEXT: ret +entry: + %5 = alloca ptr, align 8 + %6 = alloca i64, align 8 + %7 = alloca i64, align 8 + %8 = alloca i32, align 4 + store ptr %0, ptr %5, align 8 + store i64 %1, ptr %6, align 8 + store i64 %2, ptr %7, align 8 + store i32 %3, ptr %8, align 4 + %9 = load ptr, ptr %5, align 8 + %10 = load i32, ptr %8, align 4 + %11 = sext i32 %10 to i64 + %12 = getelementptr inbounds %struct.my_type2, ptr %9, i64 %11 + %13 = getelementptr inbounds %struct.my_type2, ptr %12, i32 0, i32 3 + %14 = load i64, ptr %13, align 8 + %15 = load i64, ptr %6, align 8 + %16 = load i64, ptr %7, align 8 + %17 = mul nsw i64 %15, %16 + %18 = add nsw i64 %14, %17 + %19 = sub nsw i64 %18, %16 + ret i64 %19 +} + +@a = hidden global [2 x [1 x [2 x i8]]] [[1 x [2 x i8]] [[2 x i8] c"\01\01"], [1 x [2 x i8]] [[2 x i8] c"\01\01"]], align 1 +@b = hidden global i16 0, align 2 + +define hidden void @multidim() { +; CHECK-CPA-O0-LABEL: multidim: +; CHECK-CPA-O0: // %bb.0: // %entry +; CHECK-CPA-O0-NEXT: adrp x8, b +; CHECK-CPA-O0-NEXT: ldrh w9, [x8, :lo12:b] +; CHECK-CPA-O0-NEXT: mov w10, w9 +; CHECK-CPA-O0-NEXT: ldrh w8, [x8, :lo12:b] +; CHECK-CPA-O0-NEXT: add w9, w8, #1 +; CHECK-CPA-O0-NEXT: // implicit-def: $x8 +; CHECK-CPA-O0-NEXT: mov w8, w9 +; CHECK-CPA-O0-NEXT: sxtw x9, w8 +; CHECK-CPA-O0-NEXT: mov w8, #2 // =0x2 +; CHECK-CPA-O0-NEXT: mov w11, w8 +; CHECK-CPA-O0-NEXT: adrp x8, a +; CHECK-CPA-O0-NEXT: add x8, x8, :lo12:a +; CHECK-CPA-O0-NEXT: addpt x8, x8, x11 +; CHECK-CPA-O0-NEXT: addpt x8, x8, x10, lsl #1 +; CHECK-CPA-O0-NEXT: addpt x8, x8, x9 +; CHECK-CPA-O0-NEXT: ldrb w8, [x8] +; CHECK-CPA-O0-NEXT: cbz w8, .LBB14_2 +; CHECK-CPA-O0-NEXT: b .LBB14_1 +; CHECK-CPA-O0-NEXT: .LBB14_1: // %if.then +; CHECK-CPA-O0-NEXT: b .LBB14_2 +; CHECK-CPA-O0-NEXT: .LBB14_2: // %if.end +; CHECK-CPA-O0-NEXT: ret +; +; CHECK-CPA-O3-LABEL: multidim: +; CHECK-CPA-O3: // %bb.0: // %entry ---------------- davemgreen wrote:
Is it worth adding a store or call to this example to make sure it doesn't all optimize away. https://github.com/llvm/llvm-project/pull/105669 _______________________________________________ cfe-commits mailing list cfe-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits