|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 |
| 2 | +; Test the generation of asm for the function: |
| 3 | +; int foo(_Atomic int *cp, int *old, int c) { |
| 4 | +; return atomic_compare_exchange_weak_explicit(cp, old, c, __ATOMIC_RELAXED, __ATOMIC_RELAXED); |
| 5 | +; } |
| 6 | + |
| 7 | +; RUN: llc < %s -ppc-asm-full-reg-names -mtriple=powerpc-ibm-aix -mcpu=pwr8 -verify-machineinstrs |\ |
| 8 | +; FileCheck %s --check-prefix=CHECK |
| 9 | +; RUN: llc < %s -ppc-asm-full-reg-names -mtriple=powerpc64-ibm-aix -mcpu=pwr8 -verify-machineinstrs |\ |
| 10 | +; FileCheck %s --check-prefix=CHECK64 |
| 11 | + |
| 12 | +define i32 @foo(ptr noundef %cp, ptr noundef %old, i32 noundef %c) { |
| 13 | +; CHECK-LABEL: foo: |
| 14 | +; CHECK: # %bb.0: # %entry |
| 15 | +; CHECK-NEXT: lwz r7, 0(r4) |
| 16 | +; CHECK-NEXT: stw r3, -4(r1) |
| 17 | +; CHECK-NEXT: stw r4, -8(r1) |
| 18 | +; CHECK-NEXT: stw r5, -12(r1) |
| 19 | +; CHECK-NEXT: stw r5, -16(r1) |
| 20 | +; CHECK-NEXT: L..BB0_1: # %entry |
| 21 | +; CHECK-NEXT: # |
| 22 | +; CHECK-NEXT: lwarx r6, 0, r3 |
| 23 | +; CHECK-NEXT: cmpw cr1, r6, r7 |
| 24 | +; CHECK-NEXT: bne cr1, L..BB0_3 |
| 25 | +; CHECK-NEXT: # %bb.2: # %entry |
| 26 | +; CHECK-NEXT: # |
| 27 | +; CHECK-NEXT: stwcx. r5, 0, r3 |
| 28 | +; CHECK-NEXT: bne cr0, L..BB0_1 |
| 29 | +; CHECK-NEXT: L..BB0_3: # %entry |
| 30 | +; CHECK-NEXT: cmplw r6, r7 |
| 31 | +; CHECK-NEXT: beq cr0, L..BB0_5 |
| 32 | +; CHECK-NEXT: # %bb.4: # %cmpxchg.store_expected |
| 33 | +; CHECK-NEXT: stw r6, 0(r4) |
| 34 | +; CHECK-NEXT: L..BB0_5: # %cmpxchg.continue |
| 35 | +; CHECK-NEXT: li r3, 0 |
| 36 | +; CHECK-NEXT: li r4, 1 |
| 37 | +; CHECK-NEXT: isel r3, r4, r3, 4*cr1+eq |
| 38 | +; CHECK-NEXT: stb r3, -17(r1) |
| 39 | +; CHECK-NEXT: blr |
| 40 | +; |
| 41 | +; CHECK64-LABEL: foo: |
| 42 | +; CHECK64: # %bb.0: # %entry |
| 43 | +; CHECK64-NEXT: lwz r7, 0(r4) |
| 44 | +; CHECK64-NEXT: std r3, -8(r1) |
| 45 | +; CHECK64-NEXT: std r4, -16(r1) |
| 46 | +; CHECK64-NEXT: stw r5, -20(r1) |
| 47 | +; CHECK64-NEXT: stw r5, -24(r1) |
| 48 | +; CHECK64-NEXT: L..BB0_1: # %entry |
| 49 | +; CHECK64-NEXT: # |
| 50 | +; CHECK64-NEXT: lwarx r6, 0, r3 |
| 51 | +; CHECK64-NEXT: cmpw cr1, r6, r7 |
| 52 | +; CHECK64-NEXT: bne cr1, L..BB0_3 |
| 53 | +; CHECK64-NEXT: # %bb.2: # %entry |
| 54 | +; CHECK64-NEXT: # |
| 55 | +; CHECK64-NEXT: stwcx. r5, 0, r3 |
| 56 | +; CHECK64-NEXT: bne cr0, L..BB0_1 |
| 57 | +; CHECK64-NEXT: L..BB0_3: # %entry |
| 58 | +; CHECK64-NEXT: cmplw r6, r7 |
| 59 | +; CHECK64-NEXT: beq cr0, L..BB0_5 |
| 60 | +; CHECK64-NEXT: # %bb.4: # %cmpxchg.store_expected |
| 61 | +; CHECK64-NEXT: stw r6, 0(r4) |
| 62 | +; CHECK64-NEXT: L..BB0_5: # %cmpxchg.continue |
| 63 | +; CHECK64-NEXT: li r3, 0 |
| 64 | +; CHECK64-NEXT: li r4, 1 |
| 65 | +; CHECK64-NEXT: isel r3, r4, r3, 4*cr1+eq |
| 66 | +; CHECK64-NEXT: li r4, 1 |
| 67 | +; CHECK64-NEXT: stb r3, -25(r1) |
| 68 | +; CHECK64-NEXT: li r3, 0 |
| 69 | +; CHECK64-NEXT: isel r3, r4, r3, 4*cr1+eq |
| 70 | +; CHECK64-NEXT: blr |
| 71 | +entry: |
| 72 | + %cp.addr = alloca ptr, align 4 |
| 73 | + %old.addr = alloca ptr, align 4 |
| 74 | + %c.addr = alloca i32, align 4 |
| 75 | + %.atomictmp = alloca i32, align 4 |
| 76 | + %cmpxchg.bool = alloca i8, align 1 |
| 77 | + store ptr %cp, ptr %cp.addr, align 4 |
| 78 | + store ptr %old, ptr %old.addr, align 4 |
| 79 | + store i32 %c, ptr %c.addr, align 4 |
| 80 | + %0 = load ptr, ptr %cp.addr, align 4 |
| 81 | + %1 = load ptr, ptr %old.addr, align 4 |
| 82 | + %2 = load i32, ptr %c.addr, align 4 |
| 83 | + store i32 %2, ptr %.atomictmp, align 4 |
| 84 | + %3 = load i32, ptr %1, align 4 |
| 85 | + %4 = load i32, ptr %.atomictmp, align 4 |
| 86 | + %5 = cmpxchg weak ptr %0, i32 %3, i32 %4 monotonic monotonic, align 4 |
| 87 | + %6 = extractvalue { i32, i1 } %5, 0 |
| 88 | + %7 = extractvalue { i32, i1 } %5, 1 |
| 89 | + br i1 %7, label %cmpxchg.continue, label %cmpxchg.store_expected |
| 90 | + |
| 91 | +cmpxchg.store_expected: ; preds = %entry |
| 92 | + store i32 %6, ptr %1, align 4 |
| 93 | + br label %cmpxchg.continue |
| 94 | + |
| 95 | +cmpxchg.continue: ; preds = %cmpxchg.store_expected, %entry |
| 96 | + %storedv = zext i1 %7 to i8 |
| 97 | + store i8 %storedv, ptr %cmpxchg.bool, align 1 |
| 98 | + %8 = load i8, ptr %cmpxchg.bool, align 1 |
| 99 | + %loadedv = trunc i8 %8 to i1 |
| 100 | + %conv = zext i1 %loadedv to i32 |
| 101 | + ret i32 %conv |
| 102 | +} |
0 commit comments