; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-unknown \
; RUN:   < %s | FileCheck --check-prefix=CHECK-64 %s
; RUN: llc -verify-machineinstrs -mtriple=powerpc-unknown-unknown \
; RUN:   < %s | FileCheck --check-prefix=CHECK-32 %s

; Code generation test for a sequentially consistent floating-point
; `atomicrmw fadd` on PowerPC, exercised for both the 64-bit and the 32-bit
; triple. The expected assembly below is a retry loop: the current value is
; loaded with lfs, the sum is formed with fadds, the old and new values are
; moved into GPRs through stack slots (stfs followed by lwz), and an inner
; lwarx / cmpw / stwcx. sequence attempts the exchange. The whole sequence is
; preceded by sync and followed by lwsync. The 32-bit variant additionally
; allocates and releases a 32-byte stack frame (stwu / addi).
;
; The assertions are generated; after a codegen change, regenerate them with
; the script named in the NOTE line rather than editing them by hand.

define float @test_add(float* %ptr, float %incr) {
; CHECK-64-LABEL: test_add:
; CHECK-64:       # %bb.0: # %entry
; CHECK-64-NEXT:    sync
; CHECK-64-NEXT:    lfs 0, 0(3)
; CHECK-64-NEXT:    b .LBB0_3
; CHECK-64-NEXT:  .LBB0_1: # %atomicrmw.start
; CHECK-64-NEXT:    #
; CHECK-64-NEXT:    stwcx. 5, 0, 3
; CHECK-64-NEXT:  .LBB0_2: # %atomicrmw.start
; CHECK-64-NEXT:    #
; CHECK-64-NEXT:    stw 5, -4(1)
; CHECK-64-NEXT:    cmplw 5, 4
; CHECK-64-NEXT:    lfs 0, -4(1)
; CHECK-64-NEXT:    beq 0, .LBB0_6
; CHECK-64-NEXT:  .LBB0_3: # %atomicrmw.start
; CHECK-64-NEXT:    # =>This Loop Header: Depth=1
; CHECK-64-NEXT:    # Child Loop BB0_4 Depth 2
; CHECK-64-NEXT:    fadds 2, 0, 1
; CHECK-64-NEXT:    stfs 2, -8(1)
; CHECK-64-NEXT:    stfs 0, -12(1)
; CHECK-64-NEXT:    lwz 6, -8(1)
; CHECK-64-NEXT:    lwz 4, -12(1)
; CHECK-64-NEXT:  .LBB0_4: # %atomicrmw.start
; CHECK-64-NEXT:    # Parent Loop BB0_3 Depth=1
; CHECK-64-NEXT:    # => This Inner Loop Header: Depth=2
; CHECK-64-NEXT:    lwarx 5, 0, 3
; CHECK-64-NEXT:    cmpw 4, 5
; CHECK-64-NEXT:    bne 0, .LBB0_1
; CHECK-64-NEXT:  # %bb.5: # %atomicrmw.start
; CHECK-64-NEXT:    #
; CHECK-64-NEXT:    stwcx. 6, 0, 3
; CHECK-64-NEXT:    bne 0, .LBB0_4
; CHECK-64-NEXT:    b .LBB0_2
; CHECK-64-NEXT:  .LBB0_6: # %atomicrmw.end
; CHECK-64-NEXT:    fmr 1, 0
; CHECK-64-NEXT:    lwsync
; CHECK-64-NEXT:    blr
;
; CHECK-32-LABEL: test_add:
; CHECK-32:       # %bb.0: # %entry
; CHECK-32-NEXT:    stwu 1, -32(1)
; CHECK-32-NEXT:    .cfi_def_cfa_offset 32
; CHECK-32-NEXT:    sync
; CHECK-32-NEXT:    lfs 0, 0(3)
; CHECK-32-NEXT:    b .LBB0_3
; CHECK-32-NEXT:  .LBB0_1: # %atomicrmw.start
; CHECK-32-NEXT:    #
; CHECK-32-NEXT:    stwcx. 5, 0, 3
; CHECK-32-NEXT:  .LBB0_2: # %atomicrmw.start
; CHECK-32-NEXT:    #
; CHECK-32-NEXT:    stw 5, 28(1)
; CHECK-32-NEXT:    cmplw 5, 4
; CHECK-32-NEXT:    lfs 0, 28(1)
; CHECK-32-NEXT:    beq 0, .LBB0_6
; CHECK-32-NEXT:  .LBB0_3: # %atomicrmw.start
; CHECK-32-NEXT:    # =>This Loop Header: Depth=1
; CHECK-32-NEXT:    # Child Loop BB0_4 Depth 2
; CHECK-32-NEXT:    fadds 2, 0, 1
; CHECK-32-NEXT:    stfs 2, 24(1)
; CHECK-32-NEXT:    stfs 0, 20(1)
; CHECK-32-NEXT:    lwz 6, 24(1)
; CHECK-32-NEXT:    lwz 4, 20(1)
; CHECK-32-NEXT:  .LBB0_4: # %atomicrmw.start
; CHECK-32-NEXT:    # Parent Loop BB0_3 Depth=1
; CHECK-32-NEXT:    # => This Inner Loop Header: Depth=2
; CHECK-32-NEXT:    lwarx 5, 0, 3
; CHECK-32-NEXT:    cmpw 4, 5
; CHECK-32-NEXT:    bne 0, .LBB0_1
; CHECK-32-NEXT:  # %bb.5: # %atomicrmw.start
; CHECK-32-NEXT:    #
; CHECK-32-NEXT:    stwcx. 6, 0, 3
; CHECK-32-NEXT:    bne 0, .LBB0_4
; CHECK-32-NEXT:    b .LBB0_2
; CHECK-32-NEXT:  .LBB0_6: # %atomicrmw.end
; CHECK-32-NEXT:    fmr 1, 0
; CHECK-32-NEXT:    lwsync
; CHECK-32-NEXT:    addi 1, 1, 32
; CHECK-32-NEXT:    blr
entry:
  %r = atomicrmw fadd float* %ptr, float %incr seq_cst
  ret float %r
}