932 lines
		
	
	
		
			28 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			932 lines
		
	
	
		
			28 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
 | |
| ; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-unknown \
 | |
| ; RUN:   -mcpu=pwr8 -ppc-asm-full-reg-names -ppc-track-subreg-liveness \
 | |
| ; RUN:   -ppc-quadword-atomics < %s | FileCheck --check-prefix=P8 %s
 | |
| ; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-unknown -mcpu=pwr7 \
 | |
| ; RUN:   -ppc-asm-full-reg-names -ppc-quadword-atomics \
 | |
| ; RUN:   -ppc-track-subreg-liveness < %s | FileCheck --check-prefix=PWR7 %s
 | |
| ; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu -mcpu=pwr8 \
 | |
| ; RUN:   -ppc-asm-full-reg-names -ppc-track-subreg-liveness < %s | FileCheck \
 | |
| ; RUN:   --check-prefix=LE-PWR8 %s
 | |
| ; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-freebsd -mcpu=pwr8 \
 | |
| ; RUN:   -ppc-asm-full-reg-names -ppc-track-subreg-liveness < %s | FileCheck \
 | |
| ; RUN:   --check-prefix=LE-PWR8 %s
 | |
| ; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-aix -mcpu=pwr8 \
 | |
| ; RUN:   -ppc-asm-full-reg-names -ppc-track-subreg-liveness < %s | FileCheck \
 | |
| ; RUN:   --check-prefix=AIX64-PWR8 %s
 | |
| ; RUN: llc -verify-machineinstrs -mtriple=powerpc-unknown-unknown -mcpu=pwr8 \
 | |
| ; RUN:   -ppc-quadword-atomics -ppc-asm-full-reg-names -ppc-track-subreg-liveness < %s \
 | |
| ; RUN: | FileCheck --check-prefix=PPC-PWR8 %s
 | |
| 
 | |
| define dso_local i128 @lq_unordered(i128* %src) {
 | |
| ; P8-LABEL: lq_unordered:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    lq r4, 0(r3)
 | |
| ; P8-NEXT:    mr r3, r4
 | |
| ; P8-NEXT:    mr r4, r5
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: lq_unordered:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    li r4, 0
 | |
| ; PWR7-NEXT:    bl __atomic_load_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: lq_unordered:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    lq r4, 0(r3)
 | |
| ; LE-PWR8-NEXT:    mr r3, r5
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: lq_unordered:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    li r4, 0
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_load_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: lq_unordered:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    mr r4, r3
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    li r6, 0
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_load
 | |
| ; PPC-PWR8-NEXT:    lwz r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   %0 = load atomic i128, i128* %src unordered, align 16
 | |
|   ret i128 %0
 | |
| }
 | |
| 
 | |
| define dso_local i128 @lqx_unordered(i128* %src, i64 %idx) {
 | |
| ; P8-LABEL: lqx_unordered:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    sldi r4, r4, 4
 | |
| ; P8-NEXT:    add r3, r3, r4
 | |
| ; P8-NEXT:    lq r4, 0(r3)
 | |
| ; P8-NEXT:    mr r3, r4
 | |
| ; P8-NEXT:    mr r4, r5
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: lqx_unordered:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    sldi r4, r4, 4
 | |
| ; PWR7-NEXT:    add r3, r3, r4
 | |
| ; PWR7-NEXT:    li r4, 0
 | |
| ; PWR7-NEXT:    bl __atomic_load_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: lqx_unordered:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    sldi r4, r4, 4
 | |
| ; LE-PWR8-NEXT:    std r2, -8(r1) # 8-byte Folded Spill
 | |
| ; LE-PWR8-NEXT:    add r4, r3, r4
 | |
| ; LE-PWR8-NEXT:    lq r2, 0(r4)
 | |
| ; LE-PWR8-NEXT:    mr r4, r2
 | |
| ; LE-PWR8-NEXT:    ld r2, -8(r1) # 8-byte Folded Reload
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: lqx_unordered:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    sldi r4, r4, 4
 | |
| ; AIX64-PWR8-NEXT:    add r3, r3, r4
 | |
| ; AIX64-PWR8-NEXT:    li r4, 0
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_load_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: lqx_unordered:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    slwi r4, r6, 4
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    li r6, 0
 | |
| ; PPC-PWR8-NEXT:    add r4, r3, r4
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_load
 | |
| ; PPC-PWR8-NEXT:    lwz r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   %0 = getelementptr i128, i128* %src, i64 %idx
 | |
|   %1 = load atomic i128, i128* %0 unordered, align 16
 | |
|   ret i128 %1
 | |
| }
 | |
| 
 | |
| define dso_local i128 @lq_big_offset_unordered(i128* %src) {
 | |
| ; P8-LABEL: lq_big_offset_unordered:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    lis r4, 32
 | |
| ; P8-NEXT:    add r3, r3, r4
 | |
| ; P8-NEXT:    lq r4, 0(r3)
 | |
| ; P8-NEXT:    mr r3, r4
 | |
| ; P8-NEXT:    mr r4, r5
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: lq_big_offset_unordered:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    addis r3, r3, 32
 | |
| ; PWR7-NEXT:    li r4, 0
 | |
| ; PWR7-NEXT:    bl __atomic_load_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: lq_big_offset_unordered:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    lis r4, 32
 | |
| ; LE-PWR8-NEXT:    std r2, -8(r1) # 8-byte Folded Spill
 | |
| ; LE-PWR8-NEXT:    add r4, r3, r4
 | |
| ; LE-PWR8-NEXT:    lq r2, 0(r4)
 | |
| ; LE-PWR8-NEXT:    mr r4, r2
 | |
| ; LE-PWR8-NEXT:    ld r2, -8(r1) # 8-byte Folded Reload
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: lq_big_offset_unordered:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    addis r3, r3, 32
 | |
| ; AIX64-PWR8-NEXT:    li r4, 0
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_load_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: lq_big_offset_unordered:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    addis r4, r3, 32
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    li r6, 0
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_load
 | |
| ; PPC-PWR8-NEXT:    lwz r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   %0 = getelementptr i128, i128* %src, i64 131072
 | |
|   %1 = load atomic i128, i128* %0 unordered, align 16
 | |
|   ret i128 %1
 | |
| }
 | |
| 
 | |
| define dso_local i128 @lq_monotonic(i128* %src) {
 | |
| ; P8-LABEL: lq_monotonic:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    lq r4, 0(r3)
 | |
| ; P8-NEXT:    mr r3, r4
 | |
| ; P8-NEXT:    mr r4, r5
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: lq_monotonic:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    li r4, 0
 | |
| ; PWR7-NEXT:    bl __atomic_load_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: lq_monotonic:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    lq r4, 0(r3)
 | |
| ; LE-PWR8-NEXT:    mr r3, r5
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: lq_monotonic:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    li r4, 0
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_load_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: lq_monotonic:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    mr r4, r3
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    li r6, 0
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_load
 | |
| ; PPC-PWR8-NEXT:    lwz r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   %0 = load atomic i128, i128* %src monotonic, align 16
 | |
|   ret i128 %0
 | |
| }
 | |
| 
 | |
| define dso_local i128 @lq_acquire(i128* %src) {
 | |
| ; P8-LABEL: lq_acquire:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    lq r4, 0(r3)
 | |
| ; P8-NEXT:    cmpd cr7, r5, r5
 | |
| ; P8-NEXT:    mr r3, r4
 | |
| ; P8-NEXT:    mr r4, r5
 | |
| ; P8-NEXT:    bne- cr7, .+4
 | |
| ; P8-NEXT:    isync
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: lq_acquire:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    li r4, 2
 | |
| ; PWR7-NEXT:    bl __atomic_load_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: lq_acquire:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    lq r4, 0(r3)
 | |
| ; LE-PWR8-NEXT:    cmpd cr7, r5, r5
 | |
| ; LE-PWR8-NEXT:    mr r3, r5
 | |
| ; LE-PWR8-NEXT:    bne- cr7, .+4
 | |
| ; LE-PWR8-NEXT:    isync
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: lq_acquire:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    li r4, 2
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_load_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: lq_acquire:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    mr r4, r3
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    li r6, 2
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_load
 | |
| ; PPC-PWR8-NEXT:    lwz r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   %0 = load atomic i128, i128* %src acquire, align 16
 | |
|   ret i128 %0
 | |
| }
 | |
| 
 | |
| define dso_local i128 @lq_seqcst(i128* %src) {
 | |
| ; P8-LABEL: lq_seqcst:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    sync
 | |
| ; P8-NEXT:    lq r4, 0(r3)
 | |
| ; P8-NEXT:    cmpd cr7, r5, r5
 | |
| ; P8-NEXT:    mr r3, r4
 | |
| ; P8-NEXT:    mr r4, r5
 | |
| ; P8-NEXT:    bne- cr7, .+4
 | |
| ; P8-NEXT:    isync
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: lq_seqcst:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    li r4, 5
 | |
| ; PWR7-NEXT:    bl __atomic_load_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: lq_seqcst:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    sync
 | |
| ; LE-PWR8-NEXT:    lq r4, 0(r3)
 | |
| ; LE-PWR8-NEXT:    cmpd cr7, r5, r5
 | |
| ; LE-PWR8-NEXT:    mr r3, r5
 | |
| ; LE-PWR8-NEXT:    bne- cr7, .+4
 | |
| ; LE-PWR8-NEXT:    isync
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: lq_seqcst:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    li r4, 5
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_load_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: lq_seqcst:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    mr r4, r3
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    li r6, 5
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_load
 | |
| ; PPC-PWR8-NEXT:    lwz r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   %0 = load atomic i128, i128* %src seq_cst, align 16
 | |
|   ret i128 %0
 | |
| }
 | |
| 
 | |
| define dso_local void @stq_unordered(i128 %val, i128* %dst) {
 | |
| ; P8-LABEL: stq_unordered:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    mr r7, r4
 | |
| ; P8-NEXT:    mr r6, r3
 | |
| ; P8-NEXT:    stq r6, 0(r5)
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: stq_unordered:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    mr r6, r4
 | |
| ; PWR7-NEXT:    mr r4, r3
 | |
| ; PWR7-NEXT:    mr r3, r5
 | |
| ; PWR7-NEXT:    mr r5, r6
 | |
| ; PWR7-NEXT:    li r6, 0
 | |
| ; PWR7-NEXT:    bl __atomic_store_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: stq_unordered:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    mr r7, r3
 | |
| ; LE-PWR8-NEXT:    mr r6, r4
 | |
| ; LE-PWR8-NEXT:    stq r6, 0(r5)
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: stq_unordered:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    mr r6, r4
 | |
| ; AIX64-PWR8-NEXT:    mr r4, r3
 | |
| ; AIX64-PWR8-NEXT:    mr r3, r5
 | |
| ; AIX64-PWR8-NEXT:    mr r5, r6
 | |
| ; AIX64-PWR8-NEXT:    li r6, 0
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_store_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: stq_unordered:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    stw r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    li r6, 0
 | |
| ; PPC-PWR8-NEXT:    stw r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    mr r4, r7
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_store
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   store atomic i128 %val, i128* %dst unordered, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @stqx_unordered(i128 %val, i128* %dst, i64 %idx) {
 | |
| ; P8-LABEL: stqx_unordered:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    sldi r6, r6, 4
 | |
| ; P8-NEXT:    mr r9, r4
 | |
| ; P8-NEXT:    mr r8, r3
 | |
| ; P8-NEXT:    add r3, r5, r6
 | |
| ; P8-NEXT:    stq r8, 0(r3)
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: stqx_unordered:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    mr r7, r4
 | |
| ; PWR7-NEXT:    mr r4, r3
 | |
| ; PWR7-NEXT:    sldi r3, r6, 4
 | |
| ; PWR7-NEXT:    li r6, 0
 | |
| ; PWR7-NEXT:    add r3, r5, r3
 | |
| ; PWR7-NEXT:    mr r5, r7
 | |
| ; PWR7-NEXT:    bl __atomic_store_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: stqx_unordered:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    sldi r6, r6, 4
 | |
| ; LE-PWR8-NEXT:    mr r9, r3
 | |
| ; LE-PWR8-NEXT:    mr r8, r4
 | |
| ; LE-PWR8-NEXT:    add r3, r5, r6
 | |
| ; LE-PWR8-NEXT:    stq r8, 0(r3)
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: stqx_unordered:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    mr r7, r4
 | |
| ; AIX64-PWR8-NEXT:    mr r4, r3
 | |
| ; AIX64-PWR8-NEXT:    sldi r3, r6, 4
 | |
| ; AIX64-PWR8-NEXT:    li r6, 0
 | |
| ; AIX64-PWR8-NEXT:    add r3, r5, r3
 | |
| ; AIX64-PWR8-NEXT:    mr r5, r7
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_store_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: stqx_unordered:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    slwi r8, r10, 4
 | |
| ; PPC-PWR8-NEXT:    stw r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    add r6, r7, r8
 | |
| ; PPC-PWR8-NEXT:    stw r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    mr r4, r6
 | |
| ; PPC-PWR8-NEXT:    li r6, 0
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_store
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   %0 = getelementptr i128, i128* %dst, i64 %idx
 | |
|   store atomic i128 %val, i128* %0 unordered, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @stq_big_offset_unordered(i128 %val, i128* %dst) {
 | |
| ; P8-LABEL: stq_big_offset_unordered:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    lis r6, 32
 | |
| ; P8-NEXT:    mr r9, r4
 | |
| ; P8-NEXT:    mr r8, r3
 | |
| ; P8-NEXT:    add r3, r5, r6
 | |
| ; P8-NEXT:    stq r8, 0(r3)
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: stq_big_offset_unordered:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    mr r6, r4
 | |
| ; PWR7-NEXT:    mr r4, r3
 | |
| ; PWR7-NEXT:    addis r3, r5, 32
 | |
| ; PWR7-NEXT:    mr r5, r6
 | |
| ; PWR7-NEXT:    li r6, 0
 | |
| ; PWR7-NEXT:    bl __atomic_store_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: stq_big_offset_unordered:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    lis r6, 32
 | |
| ; LE-PWR8-NEXT:    mr r9, r3
 | |
| ; LE-PWR8-NEXT:    mr r8, r4
 | |
| ; LE-PWR8-NEXT:    add r3, r5, r6
 | |
| ; LE-PWR8-NEXT:    stq r8, 0(r3)
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: stq_big_offset_unordered:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    mr r6, r4
 | |
| ; AIX64-PWR8-NEXT:    mr r4, r3
 | |
| ; AIX64-PWR8-NEXT:    addis r3, r5, 32
 | |
| ; AIX64-PWR8-NEXT:    mr r5, r6
 | |
| ; AIX64-PWR8-NEXT:    li r6, 0
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_store_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: stq_big_offset_unordered:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    stw r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    addis r6, r7, 32
 | |
| ; PPC-PWR8-NEXT:    stw r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    stw r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    mr r4, r6
 | |
| ; PPC-PWR8-NEXT:    li r6, 0
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_store
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   %0 = getelementptr i128, i128* %dst, i64 131072
 | |
|   store atomic i128 %val, i128* %0 unordered, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @stq_monotonic(i128 %val, i128* %dst) {
 | |
| ; P8-LABEL: stq_monotonic:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    mr r7, r4
 | |
| ; P8-NEXT:    mr r6, r3
 | |
| ; P8-NEXT:    stq r6, 0(r5)
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: stq_monotonic:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    mr r6, r4
 | |
| ; PWR7-NEXT:    mr r4, r3
 | |
| ; PWR7-NEXT:    mr r3, r5
 | |
| ; PWR7-NEXT:    mr r5, r6
 | |
| ; PWR7-NEXT:    li r6, 0
 | |
| ; PWR7-NEXT:    bl __atomic_store_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: stq_monotonic:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    mr r7, r3
 | |
| ; LE-PWR8-NEXT:    mr r6, r4
 | |
| ; LE-PWR8-NEXT:    stq r6, 0(r5)
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: stq_monotonic:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    mr r6, r4
 | |
| ; AIX64-PWR8-NEXT:    mr r4, r3
 | |
| ; AIX64-PWR8-NEXT:    mr r3, r5
 | |
| ; AIX64-PWR8-NEXT:    mr r5, r6
 | |
| ; AIX64-PWR8-NEXT:    li r6, 0
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_store_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: stq_monotonic:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    stw r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    li r6, 0
 | |
| ; PPC-PWR8-NEXT:    stw r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    mr r4, r7
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_store
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   store atomic i128 %val, i128* %dst monotonic, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @stq_release(i128 %val, i128* %dst) {
 | |
| ; P8-LABEL: stq_release:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    lwsync
 | |
| ; P8-NEXT:    mr r7, r4
 | |
| ; P8-NEXT:    mr r6, r3
 | |
| ; P8-NEXT:    stq r6, 0(r5)
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: stq_release:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    mr r6, r4
 | |
| ; PWR7-NEXT:    mr r4, r3
 | |
| ; PWR7-NEXT:    mr r3, r5
 | |
| ; PWR7-NEXT:    mr r5, r6
 | |
| ; PWR7-NEXT:    li r6, 3
 | |
| ; PWR7-NEXT:    bl __atomic_store_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: stq_release:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    lwsync
 | |
| ; LE-PWR8-NEXT:    mr r7, r3
 | |
| ; LE-PWR8-NEXT:    mr r6, r4
 | |
| ; LE-PWR8-NEXT:    stq r6, 0(r5)
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: stq_release:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    mr r6, r4
 | |
| ; AIX64-PWR8-NEXT:    mr r4, r3
 | |
| ; AIX64-PWR8-NEXT:    mr r3, r5
 | |
| ; AIX64-PWR8-NEXT:    mr r5, r6
 | |
| ; AIX64-PWR8-NEXT:    li r6, 3
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_store_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: stq_release:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    stw r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    li r6, 3
 | |
| ; PPC-PWR8-NEXT:    stw r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    mr r4, r7
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_store
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   store atomic i128 %val, i128* %dst release, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @stq_seqcst(i128 %val, i128* %dst) {
 | |
| ; P8-LABEL: stq_seqcst:
 | |
| ; P8:       # %bb.0: # %entry
 | |
| ; P8-NEXT:    sync
 | |
| ; P8-NEXT:    mr r7, r4
 | |
| ; P8-NEXT:    mr r6, r3
 | |
| ; P8-NEXT:    stq r6, 0(r5)
 | |
| ; P8-NEXT:    blr
 | |
| ;
 | |
| ; PWR7-LABEL: stq_seqcst:
 | |
| ; PWR7:       # %bb.0: # %entry
 | |
| ; PWR7-NEXT:    mflr r0
 | |
| ; PWR7-NEXT:    std r0, 16(r1)
 | |
| ; PWR7-NEXT:    stdu r1, -112(r1)
 | |
| ; PWR7-NEXT:    .cfi_def_cfa_offset 112
 | |
| ; PWR7-NEXT:    .cfi_offset lr, 16
 | |
| ; PWR7-NEXT:    mr r6, r4
 | |
| ; PWR7-NEXT:    mr r4, r3
 | |
| ; PWR7-NEXT:    mr r3, r5
 | |
| ; PWR7-NEXT:    mr r5, r6
 | |
| ; PWR7-NEXT:    li r6, 5
 | |
| ; PWR7-NEXT:    bl __atomic_store_16
 | |
| ; PWR7-NEXT:    nop
 | |
| ; PWR7-NEXT:    addi r1, r1, 112
 | |
| ; PWR7-NEXT:    ld r0, 16(r1)
 | |
| ; PWR7-NEXT:    mtlr r0
 | |
| ; PWR7-NEXT:    blr
 | |
| ;
 | |
| ; LE-PWR8-LABEL: stq_seqcst:
 | |
| ; LE-PWR8:       # %bb.0: # %entry
 | |
| ; LE-PWR8-NEXT:    sync
 | |
| ; LE-PWR8-NEXT:    mr r7, r3
 | |
| ; LE-PWR8-NEXT:    mr r6, r4
 | |
| ; LE-PWR8-NEXT:    stq r6, 0(r5)
 | |
| ; LE-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; AIX64-PWR8-LABEL: stq_seqcst:
 | |
| ; AIX64-PWR8:       # %bb.0: # %entry
 | |
| ; AIX64-PWR8-NEXT:    mflr r0
 | |
| ; AIX64-PWR8-NEXT:    std r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    stdu r1, -112(r1)
 | |
| ; AIX64-PWR8-NEXT:    mr r6, r4
 | |
| ; AIX64-PWR8-NEXT:    mr r4, r3
 | |
| ; AIX64-PWR8-NEXT:    mr r3, r5
 | |
| ; AIX64-PWR8-NEXT:    mr r5, r6
 | |
| ; AIX64-PWR8-NEXT:    li r6, 5
 | |
| ; AIX64-PWR8-NEXT:    bl .__atomic_store_16[PR]
 | |
| ; AIX64-PWR8-NEXT:    nop
 | |
| ; AIX64-PWR8-NEXT:    addi r1, r1, 112
 | |
| ; AIX64-PWR8-NEXT:    ld r0, 16(r1)
 | |
| ; AIX64-PWR8-NEXT:    mtlr r0
 | |
| ; AIX64-PWR8-NEXT:    blr
 | |
| ;
 | |
| ; PPC-PWR8-LABEL: stq_seqcst:
 | |
| ; PPC-PWR8:       # %bb.0: # %entry
 | |
| ; PPC-PWR8-NEXT:    mflr r0
 | |
| ; PPC-PWR8-NEXT:    stw r0, 4(r1)
 | |
| ; PPC-PWR8-NEXT:    stwu r1, -32(r1)
 | |
| ; PPC-PWR8-NEXT:    .cfi_def_cfa_offset 32
 | |
| ; PPC-PWR8-NEXT:    .cfi_offset lr, 4
 | |
| ; PPC-PWR8-NEXT:    stw r6, 28(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r5, 24(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r5, r1, 16
 | |
| ; PPC-PWR8-NEXT:    li r6, 5
 | |
| ; PPC-PWR8-NEXT:    stw r4, 20(r1)
 | |
| ; PPC-PWR8-NEXT:    stw r3, 16(r1)
 | |
| ; PPC-PWR8-NEXT:    li r3, 16
 | |
| ; PPC-PWR8-NEXT:    mr r4, r7
 | |
| ; PPC-PWR8-NEXT:    bl __atomic_store
 | |
| ; PPC-PWR8-NEXT:    lwz r0, 36(r1)
 | |
| ; PPC-PWR8-NEXT:    addi r1, r1, 32
 | |
| ; PPC-PWR8-NEXT:    mtlr r0
 | |
| ; PPC-PWR8-NEXT:    blr
 | |
| entry:
 | |
|   store atomic i128 %val, i128* %dst seq_cst, align 16
 | |
|   ret void
 | |
| }
 |