1824 lines
		
	
	
		
			70 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			1824 lines
		
	
	
		
			70 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
 | |
| ; RUN: llc < %s -mtriple=i386-pc-windows-msvc     -mattr=+avx512f,+avx512dq,+avx512vl | FileCheck %s --check-prefixes=CHECK,X32,AVX512_32,AVX512_32_WIN,AVX512DQVL_32_WIN
 | |
| ; RUN: llc < %s -mtriple=i386-unknown-linux-gnu   -mattr=+avx512f,+avx512dq,+avx512vl | FileCheck %s --check-prefixes=CHECK,X32,AVX512_32,AVX512_32_LIN,AVX512DQVL_32_LIN
 | |
| ; RUN: llc < %s -mtriple=x86_64-pc-windows-msvc   -mattr=+avx512f,+avx512dq,+avx512vl | FileCheck %s --check-prefixes=CHECK,X64,AVX512_64,AVX512_64_WIN,AVX512DQVL_64_WIN
 | |
| ; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=+avx512f,+avx512dq,+avx512vl | FileCheck %s --check-prefixes=CHECK,X32,AVX512_64,AVX512_64_LIN,AVX512DQVL_64_LIN
 | |
| ; RUN: llc < %s -mtriple=i386-pc-windows-msvc     -mattr=+avx512f,+avx512dq | FileCheck %s --check-prefixes=CHECK,X32,AVX512_32,AVX512_32_WIN,AVX512DQ_32_WIN
 | |
| ; RUN: llc < %s -mtriple=i386-unknown-linux-gnu   -mattr=+avx512f,+avx512dq | FileCheck %s --check-prefixes=CHECK,X32,AVX512_32,AVX512_32_LIN,AVX512DQ_32_LIN
 | |
| ; RUN: llc < %s -mtriple=x86_64-pc-windows-msvc   -mattr=+avx512f,+avx512dq | FileCheck %s --check-prefixes=CHECK,X64,AVX512_64,AVX512_64_WIN,AVX512DQ_64_WIN
 | |
| ; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=+avx512f,+avx512dq | FileCheck %s --check-prefixes=CHECK,X32,AVX512_64,AVX512_64_LIN,AVX512DQ_64_LIN
 | |
| ; RUN: llc < %s -mtriple=i386-pc-windows-msvc     -mattr=+avx512f | FileCheck %s --check-prefixes=CHECK,X32,AVX512_32,AVX512_32_WIN,AVX512F_32_WIN
 | |
| ; RUN: llc < %s -mtriple=i386-unknown-linux-gnu   -mattr=+avx512f | FileCheck %s --check-prefixes=CHECK,X32,AVX512_32,AVX512_32_LIN,AVX512F_32_LIN
 | |
| ; RUN: llc < %s -mtriple=x86_64-pc-windows-msvc   -mattr=+avx512f | FileCheck %s --check-prefixes=CHECK,X64,AVX512_64,AVX512_64_WIN,AVX512F_64_WIN
 | |
| ; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=+avx512f | FileCheck %s --check-prefixes=CHECK,X32,AVX512_64,AVX512_64_LIN,AVX512F_64_LIN
 | |
| ; RUN: llc < %s -mtriple=i386-pc-windows-msvc     -mattr=+sse3 | FileCheck %s --check-prefixes=CHECK,X32,SSE3_32,SSE3_32_WIN
 | |
| ; RUN: llc < %s -mtriple=i386-unknown-linux-gnu   -mattr=+sse3 | FileCheck %s --check-prefixes=CHECK,X32,SSE3_32,SSE3_32_LIN
 | |
| ; RUN: llc < %s -mtriple=x86_64-pc-windows-msvc   -mattr=+sse3 | FileCheck %s --check-prefixes=CHECK,X64,SSE3_64,SSE3_64_WIN
 | |
| ; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=+sse3 | FileCheck %s --check-prefixes=CHECK,X64,SSE3_64,SSE3_64_LIN
 | |
| ; RUN: llc < %s -mtriple=i386-pc-windows-msvc     -mattr=+sse2 | FileCheck %s --check-prefixes=CHECK,X32,SSE2_32,SSE2_32_WIN
 | |
| ; RUN: llc < %s -mtriple=i386-unknown-linux-gnu   -mattr=+sse2 | FileCheck %s --check-prefixes=CHECK,X32,SSE2_32,SSE2_32_LIN
 | |
| ; RUN: llc < %s -mtriple=x86_64-pc-windows-msvc   -mattr=+sse2 | FileCheck %s --check-prefixes=CHECK,X64,SSE2_64,SSE2_64_WIN
 | |
| ; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=+sse2 | FileCheck %s --check-prefixes=CHECK,X64,SSE2_64,SSE2_64_LIN
 | |
| ; RUN: llc < %s -mtriple=i386-pc-windows-msvc     -mattr=-sse  | FileCheck %s --check-prefixes=CHECK,X32,X87,X87_WIN
 | |
| ; RUN: llc < %s -mtriple=i386-unknown-linux-gnu   -mattr=-sse  | FileCheck %s --check-prefixes=CHECK,X32,X87,X87_LIN
 | |
| 
 | |
| ; Check that scalar FP conversions to signed and unsigned int64 are using
 | |
| ; reasonable sequences, across platforms and target switches.
 | |
| ;
 | |
| ; The signed case is straight forward, and the tests here basically
 | |
| ; ensure successful compilation (f80 with avx512 was broken at one point).
 | |
| ;
 | |
| ; For the unsigned case there are many possible sequences, so to avoid
 | |
| ; a fragile test we just check for the presence of a few key instructions.
 | |
| ; AVX512 on Intel64 can use vcvtts[ds]2usi directly for float and double.
 | |
| ; Otherwise the sequence will involve an FP subtract (fsub, subss or subsd),
 | |
| ; and a truncating conversion (cvtts[ds]2si, fisttp, or fnstcw+fist).  When
 | |
| ; both a subtract and fnstcw are needed, they can occur in either order.
 | |
| ;
 | |
| ; The interesting subtargets are AVX512F (vcvtts[ds]2usi), SSE3 (fisttp),
 | |
| ; SSE2 (cvtts[ds]2si) and vanilla X87 (fnstcw+fist, 32-bit only).
 | |
| 
 | |
| define i64 @f_to_u64(float %a) nounwind {
 | |
| ; AVX512DQVL_32_WIN-LABEL: f_to_u64:
 | |
| ; AVX512DQVL_32_WIN:       # %bb.0:
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vcvttps2uqq %xmm0, %ymm0
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vzeroupper
 | |
| ; AVX512DQVL_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512DQVL_32_LIN-LABEL: f_to_u64:
 | |
| ; AVX512DQVL_32_LIN:       # %bb.0:
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vcvttps2uqq %xmm0, %ymm0
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vzeroupper
 | |
| ; AVX512DQVL_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_64-LABEL: f_to_u64:
 | |
| ; AVX512_64:       # %bb.0:
 | |
| ; AVX512_64-NEXT:    vcvttss2usi %xmm0, %rax
 | |
| ; AVX512_64-NEXT:    retq
 | |
| ;
 | |
| ; AVX512DQ_32_WIN-LABEL: f_to_u64:
 | |
| ; AVX512DQ_32_WIN:       # %bb.0:
 | |
| ; AVX512DQ_32_WIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512DQ_32_WIN-NEXT:    vcvttps2uqq %ymm0, %zmm0
 | |
| ; AVX512DQ_32_WIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQ_32_WIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQ_32_WIN-NEXT:    vzeroupper
 | |
| ; AVX512DQ_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512DQ_32_LIN-LABEL: f_to_u64:
 | |
| ; AVX512DQ_32_LIN:       # %bb.0:
 | |
| ; AVX512DQ_32_LIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512DQ_32_LIN-NEXT:    vcvttps2uqq %ymm0, %zmm0
 | |
| ; AVX512DQ_32_LIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQ_32_LIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQ_32_LIN-NEXT:    vzeroupper
 | |
| ; AVX512DQ_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512F_32_WIN-LABEL: f_to_u64:
 | |
| ; AVX512F_32_WIN:       # %bb.0:
 | |
| ; AVX512F_32_WIN-NEXT:    pushl %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    subl $16, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512F_32_WIN-NEXT:    vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero
 | |
| ; AVX512F_32_WIN-NEXT:    vcmpltss %xmm1, %xmm0, %k1
 | |
| ; AVX512F_32_WIN-NEXT:    vsubss %xmm1, %xmm0, %xmm2
 | |
| ; AVX512F_32_WIN-NEXT:    vmovss %xmm0, %xmm0, %xmm2 {%k1}
 | |
| ; AVX512F_32_WIN-NEXT:    vmovss %xmm2, {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    xorl %edx, %edx
 | |
| ; AVX512F_32_WIN-NEXT:    vucomiss %xmm0, %xmm1
 | |
| ; AVX512F_32_WIN-NEXT:    setbe %dl
 | |
| ; AVX512F_32_WIN-NEXT:    shll $31, %edx
 | |
| ; AVX512F_32_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512F_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512F_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    popl %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512F_32_LIN-LABEL: f_to_u64:
 | |
| ; AVX512F_32_LIN:       # %bb.0:
 | |
| ; AVX512F_32_LIN-NEXT:    subl $20, %esp
 | |
| ; AVX512F_32_LIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512F_32_LIN-NEXT:    vmovss {{.*#+}} xmm1 = mem[0],zero,zero,zero
 | |
| ; AVX512F_32_LIN-NEXT:    vcmpltss %xmm1, %xmm0, %k1
 | |
| ; AVX512F_32_LIN-NEXT:    vsubss %xmm1, %xmm0, %xmm2
 | |
| ; AVX512F_32_LIN-NEXT:    vmovss %xmm0, %xmm0, %xmm2 {%k1}
 | |
| ; AVX512F_32_LIN-NEXT:    vmovss %xmm2, {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    xorl %edx, %edx
 | |
| ; AVX512F_32_LIN-NEXT:    vucomiss %xmm0, %xmm1
 | |
| ; AVX512F_32_LIN-NEXT:    setbe %dl
 | |
| ; AVX512F_32_LIN-NEXT:    shll $31, %edx
 | |
| ; AVX512F_32_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512F_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512F_32_LIN-NEXT:    addl $20, %esp
 | |
| ; AVX512F_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_WIN-LABEL: f_to_u64:
 | |
| ; SSE3_32_WIN:       # %bb.0:
 | |
| ; SSE3_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE3_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE3_32_WIN-NEXT:    subl $16, %esp
 | |
| ; SSE3_32_WIN-NEXT:    movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; SSE3_32_WIN-NEXT:    movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
 | |
| ; SSE3_32_WIN-NEXT:    movaps %xmm0, %xmm2
 | |
| ; SSE3_32_WIN-NEXT:    cmpltss %xmm1, %xmm2
 | |
| ; SSE3_32_WIN-NEXT:    movaps %xmm2, %xmm3
 | |
| ; SSE3_32_WIN-NEXT:    andps %xmm0, %xmm2
 | |
| ; SSE3_32_WIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE3_32_WIN-NEXT:    ucomiss %xmm0, %xmm1
 | |
| ; SSE3_32_WIN-NEXT:    subss %xmm1, %xmm0
 | |
| ; SSE3_32_WIN-NEXT:    andnps %xmm0, %xmm3
 | |
| ; SSE3_32_WIN-NEXT:    orps %xmm3, %xmm2
 | |
| ; SSE3_32_WIN-NEXT:    movss %xmm2, {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_WIN-NEXT:    setbe %dl
 | |
| ; SSE3_32_WIN-NEXT:    shll $31, %edx
 | |
| ; SSE3_32_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE3_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_LIN-LABEL: f_to_u64:
 | |
| ; SSE3_32_LIN:       # %bb.0:
 | |
| ; SSE3_32_LIN-NEXT:    subl $20, %esp
 | |
| ; SSE3_32_LIN-NEXT:    movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; SSE3_32_LIN-NEXT:    movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
 | |
| ; SSE3_32_LIN-NEXT:    movaps %xmm0, %xmm2
 | |
| ; SSE3_32_LIN-NEXT:    cmpltss %xmm1, %xmm2
 | |
| ; SSE3_32_LIN-NEXT:    movaps %xmm2, %xmm3
 | |
| ; SSE3_32_LIN-NEXT:    andps %xmm0, %xmm2
 | |
| ; SSE3_32_LIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE3_32_LIN-NEXT:    ucomiss %xmm0, %xmm1
 | |
| ; SSE3_32_LIN-NEXT:    subss %xmm1, %xmm0
 | |
| ; SSE3_32_LIN-NEXT:    andnps %xmm0, %xmm3
 | |
| ; SSE3_32_LIN-NEXT:    orps %xmm3, %xmm2
 | |
| ; SSE3_32_LIN-NEXT:    movss %xmm2, {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_LIN-NEXT:    setbe %dl
 | |
| ; SSE3_32_LIN-NEXT:    shll $31, %edx
 | |
| ; SSE3_32_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_LIN-NEXT:    addl $20, %esp
 | |
| ; SSE3_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_64-LABEL: f_to_u64:
 | |
| ; SSE3_64:       # %bb.0:
 | |
| ; SSE3_64-NEXT:    movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
 | |
| ; SSE3_64-NEXT:    movaps %xmm0, %xmm2
 | |
| ; SSE3_64-NEXT:    subss %xmm1, %xmm2
 | |
| ; SSE3_64-NEXT:    cvttss2si %xmm2, %rax
 | |
| ; SSE3_64-NEXT:    movabsq $-9223372036854775808, %rcx # imm = 0x8000000000000000
 | |
| ; SSE3_64-NEXT:    xorq %rax, %rcx
 | |
| ; SSE3_64-NEXT:    cvttss2si %xmm0, %rax
 | |
| ; SSE3_64-NEXT:    ucomiss %xmm1, %xmm0
 | |
| ; SSE3_64-NEXT:    cmovaeq %rcx, %rax
 | |
| ; SSE3_64-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_32_WIN-LABEL: f_to_u64:
 | |
| ; SSE2_32_WIN:       # %bb.0:
 | |
| ; SSE2_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE2_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE2_32_WIN-NEXT:    subl $24, %esp
 | |
| ; SSE2_32_WIN-NEXT:    movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; SSE2_32_WIN-NEXT:    movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
 | |
| ; SSE2_32_WIN-NEXT:    movaps %xmm0, %xmm2
 | |
| ; SSE2_32_WIN-NEXT:    cmpltss %xmm1, %xmm2
 | |
| ; SSE2_32_WIN-NEXT:    movaps %xmm2, %xmm3
 | |
| ; SSE2_32_WIN-NEXT:    andps %xmm0, %xmm2
 | |
| ; SSE2_32_WIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE2_32_WIN-NEXT:    ucomiss %xmm0, %xmm1
 | |
| ; SSE2_32_WIN-NEXT:    subss %xmm1, %xmm0
 | |
| ; SSE2_32_WIN-NEXT:    andnps %xmm0, %xmm3
 | |
| ; SSE2_32_WIN-NEXT:    orps %xmm3, %xmm2
 | |
| ; SSE2_32_WIN-NEXT:    movss %xmm2, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    setbe %dl
 | |
| ; SSE2_32_WIN-NEXT:    shll $31, %edx
 | |
| ; SSE2_32_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE2_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_32_LIN-LABEL: f_to_u64:
 | |
| ; SSE2_32_LIN:       # %bb.0:
 | |
| ; SSE2_32_LIN-NEXT:    subl $28, %esp
 | |
| ; SSE2_32_LIN-NEXT:    movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; SSE2_32_LIN-NEXT:    movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
 | |
| ; SSE2_32_LIN-NEXT:    movaps %xmm0, %xmm2
 | |
| ; SSE2_32_LIN-NEXT:    cmpltss %xmm1, %xmm2
 | |
| ; SSE2_32_LIN-NEXT:    movaps %xmm2, %xmm3
 | |
| ; SSE2_32_LIN-NEXT:    andps %xmm0, %xmm2
 | |
| ; SSE2_32_LIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE2_32_LIN-NEXT:    ucomiss %xmm0, %xmm1
 | |
| ; SSE2_32_LIN-NEXT:    subss %xmm1, %xmm0
 | |
| ; SSE2_32_LIN-NEXT:    andnps %xmm0, %xmm3
 | |
| ; SSE2_32_LIN-NEXT:    orps %xmm3, %xmm2
 | |
| ; SSE2_32_LIN-NEXT:    movss %xmm2, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    setbe %dl
 | |
| ; SSE2_32_LIN-NEXT:    shll $31, %edx
 | |
| ; SSE2_32_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    addl $28, %esp
 | |
| ; SSE2_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_64-LABEL: f_to_u64:
 | |
| ; SSE2_64:       # %bb.0:
 | |
| ; SSE2_64-NEXT:    movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
 | |
| ; SSE2_64-NEXT:    movaps %xmm0, %xmm2
 | |
| ; SSE2_64-NEXT:    subss %xmm1, %xmm2
 | |
| ; SSE2_64-NEXT:    cvttss2si %xmm2, %rax
 | |
| ; SSE2_64-NEXT:    movabsq $-9223372036854775808, %rcx # imm = 0x8000000000000000
 | |
| ; SSE2_64-NEXT:    xorq %rax, %rcx
 | |
| ; SSE2_64-NEXT:    cvttss2si %xmm0, %rax
 | |
| ; SSE2_64-NEXT:    ucomiss %xmm1, %xmm0
 | |
| ; SSE2_64-NEXT:    cmovaeq %rcx, %rax
 | |
| ; SSE2_64-NEXT:    retq
 | |
| ;
 | |
| ; X87_WIN-LABEL: f_to_u64:
 | |
| ; X87_WIN:       # %bb.0:
 | |
| ; X87_WIN-NEXT:    pushl %ebp
 | |
| ; X87_WIN-NEXT:    movl %esp, %ebp
 | |
| ; X87_WIN-NEXT:    andl $-8, %esp
 | |
| ; X87_WIN-NEXT:    subl $16, %esp
 | |
| ; X87_WIN-NEXT:    flds 8(%ebp)
 | |
| ; X87_WIN-NEXT:    flds __real@5f000000
 | |
| ; X87_WIN-NEXT:    fld %st(1)
 | |
| ; X87_WIN-NEXT:    fsub %st(1)
 | |
| ; X87_WIN-NEXT:    fxch %st(1)
 | |
| ; X87_WIN-NEXT:    fucomp %st(2)
 | |
| ; X87_WIN-NEXT:    fnstsw %ax
 | |
| ; X87_WIN-NEXT:    # kill: def $ah killed $ah killed $ax
 | |
| ; X87_WIN-NEXT:    sahf
 | |
| ; X87_WIN-NEXT:    ja LBB0_2
 | |
| ; X87_WIN-NEXT:  # %bb.1:
 | |
| ; X87_WIN-NEXT:    fstp %st(1)
 | |
| ; X87_WIN-NEXT:    fldz
 | |
| ; X87_WIN-NEXT:  LBB0_2:
 | |
| ; X87_WIN-NEXT:    fstp %st(0)
 | |
| ; X87_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    setbe %al
 | |
| ; X87_WIN-NEXT:    movzbl %al, %edx
 | |
| ; X87_WIN-NEXT:    shll $31, %edx
 | |
| ; X87_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movl %ebp, %esp
 | |
| ; X87_WIN-NEXT:    popl %ebp
 | |
| ; X87_WIN-NEXT:    retl
 | |
| ;
 | |
| ; X87_LIN-LABEL: f_to_u64:
 | |
| ; X87_LIN:       # %bb.0:
 | |
| ; X87_LIN-NEXT:    subl $20, %esp
 | |
| ; X87_LIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    flds {{\.LCPI.*}}
 | |
| ; X87_LIN-NEXT:    fld %st(1)
 | |
| ; X87_LIN-NEXT:    fsub %st(1)
 | |
| ; X87_LIN-NEXT:    fxch %st(1)
 | |
| ; X87_LIN-NEXT:    fucomp %st(2)
 | |
| ; X87_LIN-NEXT:    fnstsw %ax
 | |
| ; X87_LIN-NEXT:    # kill: def $ah killed $ah killed $ax
 | |
| ; X87_LIN-NEXT:    sahf
 | |
| ; X87_LIN-NEXT:    ja .LBB0_2
 | |
| ; X87_LIN-NEXT:  # %bb.1:
 | |
| ; X87_LIN-NEXT:    fstp %st(1)
 | |
| ; X87_LIN-NEXT:    fldz
 | |
| ; X87_LIN-NEXT:  .LBB0_2:
 | |
| ; X87_LIN-NEXT:    fstp %st(0)
 | |
| ; X87_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    setbe %al
 | |
| ; X87_LIN-NEXT:    movzbl %al, %edx
 | |
| ; X87_LIN-NEXT:    shll $31, %edx
 | |
| ; X87_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    addl $20, %esp
 | |
| ; X87_LIN-NEXT:    retl
 | |
|   %r = fptoui float %a to i64
 | |
|   ret i64 %r
 | |
| }
 | |
| 
 | |
| define i64 @f_to_s64(float %a) nounwind {
 | |
| ; AVX512DQVL_32_WIN-LABEL: f_to_s64:
 | |
| ; AVX512DQVL_32_WIN:       # %bb.0:
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vcvttps2qq %xmm0, %ymm0
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vzeroupper
 | |
| ; AVX512DQVL_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512DQVL_32_LIN-LABEL: f_to_s64:
 | |
| ; AVX512DQVL_32_LIN:       # %bb.0:
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vcvttps2qq %xmm0, %ymm0
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vzeroupper
 | |
| ; AVX512DQVL_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_64-LABEL: f_to_s64:
 | |
| ; AVX512_64:       # %bb.0:
 | |
| ; AVX512_64-NEXT:    vcvttss2si %xmm0, %rax
 | |
| ; AVX512_64-NEXT:    retq
 | |
| ;
 | |
| ; AVX512DQ_32_WIN-LABEL: f_to_s64:
 | |
| ; AVX512DQ_32_WIN:       # %bb.0:
 | |
| ; AVX512DQ_32_WIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512DQ_32_WIN-NEXT:    vcvttps2qq %ymm0, %zmm0
 | |
| ; AVX512DQ_32_WIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQ_32_WIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQ_32_WIN-NEXT:    vzeroupper
 | |
| ; AVX512DQ_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512DQ_32_LIN-LABEL: f_to_s64:
 | |
| ; AVX512DQ_32_LIN:       # %bb.0:
 | |
| ; AVX512DQ_32_LIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512DQ_32_LIN-NEXT:    vcvttps2qq %ymm0, %zmm0
 | |
| ; AVX512DQ_32_LIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQ_32_LIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQ_32_LIN-NEXT:    vzeroupper
 | |
| ; AVX512DQ_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512F_32_WIN-LABEL: f_to_s64:
 | |
| ; AVX512F_32_WIN:       # %bb.0:
 | |
| ; AVX512F_32_WIN-NEXT:    pushl %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    subl $16, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512F_32_WIN-NEXT:    vmovss %xmm0, {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512F_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512F_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    popl %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512F_32_LIN-LABEL: f_to_s64:
 | |
| ; AVX512F_32_LIN:       # %bb.0:
 | |
| ; AVX512F_32_LIN-NEXT:    subl $20, %esp
 | |
| ; AVX512F_32_LIN-NEXT:    vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; AVX512F_32_LIN-NEXT:    vmovss %xmm0, {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512F_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512F_32_LIN-NEXT:    addl $20, %esp
 | |
| ; AVX512F_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_WIN-LABEL: f_to_s64:
 | |
| ; SSE3_32_WIN:       # %bb.0:
 | |
| ; SSE3_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE3_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE3_32_WIN-NEXT:    subl $16, %esp
 | |
| ; SSE3_32_WIN-NEXT:    movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; SSE3_32_WIN-NEXT:    movss %xmm0, {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE3_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_LIN-LABEL: f_to_s64:
 | |
| ; SSE3_32_LIN:       # %bb.0:
 | |
| ; SSE3_32_LIN-NEXT:    subl $20, %esp
 | |
| ; SSE3_32_LIN-NEXT:    movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; SSE3_32_LIN-NEXT:    movss %xmm0, {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_LIN-NEXT:    addl $20, %esp
 | |
| ; SSE3_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_64-LABEL: f_to_s64:
 | |
| ; SSE3_64:       # %bb.0:
 | |
| ; SSE3_64-NEXT:    cvttss2si %xmm0, %rax
 | |
| ; SSE3_64-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_32_WIN-LABEL: f_to_s64:
 | |
| ; SSE2_32_WIN:       # %bb.0:
 | |
| ; SSE2_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE2_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE2_32_WIN-NEXT:    subl $24, %esp
 | |
| ; SSE2_32_WIN-NEXT:    movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; SSE2_32_WIN-NEXT:    movss %xmm0, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE2_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_32_LIN-LABEL: f_to_s64:
 | |
| ; SSE2_32_LIN:       # %bb.0:
 | |
| ; SSE2_32_LIN-NEXT:    subl $28, %esp
 | |
| ; SSE2_32_LIN-NEXT:    movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
 | |
| ; SSE2_32_LIN-NEXT:    movss %xmm0, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_LIN-NEXT:    addl $28, %esp
 | |
| ; SSE2_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_64-LABEL: f_to_s64:
 | |
| ; SSE2_64:       # %bb.0:
 | |
| ; SSE2_64-NEXT:    cvttss2si %xmm0, %rax
 | |
| ; SSE2_64-NEXT:    retq
 | |
| ;
 | |
| ; X87_WIN-LABEL: f_to_s64:
 | |
| ; X87_WIN:       # %bb.0:
 | |
| ; X87_WIN-NEXT:    pushl %ebp
 | |
| ; X87_WIN-NEXT:    movl %esp, %ebp
 | |
| ; X87_WIN-NEXT:    andl $-8, %esp
 | |
| ; X87_WIN-NEXT:    subl $16, %esp
 | |
| ; X87_WIN-NEXT:    flds 8(%ebp)
 | |
| ; X87_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_WIN-NEXT:    movl %ebp, %esp
 | |
| ; X87_WIN-NEXT:    popl %ebp
 | |
| ; X87_WIN-NEXT:    retl
 | |
| ;
 | |
| ; X87_LIN-LABEL: f_to_s64:
 | |
| ; X87_LIN:       # %bb.0:
 | |
| ; X87_LIN-NEXT:    subl $20, %esp
 | |
| ; X87_LIN-NEXT:    flds {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_LIN-NEXT:    addl $20, %esp
 | |
| ; X87_LIN-NEXT:    retl
 | |
|   %r = fptosi float %a to i64
 | |
|   ret i64 %r
 | |
| }
 | |
| 
 | |
| define i64 @d_to_u64(double %a) nounwind {
 | |
| ; AVX512DQVL_32_WIN-LABEL: d_to_u64:
 | |
| ; AVX512DQVL_32_WIN:       # %bb.0:
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vcvttpd2uqq %ymm0, %ymm0
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vzeroupper
 | |
| ; AVX512DQVL_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512DQVL_32_LIN-LABEL: d_to_u64:
 | |
| ; AVX512DQVL_32_LIN:       # %bb.0:
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vcvttpd2uqq %ymm0, %ymm0
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vzeroupper
 | |
| ; AVX512DQVL_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_64-LABEL: d_to_u64:
 | |
| ; AVX512_64:       # %bb.0:
 | |
| ; AVX512_64-NEXT:    vcvttsd2usi %xmm0, %rax
 | |
| ; AVX512_64-NEXT:    retq
 | |
| ;
 | |
| ; AVX512DQ_32_WIN-LABEL: d_to_u64:
 | |
| ; AVX512DQ_32_WIN:       # %bb.0:
 | |
| ; AVX512DQ_32_WIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512DQ_32_WIN-NEXT:    vcvttpd2uqq %zmm0, %zmm0
 | |
| ; AVX512DQ_32_WIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQ_32_WIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQ_32_WIN-NEXT:    vzeroupper
 | |
| ; AVX512DQ_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512DQ_32_LIN-LABEL: d_to_u64:
 | |
| ; AVX512DQ_32_LIN:       # %bb.0:
 | |
| ; AVX512DQ_32_LIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512DQ_32_LIN-NEXT:    vcvttpd2uqq %zmm0, %zmm0
 | |
| ; AVX512DQ_32_LIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQ_32_LIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQ_32_LIN-NEXT:    vzeroupper
 | |
| ; AVX512DQ_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512F_32_WIN-LABEL: d_to_u64:
 | |
| ; AVX512F_32_WIN:       # %bb.0:
 | |
| ; AVX512F_32_WIN-NEXT:    pushl %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    subl $16, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512F_32_WIN-NEXT:    vmovsd {{.*#+}} xmm1 = mem[0],zero
 | |
| ; AVX512F_32_WIN-NEXT:    vcmpltsd %xmm1, %xmm0, %k1
 | |
| ; AVX512F_32_WIN-NEXT:    vsubsd %xmm1, %xmm0, %xmm2
 | |
| ; AVX512F_32_WIN-NEXT:    vmovsd %xmm0, %xmm0, %xmm2 {%k1}
 | |
| ; AVX512F_32_WIN-NEXT:    vmovsd %xmm2, {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    xorl %edx, %edx
 | |
| ; AVX512F_32_WIN-NEXT:    vucomisd %xmm0, %xmm1
 | |
| ; AVX512F_32_WIN-NEXT:    setbe %dl
 | |
| ; AVX512F_32_WIN-NEXT:    shll $31, %edx
 | |
| ; AVX512F_32_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512F_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512F_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    popl %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512F_32_LIN-LABEL: d_to_u64:
 | |
| ; AVX512F_32_LIN:       # %bb.0:
 | |
| ; AVX512F_32_LIN-NEXT:    subl $20, %esp
 | |
| ; AVX512F_32_LIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512F_32_LIN-NEXT:    vmovsd {{.*#+}} xmm1 = mem[0],zero
 | |
| ; AVX512F_32_LIN-NEXT:    vcmpltsd %xmm1, %xmm0, %k1
 | |
| ; AVX512F_32_LIN-NEXT:    vsubsd %xmm1, %xmm0, %xmm2
 | |
| ; AVX512F_32_LIN-NEXT:    vmovsd %xmm0, %xmm0, %xmm2 {%k1}
 | |
| ; AVX512F_32_LIN-NEXT:    vmovsd %xmm2, {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    xorl %edx, %edx
 | |
| ; AVX512F_32_LIN-NEXT:    vucomisd %xmm0, %xmm1
 | |
| ; AVX512F_32_LIN-NEXT:    setbe %dl
 | |
| ; AVX512F_32_LIN-NEXT:    shll $31, %edx
 | |
| ; AVX512F_32_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512F_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512F_32_LIN-NEXT:    addl $20, %esp
 | |
| ; AVX512F_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_WIN-LABEL: d_to_u64:
 | |
| ; SSE3_32_WIN:       # %bb.0:
 | |
| ; SSE3_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE3_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE3_32_WIN-NEXT:    subl $16, %esp
 | |
| ; SSE3_32_WIN-NEXT:    movsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; SSE3_32_WIN-NEXT:    movsd {{.*#+}} xmm1 = mem[0],zero
 | |
| ; SSE3_32_WIN-NEXT:    movapd %xmm0, %xmm2
 | |
| ; SSE3_32_WIN-NEXT:    cmpltsd %xmm1, %xmm2
 | |
| ; SSE3_32_WIN-NEXT:    movapd %xmm2, %xmm3
 | |
| ; SSE3_32_WIN-NEXT:    andpd %xmm0, %xmm2
 | |
| ; SSE3_32_WIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE3_32_WIN-NEXT:    ucomisd %xmm0, %xmm1
 | |
| ; SSE3_32_WIN-NEXT:    subsd %xmm1, %xmm0
 | |
| ; SSE3_32_WIN-NEXT:    andnpd %xmm0, %xmm3
 | |
| ; SSE3_32_WIN-NEXT:    orpd %xmm3, %xmm2
 | |
| ; SSE3_32_WIN-NEXT:    movsd %xmm2, {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_WIN-NEXT:    setbe %dl
 | |
| ; SSE3_32_WIN-NEXT:    shll $31, %edx
 | |
| ; SSE3_32_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE3_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_LIN-LABEL: d_to_u64:
 | |
| ; SSE3_32_LIN:       # %bb.0:
 | |
| ; SSE3_32_LIN-NEXT:    subl $20, %esp
 | |
| ; SSE3_32_LIN-NEXT:    movsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; SSE3_32_LIN-NEXT:    movsd {{.*#+}} xmm1 = mem[0],zero
 | |
| ; SSE3_32_LIN-NEXT:    movapd %xmm0, %xmm2
 | |
| ; SSE3_32_LIN-NEXT:    cmpltsd %xmm1, %xmm2
 | |
| ; SSE3_32_LIN-NEXT:    movapd %xmm2, %xmm3
 | |
| ; SSE3_32_LIN-NEXT:    andpd %xmm0, %xmm2
 | |
| ; SSE3_32_LIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE3_32_LIN-NEXT:    ucomisd %xmm0, %xmm1
 | |
| ; SSE3_32_LIN-NEXT:    subsd %xmm1, %xmm0
 | |
| ; SSE3_32_LIN-NEXT:    andnpd %xmm0, %xmm3
 | |
| ; SSE3_32_LIN-NEXT:    orpd %xmm3, %xmm2
 | |
| ; SSE3_32_LIN-NEXT:    movsd %xmm2, {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_LIN-NEXT:    setbe %dl
 | |
| ; SSE3_32_LIN-NEXT:    shll $31, %edx
 | |
| ; SSE3_32_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_LIN-NEXT:    addl $20, %esp
 | |
| ; SSE3_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_64-LABEL: d_to_u64:
 | |
| ; SSE3_64:       # %bb.0:
 | |
| ; SSE3_64-NEXT:    movsd {{.*#+}} xmm1 = mem[0],zero
 | |
| ; SSE3_64-NEXT:    movapd %xmm0, %xmm2
 | |
| ; SSE3_64-NEXT:    subsd %xmm1, %xmm2
 | |
| ; SSE3_64-NEXT:    cvttsd2si %xmm2, %rax
 | |
| ; SSE3_64-NEXT:    movabsq $-9223372036854775808, %rcx # imm = 0x8000000000000000
 | |
| ; SSE3_64-NEXT:    xorq %rax, %rcx
 | |
| ; SSE3_64-NEXT:    cvttsd2si %xmm0, %rax
 | |
| ; SSE3_64-NEXT:    ucomisd %xmm1, %xmm0
 | |
| ; SSE3_64-NEXT:    cmovaeq %rcx, %rax
 | |
| ; SSE3_64-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_32_WIN-LABEL: d_to_u64:
 | |
| ; SSE2_32_WIN:       # %bb.0:
 | |
| ; SSE2_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE2_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE2_32_WIN-NEXT:    subl $24, %esp
 | |
| ; SSE2_32_WIN-NEXT:    movsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; SSE2_32_WIN-NEXT:    movsd {{.*#+}} xmm1 = mem[0],zero
 | |
| ; SSE2_32_WIN-NEXT:    movapd %xmm0, %xmm2
 | |
| ; SSE2_32_WIN-NEXT:    cmpltsd %xmm1, %xmm2
 | |
| ; SSE2_32_WIN-NEXT:    movapd %xmm2, %xmm3
 | |
| ; SSE2_32_WIN-NEXT:    andpd %xmm0, %xmm2
 | |
| ; SSE2_32_WIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE2_32_WIN-NEXT:    ucomisd %xmm0, %xmm1
 | |
| ; SSE2_32_WIN-NEXT:    subsd %xmm1, %xmm0
 | |
| ; SSE2_32_WIN-NEXT:    andnpd %xmm0, %xmm3
 | |
| ; SSE2_32_WIN-NEXT:    orpd %xmm3, %xmm2
 | |
| ; SSE2_32_WIN-NEXT:    movsd %xmm2, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    setbe %dl
 | |
| ; SSE2_32_WIN-NEXT:    shll $31, %edx
 | |
| ; SSE2_32_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE2_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_32_LIN-LABEL: d_to_u64:
 | |
| ; SSE2_32_LIN:       # %bb.0:
 | |
| ; SSE2_32_LIN-NEXT:    subl $28, %esp
 | |
| ; SSE2_32_LIN-NEXT:    movsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; SSE2_32_LIN-NEXT:    movsd {{.*#+}} xmm1 = mem[0],zero
 | |
| ; SSE2_32_LIN-NEXT:    movapd %xmm0, %xmm2
 | |
| ; SSE2_32_LIN-NEXT:    cmpltsd %xmm1, %xmm2
 | |
| ; SSE2_32_LIN-NEXT:    movapd %xmm2, %xmm3
 | |
| ; SSE2_32_LIN-NEXT:    andpd %xmm0, %xmm2
 | |
| ; SSE2_32_LIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE2_32_LIN-NEXT:    ucomisd %xmm0, %xmm1
 | |
| ; SSE2_32_LIN-NEXT:    subsd %xmm1, %xmm0
 | |
| ; SSE2_32_LIN-NEXT:    andnpd %xmm0, %xmm3
 | |
| ; SSE2_32_LIN-NEXT:    orpd %xmm3, %xmm2
 | |
| ; SSE2_32_LIN-NEXT:    movsd %xmm2, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    setbe %dl
 | |
| ; SSE2_32_LIN-NEXT:    shll $31, %edx
 | |
| ; SSE2_32_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    addl $28, %esp
 | |
| ; SSE2_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_64-LABEL: d_to_u64:
 | |
| ; SSE2_64:       # %bb.0:
 | |
| ; SSE2_64-NEXT:    movsd {{.*#+}} xmm1 = mem[0],zero
 | |
| ; SSE2_64-NEXT:    movapd %xmm0, %xmm2
 | |
| ; SSE2_64-NEXT:    subsd %xmm1, %xmm2
 | |
| ; SSE2_64-NEXT:    cvttsd2si %xmm2, %rax
 | |
| ; SSE2_64-NEXT:    movabsq $-9223372036854775808, %rcx # imm = 0x8000000000000000
 | |
| ; SSE2_64-NEXT:    xorq %rax, %rcx
 | |
| ; SSE2_64-NEXT:    cvttsd2si %xmm0, %rax
 | |
| ; SSE2_64-NEXT:    ucomisd %xmm1, %xmm0
 | |
| ; SSE2_64-NEXT:    cmovaeq %rcx, %rax
 | |
| ; SSE2_64-NEXT:    retq
 | |
| ;
 | |
| ; X87_WIN-LABEL: d_to_u64:
 | |
| ; X87_WIN:       # %bb.0:
 | |
| ; X87_WIN-NEXT:    pushl %ebp
 | |
| ; X87_WIN-NEXT:    movl %esp, %ebp
 | |
| ; X87_WIN-NEXT:    andl $-8, %esp
 | |
| ; X87_WIN-NEXT:    subl $16, %esp
 | |
| ; X87_WIN-NEXT:    fldl 8(%ebp)
 | |
| ; X87_WIN-NEXT:    flds __real@5f000000
 | |
| ; X87_WIN-NEXT:    fld %st(1)
 | |
| ; X87_WIN-NEXT:    fsub %st(1)
 | |
| ; X87_WIN-NEXT:    fxch %st(1)
 | |
| ; X87_WIN-NEXT:    fucomp %st(2)
 | |
| ; X87_WIN-NEXT:    fnstsw %ax
 | |
| ; X87_WIN-NEXT:    # kill: def $ah killed $ah killed $ax
 | |
| ; X87_WIN-NEXT:    sahf
 | |
| ; X87_WIN-NEXT:    ja LBB2_2
 | |
| ; X87_WIN-NEXT:  # %bb.1:
 | |
| ; X87_WIN-NEXT:    fstp %st(1)
 | |
| ; X87_WIN-NEXT:    fldz
 | |
| ; X87_WIN-NEXT:  LBB2_2:
 | |
| ; X87_WIN-NEXT:    fstp %st(0)
 | |
| ; X87_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    setbe %al
 | |
| ; X87_WIN-NEXT:    movzbl %al, %edx
 | |
| ; X87_WIN-NEXT:    shll $31, %edx
 | |
| ; X87_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movl %ebp, %esp
 | |
| ; X87_WIN-NEXT:    popl %ebp
 | |
| ; X87_WIN-NEXT:    retl
 | |
| ;
 | |
| ; X87_LIN-LABEL: d_to_u64:
 | |
| ; X87_LIN:       # %bb.0:
 | |
| ; X87_LIN-NEXT:    subl $20, %esp
 | |
| ; X87_LIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    flds {{\.LCPI.*}}
 | |
| ; X87_LIN-NEXT:    fld %st(1)
 | |
| ; X87_LIN-NEXT:    fsub %st(1)
 | |
| ; X87_LIN-NEXT:    fxch %st(1)
 | |
| ; X87_LIN-NEXT:    fucomp %st(2)
 | |
| ; X87_LIN-NEXT:    fnstsw %ax
 | |
| ; X87_LIN-NEXT:    # kill: def $ah killed $ah killed $ax
 | |
| ; X87_LIN-NEXT:    sahf
 | |
| ; X87_LIN-NEXT:    ja .LBB2_2
 | |
| ; X87_LIN-NEXT:  # %bb.1:
 | |
| ; X87_LIN-NEXT:    fstp %st(1)
 | |
| ; X87_LIN-NEXT:    fldz
 | |
| ; X87_LIN-NEXT:  .LBB2_2:
 | |
| ; X87_LIN-NEXT:    fstp %st(0)
 | |
| ; X87_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    setbe %al
 | |
| ; X87_LIN-NEXT:    movzbl %al, %edx
 | |
| ; X87_LIN-NEXT:    shll $31, %edx
 | |
| ; X87_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    addl $20, %esp
 | |
| ; X87_LIN-NEXT:    retl
 | |
|   %r = fptoui double %a to i64
 | |
|   ret i64 %r
 | |
| }
 | |
| 
 | |
| define i64 @d_to_s64(double %a) nounwind {
 | |
| ; AVX512DQVL_32_WIN-LABEL: d_to_s64:
 | |
| ; AVX512DQVL_32_WIN:       # %bb.0:
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vcvttpd2qq %ymm0, %ymm0
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQVL_32_WIN-NEXT:    vzeroupper
 | |
| ; AVX512DQVL_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512DQVL_32_LIN-LABEL: d_to_s64:
 | |
| ; AVX512DQVL_32_LIN:       # %bb.0:
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vcvttpd2qq %ymm0, %ymm0
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQVL_32_LIN-NEXT:    vzeroupper
 | |
| ; AVX512DQVL_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_64-LABEL: d_to_s64:
 | |
| ; AVX512_64:       # %bb.0:
 | |
| ; AVX512_64-NEXT:    vcvttsd2si %xmm0, %rax
 | |
| ; AVX512_64-NEXT:    retq
 | |
| ;
 | |
| ; AVX512DQ_32_WIN-LABEL: d_to_s64:
 | |
| ; AVX512DQ_32_WIN:       # %bb.0:
 | |
| ; AVX512DQ_32_WIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512DQ_32_WIN-NEXT:    vcvttpd2qq %zmm0, %zmm0
 | |
| ; AVX512DQ_32_WIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQ_32_WIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQ_32_WIN-NEXT:    vzeroupper
 | |
| ; AVX512DQ_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512DQ_32_LIN-LABEL: d_to_s64:
 | |
| ; AVX512DQ_32_LIN:       # %bb.0:
 | |
| ; AVX512DQ_32_LIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512DQ_32_LIN-NEXT:    vcvttpd2qq %zmm0, %zmm0
 | |
| ; AVX512DQ_32_LIN-NEXT:    vmovd %xmm0, %eax
 | |
| ; AVX512DQ_32_LIN-NEXT:    vpextrd $1, %xmm0, %edx
 | |
| ; AVX512DQ_32_LIN-NEXT:    vzeroupper
 | |
| ; AVX512DQ_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512F_32_WIN-LABEL: d_to_s64:
 | |
| ; AVX512F_32_WIN:       # %bb.0:
 | |
| ; AVX512F_32_WIN-NEXT:    pushl %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    subl $16, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512F_32_WIN-NEXT:    vmovsd %xmm0, {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512F_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512F_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512F_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; AVX512F_32_WIN-NEXT:    popl %ebp
 | |
| ; AVX512F_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512F_32_LIN-LABEL: d_to_s64:
 | |
| ; AVX512F_32_LIN:       # %bb.0:
 | |
| ; AVX512F_32_LIN-NEXT:    subl $20, %esp
 | |
| ; AVX512F_32_LIN-NEXT:    vmovsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; AVX512F_32_LIN-NEXT:    vmovsd %xmm0, {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512F_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512F_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512F_32_LIN-NEXT:    addl $20, %esp
 | |
| ; AVX512F_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_WIN-LABEL: d_to_s64:
 | |
| ; SSE3_32_WIN:       # %bb.0:
 | |
| ; SSE3_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE3_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE3_32_WIN-NEXT:    subl $16, %esp
 | |
| ; SSE3_32_WIN-NEXT:    movsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; SSE3_32_WIN-NEXT:    movsd %xmm0, {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE3_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_LIN-LABEL: d_to_s64:
 | |
| ; SSE3_32_LIN:       # %bb.0:
 | |
| ; SSE3_32_LIN-NEXT:    subl $20, %esp
 | |
| ; SSE3_32_LIN-NEXT:    movsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; SSE3_32_LIN-NEXT:    movsd %xmm0, {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_LIN-NEXT:    addl $20, %esp
 | |
| ; SSE3_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_64-LABEL: d_to_s64:
 | |
| ; SSE3_64:       # %bb.0:
 | |
| ; SSE3_64-NEXT:    cvttsd2si %xmm0, %rax
 | |
| ; SSE3_64-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_32_WIN-LABEL: d_to_s64:
 | |
| ; SSE2_32_WIN:       # %bb.0:
 | |
| ; SSE2_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE2_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE2_32_WIN-NEXT:    subl $24, %esp
 | |
| ; SSE2_32_WIN-NEXT:    movsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; SSE2_32_WIN-NEXT:    movsd %xmm0, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE2_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_32_LIN-LABEL: d_to_s64:
 | |
| ; SSE2_32_LIN:       # %bb.0:
 | |
| ; SSE2_32_LIN-NEXT:    subl $28, %esp
 | |
| ; SSE2_32_LIN-NEXT:    movsd {{.*#+}} xmm0 = mem[0],zero
 | |
| ; SSE2_32_LIN-NEXT:    movsd %xmm0, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_LIN-NEXT:    addl $28, %esp
 | |
| ; SSE2_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_64-LABEL: d_to_s64:
 | |
| ; SSE2_64:       # %bb.0:
 | |
| ; SSE2_64-NEXT:    cvttsd2si %xmm0, %rax
 | |
| ; SSE2_64-NEXT:    retq
 | |
| ;
 | |
| ; X87_WIN-LABEL: d_to_s64:
 | |
| ; X87_WIN:       # %bb.0:
 | |
| ; X87_WIN-NEXT:    pushl %ebp
 | |
| ; X87_WIN-NEXT:    movl %esp, %ebp
 | |
| ; X87_WIN-NEXT:    andl $-8, %esp
 | |
| ; X87_WIN-NEXT:    subl $16, %esp
 | |
| ; X87_WIN-NEXT:    fldl 8(%ebp)
 | |
| ; X87_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_WIN-NEXT:    movl %ebp, %esp
 | |
| ; X87_WIN-NEXT:    popl %ebp
 | |
| ; X87_WIN-NEXT:    retl
 | |
| ;
 | |
| ; X87_LIN-LABEL: d_to_s64:
 | |
| ; X87_LIN:       # %bb.0:
 | |
| ; X87_LIN-NEXT:    subl $20, %esp
 | |
| ; X87_LIN-NEXT:    fldl {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_LIN-NEXT:    addl $20, %esp
 | |
| ; X87_LIN-NEXT:    retl
 | |
|   %r = fptosi double %a to i64
 | |
|   ret i64 %r
 | |
| }
 | |
| 
 | |
| define i64 @x_to_u64(x86_fp80 %a) nounwind {
 | |
| ; AVX512_32_WIN-LABEL: x_to_u64:
 | |
| ; AVX512_32_WIN:       # %bb.0:
 | |
| ; AVX512_32_WIN-NEXT:    pushl %ebp
 | |
| ; AVX512_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; AVX512_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; AVX512_32_WIN-NEXT:    subl $8, %esp
 | |
| ; AVX512_32_WIN-NEXT:    fldt 8(%ebp)
 | |
| ; AVX512_32_WIN-NEXT:    flds __real@5f000000
 | |
| ; AVX512_32_WIN-NEXT:    fld %st(1)
 | |
| ; AVX512_32_WIN-NEXT:    fsub %st(1)
 | |
| ; AVX512_32_WIN-NEXT:    xorl %edx, %edx
 | |
| ; AVX512_32_WIN-NEXT:    fxch %st(1)
 | |
| ; AVX512_32_WIN-NEXT:    fucompi %st(2)
 | |
| ; AVX512_32_WIN-NEXT:    fcmovnbe %st(1), %st(0)
 | |
| ; AVX512_32_WIN-NEXT:    fstp %st(1)
 | |
| ; AVX512_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512_32_WIN-NEXT:    setbe %dl
 | |
| ; AVX512_32_WIN-NEXT:    shll $31, %edx
 | |
| ; AVX512_32_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; AVX512_32_WIN-NEXT:    popl %ebp
 | |
| ; AVX512_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_32_LIN-LABEL: x_to_u64:
 | |
| ; AVX512_32_LIN:       # %bb.0:
 | |
| ; AVX512_32_LIN-NEXT:    subl $12, %esp
 | |
| ; AVX512_32_LIN-NEXT:    fldt {{[0-9]+}}(%esp)
 | |
| ; AVX512_32_LIN-NEXT:    flds {{\.LCPI.*}}
 | |
| ; AVX512_32_LIN-NEXT:    fld %st(1)
 | |
| ; AVX512_32_LIN-NEXT:    fsub %st(1)
 | |
| ; AVX512_32_LIN-NEXT:    xorl %edx, %edx
 | |
| ; AVX512_32_LIN-NEXT:    fxch %st(1)
 | |
| ; AVX512_32_LIN-NEXT:    fucompi %st(2)
 | |
| ; AVX512_32_LIN-NEXT:    fcmovnbe %st(1), %st(0)
 | |
| ; AVX512_32_LIN-NEXT:    fstp %st(1)
 | |
| ; AVX512_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512_32_LIN-NEXT:    setbe %dl
 | |
| ; AVX512_32_LIN-NEXT:    shll $31, %edx
 | |
| ; AVX512_32_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512_32_LIN-NEXT:    addl $12, %esp
 | |
| ; AVX512_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_64_WIN-LABEL: x_to_u64:
 | |
| ; AVX512_64_WIN:       # %bb.0:
 | |
| ; AVX512_64_WIN-NEXT:    pushq %rax
 | |
| ; AVX512_64_WIN-NEXT:    fldt (%rcx)
 | |
| ; AVX512_64_WIN-NEXT:    flds __real@{{.*}}(%rip)
 | |
| ; AVX512_64_WIN-NEXT:    fld %st(1)
 | |
| ; AVX512_64_WIN-NEXT:    fsub %st(1)
 | |
| ; AVX512_64_WIN-NEXT:    xorl %ecx, %ecx
 | |
| ; AVX512_64_WIN-NEXT:    fxch %st(1)
 | |
| ; AVX512_64_WIN-NEXT:    fucompi %st(2)
 | |
| ; AVX512_64_WIN-NEXT:    fcmovnbe %st(1), %st(0)
 | |
| ; AVX512_64_WIN-NEXT:    fstp %st(1)
 | |
| ; AVX512_64_WIN-NEXT:    fisttpll (%rsp)
 | |
| ; AVX512_64_WIN-NEXT:    setbe %cl
 | |
| ; AVX512_64_WIN-NEXT:    shll $31, %ecx
 | |
| ; AVX512_64_WIN-NEXT:    xorl {{[0-9]+}}(%rsp), %ecx
 | |
| ; AVX512_64_WIN-NEXT:    shlq $32, %rcx
 | |
| ; AVX512_64_WIN-NEXT:    movl (%rsp), %eax
 | |
| ; AVX512_64_WIN-NEXT:    orq %rcx, %rax
 | |
| ; AVX512_64_WIN-NEXT:    popq %rcx
 | |
| ; AVX512_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; AVX512_64_LIN-LABEL: x_to_u64:
 | |
| ; AVX512_64_LIN:       # %bb.0:
 | |
| ; AVX512_64_LIN-NEXT:    fldt {{[0-9]+}}(%rsp)
 | |
| ; AVX512_64_LIN-NEXT:    flds {{.*}}(%rip)
 | |
| ; AVX512_64_LIN-NEXT:    fld %st(1)
 | |
| ; AVX512_64_LIN-NEXT:    fsub %st(1)
 | |
| ; AVX512_64_LIN-NEXT:    xorl %ecx, %ecx
 | |
| ; AVX512_64_LIN-NEXT:    fxch %st(1)
 | |
| ; AVX512_64_LIN-NEXT:    fucompi %st(2)
 | |
| ; AVX512_64_LIN-NEXT:    fcmovnbe %st(1), %st(0)
 | |
| ; AVX512_64_LIN-NEXT:    fstp %st(1)
 | |
| ; AVX512_64_LIN-NEXT:    fisttpll -{{[0-9]+}}(%rsp)
 | |
| ; AVX512_64_LIN-NEXT:    setbe %cl
 | |
| ; AVX512_64_LIN-NEXT:    shll $31, %ecx
 | |
| ; AVX512_64_LIN-NEXT:    xorl -{{[0-9]+}}(%rsp), %ecx
 | |
| ; AVX512_64_LIN-NEXT:    shlq $32, %rcx
 | |
| ; AVX512_64_LIN-NEXT:    movl -{{[0-9]+}}(%rsp), %eax
 | |
| ; AVX512_64_LIN-NEXT:    orq %rcx, %rax
 | |
| ; AVX512_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE3_32_WIN-LABEL: x_to_u64:
 | |
| ; SSE3_32_WIN:       # %bb.0:
 | |
| ; SSE3_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE3_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE3_32_WIN-NEXT:    subl $8, %esp
 | |
| ; SSE3_32_WIN-NEXT:    fldt 8(%ebp)
 | |
| ; SSE3_32_WIN-NEXT:    flds __real@5f000000
 | |
| ; SSE3_32_WIN-NEXT:    fld %st(1)
 | |
| ; SSE3_32_WIN-NEXT:    fsub %st(1)
 | |
| ; SSE3_32_WIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE3_32_WIN-NEXT:    fxch %st(1)
 | |
| ; SSE3_32_WIN-NEXT:    fucompi %st(2)
 | |
| ; SSE3_32_WIN-NEXT:    fcmovnbe %st(1), %st(0)
 | |
| ; SSE3_32_WIN-NEXT:    fstp %st(1)
 | |
| ; SSE3_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_WIN-NEXT:    setbe %dl
 | |
| ; SSE3_32_WIN-NEXT:    shll $31, %edx
 | |
| ; SSE3_32_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE3_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_LIN-LABEL: x_to_u64:
 | |
| ; SSE3_32_LIN:       # %bb.0:
 | |
| ; SSE3_32_LIN-NEXT:    subl $12, %esp
 | |
| ; SSE3_32_LIN-NEXT:    fldt {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    flds {{\.LCPI.*}}
 | |
| ; SSE3_32_LIN-NEXT:    fld %st(1)
 | |
| ; SSE3_32_LIN-NEXT:    fsub %st(1)
 | |
| ; SSE3_32_LIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE3_32_LIN-NEXT:    fxch %st(1)
 | |
| ; SSE3_32_LIN-NEXT:    fucompi %st(2)
 | |
| ; SSE3_32_LIN-NEXT:    fcmovnbe %st(1), %st(0)
 | |
| ; SSE3_32_LIN-NEXT:    fstp %st(1)
 | |
| ; SSE3_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_LIN-NEXT:    setbe %dl
 | |
| ; SSE3_32_LIN-NEXT:    shll $31, %edx
 | |
| ; SSE3_32_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_LIN-NEXT:    addl $12, %esp
 | |
| ; SSE3_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_64_WIN-LABEL: x_to_u64:
 | |
| ; SSE3_64_WIN:       # %bb.0:
 | |
| ; SSE3_64_WIN-NEXT:    subq $16, %rsp
 | |
| ; SSE3_64_WIN-NEXT:    fldt (%rcx)
 | |
| ; SSE3_64_WIN-NEXT:    flds __real@{{.*}}(%rip)
 | |
| ; SSE3_64_WIN-NEXT:    fld %st(1)
 | |
| ; SSE3_64_WIN-NEXT:    fsub %st(1)
 | |
| ; SSE3_64_WIN-NEXT:    fisttpll {{[0-9]+}}(%rsp)
 | |
| ; SSE3_64_WIN-NEXT:    fld %st(1)
 | |
| ; SSE3_64_WIN-NEXT:    fisttpll (%rsp)
 | |
| ; SSE3_64_WIN-NEXT:    fucompi %st(1)
 | |
| ; SSE3_64_WIN-NEXT:    fstp %st(0)
 | |
| ; SSE3_64_WIN-NEXT:    jbe .LBB4_1
 | |
| ; SSE3_64_WIN-NEXT:  # %bb.2:
 | |
| ; SSE3_64_WIN-NEXT:    movq (%rsp), %rax
 | |
| ; SSE3_64_WIN-NEXT:    addq $16, %rsp
 | |
| ; SSE3_64_WIN-NEXT:    retq
 | |
| ; SSE3_64_WIN-NEXT:  .LBB4_1:
 | |
| ; SSE3_64_WIN-NEXT:    movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
 | |
| ; SSE3_64_WIN-NEXT:    xorq {{[0-9]+}}(%rsp), %rax
 | |
| ; SSE3_64_WIN-NEXT:    addq $16, %rsp
 | |
| ; SSE3_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE3_64_LIN-LABEL: x_to_u64:
 | |
| ; SSE3_64_LIN:       # %bb.0:
 | |
| ; SSE3_64_LIN-NEXT:    fldt {{[0-9]+}}(%rsp)
 | |
| ; SSE3_64_LIN-NEXT:    flds {{.*}}(%rip)
 | |
| ; SSE3_64_LIN-NEXT:    fld %st(1)
 | |
| ; SSE3_64_LIN-NEXT:    fsub %st(1)
 | |
| ; SSE3_64_LIN-NEXT:    fisttpll -{{[0-9]+}}(%rsp)
 | |
| ; SSE3_64_LIN-NEXT:    fld %st(1)
 | |
| ; SSE3_64_LIN-NEXT:    fisttpll -{{[0-9]+}}(%rsp)
 | |
| ; SSE3_64_LIN-NEXT:    fucompi %st(1)
 | |
| ; SSE3_64_LIN-NEXT:    fstp %st(0)
 | |
| ; SSE3_64_LIN-NEXT:    jbe .LBB4_1
 | |
| ; SSE3_64_LIN-NEXT:  # %bb.2:
 | |
| ; SSE3_64_LIN-NEXT:    movq -{{[0-9]+}}(%rsp), %rax
 | |
| ; SSE3_64_LIN-NEXT:    retq
 | |
| ; SSE3_64_LIN-NEXT:  .LBB4_1:
 | |
| ; SSE3_64_LIN-NEXT:    movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
 | |
| ; SSE3_64_LIN-NEXT:    xorq -{{[0-9]+}}(%rsp), %rax
 | |
| ; SSE3_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_32_WIN-LABEL: x_to_u64:
 | |
| ; SSE2_32_WIN:       # %bb.0:
 | |
| ; SSE2_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE2_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE2_32_WIN-NEXT:    subl $16, %esp
 | |
| ; SSE2_32_WIN-NEXT:    fldt 8(%ebp)
 | |
| ; SSE2_32_WIN-NEXT:    flds __real@5f000000
 | |
| ; SSE2_32_WIN-NEXT:    fld %st(1)
 | |
| ; SSE2_32_WIN-NEXT:    fsub %st(1)
 | |
| ; SSE2_32_WIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE2_32_WIN-NEXT:    fxch %st(1)
 | |
| ; SSE2_32_WIN-NEXT:    fucompi %st(2)
 | |
| ; SSE2_32_WIN-NEXT:    fcmovnbe %st(1), %st(0)
 | |
| ; SSE2_32_WIN-NEXT:    fstp %st(1)
 | |
| ; SSE2_32_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    setbe %dl
 | |
| ; SSE2_32_WIN-NEXT:    shll $31, %edx
 | |
| ; SSE2_32_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE2_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_32_LIN-LABEL: x_to_u64:
 | |
| ; SSE2_32_LIN:       # %bb.0:
 | |
| ; SSE2_32_LIN-NEXT:    subl $20, %esp
 | |
| ; SSE2_32_LIN-NEXT:    fldt {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    flds {{\.LCPI.*}}
 | |
| ; SSE2_32_LIN-NEXT:    fld %st(1)
 | |
| ; SSE2_32_LIN-NEXT:    fsub %st(1)
 | |
| ; SSE2_32_LIN-NEXT:    xorl %edx, %edx
 | |
| ; SSE2_32_LIN-NEXT:    fxch %st(1)
 | |
| ; SSE2_32_LIN-NEXT:    fucompi %st(2)
 | |
| ; SSE2_32_LIN-NEXT:    fcmovnbe %st(1), %st(0)
 | |
| ; SSE2_32_LIN-NEXT:    fstp %st(1)
 | |
| ; SSE2_32_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    setbe %dl
 | |
| ; SSE2_32_LIN-NEXT:    shll $31, %edx
 | |
| ; SSE2_32_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    addl $20, %esp
 | |
| ; SSE2_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_64_WIN-LABEL: x_to_u64:
 | |
| ; SSE2_64_WIN:       # %bb.0:
 | |
| ; SSE2_64_WIN-NEXT:    subq $24, %rsp
 | |
| ; SSE2_64_WIN-NEXT:    fldt (%rcx)
 | |
| ; SSE2_64_WIN-NEXT:    flds __real@{{.*}}(%rip)
 | |
| ; SSE2_64_WIN-NEXT:    fld %st(1)
 | |
| ; SSE2_64_WIN-NEXT:    fsub %st(1)
 | |
| ; SSE2_64_WIN-NEXT:    fnstcw {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    movzwl {{[0-9]+}}(%rsp), %eax
 | |
| ; SSE2_64_WIN-NEXT:    movw $3199, {{[0-9]+}}(%rsp) # imm = 0xC7F
 | |
| ; SSE2_64_WIN-NEXT:    fldcw {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    movw %ax, {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    fistpll {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    fldcw {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    fnstcw {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    movzwl {{[0-9]+}}(%rsp), %eax
 | |
| ; SSE2_64_WIN-NEXT:    movw $3199, {{[0-9]+}}(%rsp) # imm = 0xC7F
 | |
| ; SSE2_64_WIN-NEXT:    fldcw {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    movw %ax, {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    fld %st(1)
 | |
| ; SSE2_64_WIN-NEXT:    fistpll {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    fldcw {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    fucompi %st(1)
 | |
| ; SSE2_64_WIN-NEXT:    fstp %st(0)
 | |
| ; SSE2_64_WIN-NEXT:    jbe .LBB4_1
 | |
| ; SSE2_64_WIN-NEXT:  # %bb.2:
 | |
| ; SSE2_64_WIN-NEXT:    movq {{[0-9]+}}(%rsp), %rax
 | |
| ; SSE2_64_WIN-NEXT:    addq $24, %rsp
 | |
| ; SSE2_64_WIN-NEXT:    retq
 | |
| ; SSE2_64_WIN-NEXT:  .LBB4_1:
 | |
| ; SSE2_64_WIN-NEXT:    movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
 | |
| ; SSE2_64_WIN-NEXT:    xorq {{[0-9]+}}(%rsp), %rax
 | |
| ; SSE2_64_WIN-NEXT:    addq $24, %rsp
 | |
| ; SSE2_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_64_LIN-LABEL: x_to_u64:
 | |
| ; SSE2_64_LIN:       # %bb.0:
 | |
| ; SSE2_64_LIN-NEXT:    fldt {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    flds {{.*}}(%rip)
 | |
| ; SSE2_64_LIN-NEXT:    fld %st(1)
 | |
| ; SSE2_64_LIN-NEXT:    fsub %st(1)
 | |
| ; SSE2_64_LIN-NEXT:    fnstcw -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    movzwl -{{[0-9]+}}(%rsp), %eax
 | |
| ; SSE2_64_LIN-NEXT:    movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F
 | |
| ; SSE2_64_LIN-NEXT:    fldcw -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    movw %ax, -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    fistpll -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    fldcw -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    fnstcw -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    movzwl -{{[0-9]+}}(%rsp), %eax
 | |
| ; SSE2_64_LIN-NEXT:    movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F
 | |
| ; SSE2_64_LIN-NEXT:    fldcw -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    movw %ax, -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    fld %st(1)
 | |
| ; SSE2_64_LIN-NEXT:    fistpll -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    fldcw -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    fucompi %st(1)
 | |
| ; SSE2_64_LIN-NEXT:    fstp %st(0)
 | |
| ; SSE2_64_LIN-NEXT:    jbe .LBB4_1
 | |
| ; SSE2_64_LIN-NEXT:  # %bb.2:
 | |
| ; SSE2_64_LIN-NEXT:    movq -{{[0-9]+}}(%rsp), %rax
 | |
| ; SSE2_64_LIN-NEXT:    retq
 | |
| ; SSE2_64_LIN-NEXT:  .LBB4_1:
 | |
| ; SSE2_64_LIN-NEXT:    movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
 | |
| ; SSE2_64_LIN-NEXT:    xorq -{{[0-9]+}}(%rsp), %rax
 | |
| ; SSE2_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; X87_WIN-LABEL: x_to_u64:
 | |
| ; X87_WIN:       # %bb.0:
 | |
| ; X87_WIN-NEXT:    pushl %ebp
 | |
| ; X87_WIN-NEXT:    movl %esp, %ebp
 | |
| ; X87_WIN-NEXT:    andl $-8, %esp
 | |
| ; X87_WIN-NEXT:    subl $16, %esp
 | |
| ; X87_WIN-NEXT:    fldt 8(%ebp)
 | |
| ; X87_WIN-NEXT:    flds __real@5f000000
 | |
| ; X87_WIN-NEXT:    fld %st(1)
 | |
| ; X87_WIN-NEXT:    fsub %st(1)
 | |
| ; X87_WIN-NEXT:    fxch %st(1)
 | |
| ; X87_WIN-NEXT:    fucomp %st(2)
 | |
| ; X87_WIN-NEXT:    fnstsw %ax
 | |
| ; X87_WIN-NEXT:    # kill: def $ah killed $ah killed $ax
 | |
| ; X87_WIN-NEXT:    sahf
 | |
| ; X87_WIN-NEXT:    ja LBB4_2
 | |
| ; X87_WIN-NEXT:  # %bb.1:
 | |
| ; X87_WIN-NEXT:    fstp %st(1)
 | |
| ; X87_WIN-NEXT:    fldz
 | |
| ; X87_WIN-NEXT:  LBB4_2:
 | |
| ; X87_WIN-NEXT:    fstp %st(0)
 | |
| ; X87_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    setbe %al
 | |
| ; X87_WIN-NEXT:    movzbl %al, %edx
 | |
| ; X87_WIN-NEXT:    shll $31, %edx
 | |
| ; X87_WIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movl %ebp, %esp
 | |
| ; X87_WIN-NEXT:    popl %ebp
 | |
| ; X87_WIN-NEXT:    retl
 | |
| ;
 | |
| ; X87_LIN-LABEL: x_to_u64:
 | |
| ; X87_LIN:       # %bb.0:
 | |
| ; X87_LIN-NEXT:    subl $20, %esp
 | |
| ; X87_LIN-NEXT:    fldt {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    flds {{\.LCPI.*}}
 | |
| ; X87_LIN-NEXT:    fld %st(1)
 | |
| ; X87_LIN-NEXT:    fsub %st(1)
 | |
| ; X87_LIN-NEXT:    fxch %st(1)
 | |
| ; X87_LIN-NEXT:    fucomp %st(2)
 | |
| ; X87_LIN-NEXT:    fnstsw %ax
 | |
| ; X87_LIN-NEXT:    # kill: def $ah killed $ah killed $ax
 | |
| ; X87_LIN-NEXT:    sahf
 | |
| ; X87_LIN-NEXT:    ja .LBB4_2
 | |
| ; X87_LIN-NEXT:  # %bb.1:
 | |
| ; X87_LIN-NEXT:    fstp %st(1)
 | |
| ; X87_LIN-NEXT:    fldz
 | |
| ; X87_LIN-NEXT:  .LBB4_2:
 | |
| ; X87_LIN-NEXT:    fstp %st(0)
 | |
| ; X87_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    setbe %al
 | |
| ; X87_LIN-NEXT:    movzbl %al, %edx
 | |
| ; X87_LIN-NEXT:    shll $31, %edx
 | |
| ; X87_LIN-NEXT:    xorl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    addl $20, %esp
 | |
| ; X87_LIN-NEXT:    retl
 | |
|   %r = fptoui x86_fp80 %a to i64
 | |
|   ret i64 %r
 | |
| }
 | |
| 
 | |
| define i64 @x_to_s64(x86_fp80 %a) nounwind {
 | |
| ; AVX512_32_WIN-LABEL: x_to_s64:
 | |
| ; AVX512_32_WIN:       # %bb.0:
 | |
| ; AVX512_32_WIN-NEXT:    pushl %ebp
 | |
| ; AVX512_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; AVX512_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; AVX512_32_WIN-NEXT:    subl $8, %esp
 | |
| ; AVX512_32_WIN-NEXT:    fldt 8(%ebp)
 | |
| ; AVX512_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; AVX512_32_WIN-NEXT:    popl %ebp
 | |
| ; AVX512_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_32_LIN-LABEL: x_to_s64:
 | |
| ; AVX512_32_LIN:       # %bb.0:
 | |
| ; AVX512_32_LIN-NEXT:    subl $12, %esp
 | |
| ; AVX512_32_LIN-NEXT:    fldt {{[0-9]+}}(%esp)
 | |
| ; AVX512_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; AVX512_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; AVX512_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; AVX512_32_LIN-NEXT:    addl $12, %esp
 | |
| ; AVX512_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_64_WIN-LABEL: x_to_s64:
 | |
| ; AVX512_64_WIN:       # %bb.0:
 | |
| ; AVX512_64_WIN-NEXT:    pushq %rax
 | |
| ; AVX512_64_WIN-NEXT:    fldt (%rcx)
 | |
| ; AVX512_64_WIN-NEXT:    fisttpll (%rsp)
 | |
| ; AVX512_64_WIN-NEXT:    movq (%rsp), %rax
 | |
| ; AVX512_64_WIN-NEXT:    popq %rcx
 | |
| ; AVX512_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; AVX512_64_LIN-LABEL: x_to_s64:
 | |
| ; AVX512_64_LIN:       # %bb.0:
 | |
| ; AVX512_64_LIN-NEXT:    fldt {{[0-9]+}}(%rsp)
 | |
| ; AVX512_64_LIN-NEXT:    fisttpll -{{[0-9]+}}(%rsp)
 | |
| ; AVX512_64_LIN-NEXT:    movq -{{[0-9]+}}(%rsp), %rax
 | |
| ; AVX512_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE3_32_WIN-LABEL: x_to_s64:
 | |
| ; SSE3_32_WIN:       # %bb.0:
 | |
| ; SSE3_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE3_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE3_32_WIN-NEXT:    subl $8, %esp
 | |
| ; SSE3_32_WIN-NEXT:    fldt 8(%ebp)
 | |
| ; SSE3_32_WIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_WIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE3_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE3_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_LIN-LABEL: x_to_s64:
 | |
| ; SSE3_32_LIN:       # %bb.0:
 | |
| ; SSE3_32_LIN-NEXT:    subl $12, %esp
 | |
| ; SSE3_32_LIN-NEXT:    fldt {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    fisttpll (%esp)
 | |
| ; SSE3_32_LIN-NEXT:    movl (%esp), %eax
 | |
| ; SSE3_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE3_32_LIN-NEXT:    addl $12, %esp
 | |
| ; SSE3_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_64_WIN-LABEL: x_to_s64:
 | |
| ; SSE3_64_WIN:       # %bb.0:
 | |
| ; SSE3_64_WIN-NEXT:    pushq %rax
 | |
| ; SSE3_64_WIN-NEXT:    fldt (%rcx)
 | |
| ; SSE3_64_WIN-NEXT:    fisttpll (%rsp)
 | |
| ; SSE3_64_WIN-NEXT:    movq (%rsp), %rax
 | |
| ; SSE3_64_WIN-NEXT:    popq %rcx
 | |
| ; SSE3_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE3_64_LIN-LABEL: x_to_s64:
 | |
| ; SSE3_64_LIN:       # %bb.0:
 | |
| ; SSE3_64_LIN-NEXT:    fldt {{[0-9]+}}(%rsp)
 | |
| ; SSE3_64_LIN-NEXT:    fisttpll -{{[0-9]+}}(%rsp)
 | |
| ; SSE3_64_LIN-NEXT:    movq -{{[0-9]+}}(%rsp), %rax
 | |
| ; SSE3_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_32_WIN-LABEL: x_to_s64:
 | |
| ; SSE2_32_WIN:       # %bb.0:
 | |
| ; SSE2_32_WIN-NEXT:    pushl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    movl %esp, %ebp
 | |
| ; SSE2_32_WIN-NEXT:    andl $-8, %esp
 | |
| ; SSE2_32_WIN-NEXT:    subl $16, %esp
 | |
| ; SSE2_32_WIN-NEXT:    fldt 8(%ebp)
 | |
| ; SSE2_32_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_WIN-NEXT:    movl %ebp, %esp
 | |
| ; SSE2_32_WIN-NEXT:    popl %ebp
 | |
| ; SSE2_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_32_LIN-LABEL: x_to_s64:
 | |
| ; SSE2_32_LIN:       # %bb.0:
 | |
| ; SSE2_32_LIN-NEXT:    subl $20, %esp
 | |
| ; SSE2_32_LIN-NEXT:    fldt {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; SSE2_32_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; SSE2_32_LIN-NEXT:    addl $20, %esp
 | |
| ; SSE2_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_64_WIN-LABEL: x_to_s64:
 | |
| ; SSE2_64_WIN:       # %bb.0:
 | |
| ; SSE2_64_WIN-NEXT:    subq $16, %rsp
 | |
| ; SSE2_64_WIN-NEXT:    fldt (%rcx)
 | |
| ; SSE2_64_WIN-NEXT:    fnstcw {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    movzwl {{[0-9]+}}(%rsp), %eax
 | |
| ; SSE2_64_WIN-NEXT:    movw $3199, {{[0-9]+}}(%rsp) # imm = 0xC7F
 | |
| ; SSE2_64_WIN-NEXT:    fldcw {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    movw %ax, {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    fistpll {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    fldcw {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_WIN-NEXT:    movq {{[0-9]+}}(%rsp), %rax
 | |
| ; SSE2_64_WIN-NEXT:    addq $16, %rsp
 | |
| ; SSE2_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_64_LIN-LABEL: x_to_s64:
 | |
| ; SSE2_64_LIN:       # %bb.0:
 | |
| ; SSE2_64_LIN-NEXT:    fldt {{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    fnstcw -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    movzwl -{{[0-9]+}}(%rsp), %eax
 | |
| ; SSE2_64_LIN-NEXT:    movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F
 | |
| ; SSE2_64_LIN-NEXT:    fldcw -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    movw %ax, -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    fistpll -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    fldcw -{{[0-9]+}}(%rsp)
 | |
| ; SSE2_64_LIN-NEXT:    movq -{{[0-9]+}}(%rsp), %rax
 | |
| ; SSE2_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; X87_WIN-LABEL: x_to_s64:
 | |
| ; X87_WIN:       # %bb.0:
 | |
| ; X87_WIN-NEXT:    pushl %ebp
 | |
| ; X87_WIN-NEXT:    movl %esp, %ebp
 | |
| ; X87_WIN-NEXT:    andl $-8, %esp
 | |
| ; X87_WIN-NEXT:    subl $16, %esp
 | |
| ; X87_WIN-NEXT:    fldt 8(%ebp)
 | |
| ; X87_WIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_WIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_WIN-NEXT:    movl %ebp, %esp
 | |
| ; X87_WIN-NEXT:    popl %ebp
 | |
| ; X87_WIN-NEXT:    retl
 | |
| ;
 | |
| ; X87_LIN-LABEL: x_to_s64:
 | |
| ; X87_LIN:       # %bb.0:
 | |
| ; X87_LIN-NEXT:    subl $20, %esp
 | |
| ; X87_LIN-NEXT:    fldt {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fnstcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movzwl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    movw $3199, {{[0-9]+}}(%esp) # imm = 0xC7F
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movw %ax, {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fistpll {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    fldcw {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    movl {{[0-9]+}}(%esp), %eax
 | |
| ; X87_LIN-NEXT:    movl {{[0-9]+}}(%esp), %edx
 | |
| ; X87_LIN-NEXT:    addl $20, %esp
 | |
| ; X87_LIN-NEXT:    retl
 | |
|   %r = fptosi x86_fp80 %a to i64
 | |
|   ret i64 %r
 | |
| }
 | |
| 
 | |
| define i64 @t_to_u64(fp128 %a) nounwind {
 | |
| ; AVX512_32_WIN-LABEL: t_to_u64:
 | |
| ; AVX512_32_WIN:       # %bb.0:
 | |
| ; AVX512_32_WIN-NEXT:    subl $16, %esp
 | |
| ; AVX512_32_WIN-NEXT:    vmovups {{[0-9]+}}(%esp), %xmm0
 | |
| ; AVX512_32_WIN-NEXT:    vmovups %xmm0, (%esp)
 | |
| ; AVX512_32_WIN-NEXT:    calll ___fixunstfdi
 | |
| ; AVX512_32_WIN-NEXT:    addl $16, %esp
 | |
| ; AVX512_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_32_LIN-LABEL: t_to_u64:
 | |
| ; AVX512_32_LIN:       # %bb.0:
 | |
| ; AVX512_32_LIN-NEXT:    subl $28, %esp
 | |
| ; AVX512_32_LIN-NEXT:    vmovaps {{[0-9]+}}(%esp), %xmm0
 | |
| ; AVX512_32_LIN-NEXT:    vmovups %xmm0, (%esp)
 | |
| ; AVX512_32_LIN-NEXT:    calll __fixunstfdi
 | |
| ; AVX512_32_LIN-NEXT:    addl $28, %esp
 | |
| ; AVX512_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_64_WIN-LABEL: t_to_u64:
 | |
| ; AVX512_64_WIN:       # %bb.0:
 | |
| ; AVX512_64_WIN-NEXT:    subq $40, %rsp
 | |
| ; AVX512_64_WIN-NEXT:    callq __fixunstfdi
 | |
| ; AVX512_64_WIN-NEXT:    addq $40, %rsp
 | |
| ; AVX512_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; AVX512_64_LIN-LABEL: t_to_u64:
 | |
| ; AVX512_64_LIN:       # %bb.0:
 | |
| ; AVX512_64_LIN-NEXT:    pushq %rax
 | |
| ; AVX512_64_LIN-NEXT:    callq __fixunstfdi
 | |
| ; AVX512_64_LIN-NEXT:    popq %rcx
 | |
| ; AVX512_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE3_32_WIN-LABEL: t_to_u64:
 | |
| ; SSE3_32_WIN:       # %bb.0:
 | |
| ; SSE3_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    calll ___fixunstfdi
 | |
| ; SSE3_32_WIN-NEXT:    addl $16, %esp
 | |
| ; SSE3_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_LIN-LABEL: t_to_u64:
 | |
| ; SSE3_32_LIN:       # %bb.0:
 | |
| ; SSE3_32_LIN-NEXT:    subl $12, %esp
 | |
| ; SSE3_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    calll __fixunstfdi
 | |
| ; SSE3_32_LIN-NEXT:    addl $28, %esp
 | |
| ; SSE3_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_64_WIN-LABEL: t_to_u64:
 | |
| ; SSE3_64_WIN:       # %bb.0:
 | |
| ; SSE3_64_WIN-NEXT:    subq $40, %rsp
 | |
| ; SSE3_64_WIN-NEXT:    callq __fixunstfdi
 | |
| ; SSE3_64_WIN-NEXT:    addq $40, %rsp
 | |
| ; SSE3_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE3_64_LIN-LABEL: t_to_u64:
 | |
| ; SSE3_64_LIN:       # %bb.0:
 | |
| ; SSE3_64_LIN-NEXT:    pushq %rax
 | |
| ; SSE3_64_LIN-NEXT:    callq __fixunstfdi
 | |
| ; SSE3_64_LIN-NEXT:    popq %rcx
 | |
| ; SSE3_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_32_WIN-LABEL: t_to_u64:
 | |
| ; SSE2_32_WIN:       # %bb.0:
 | |
| ; SSE2_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    calll ___fixunstfdi
 | |
| ; SSE2_32_WIN-NEXT:    addl $16, %esp
 | |
| ; SSE2_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_32_LIN-LABEL: t_to_u64:
 | |
| ; SSE2_32_LIN:       # %bb.0:
 | |
| ; SSE2_32_LIN-NEXT:    subl $12, %esp
 | |
| ; SSE2_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    calll __fixunstfdi
 | |
| ; SSE2_32_LIN-NEXT:    addl $28, %esp
 | |
| ; SSE2_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_64_WIN-LABEL: t_to_u64:
 | |
| ; SSE2_64_WIN:       # %bb.0:
 | |
| ; SSE2_64_WIN-NEXT:    subq $40, %rsp
 | |
| ; SSE2_64_WIN-NEXT:    callq __fixunstfdi
 | |
| ; SSE2_64_WIN-NEXT:    addq $40, %rsp
 | |
| ; SSE2_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_64_LIN-LABEL: t_to_u64:
 | |
| ; SSE2_64_LIN:       # %bb.0:
 | |
| ; SSE2_64_LIN-NEXT:    pushq %rax
 | |
| ; SSE2_64_LIN-NEXT:    callq __fixunstfdi
 | |
| ; SSE2_64_LIN-NEXT:    popq %rcx
 | |
| ; SSE2_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; X87_WIN-LABEL: t_to_u64:
 | |
| ; X87_WIN:       # %bb.0:
 | |
| ; X87_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    calll ___fixunstfdi
 | |
| ; X87_WIN-NEXT:    addl $16, %esp
 | |
| ; X87_WIN-NEXT:    retl
 | |
| ;
 | |
| ; X87_LIN-LABEL: t_to_u64:
 | |
| ; X87_LIN:       # %bb.0:
 | |
| ; X87_LIN-NEXT:    subl $12, %esp
 | |
| ; X87_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    calll __fixunstfdi
 | |
| ; X87_LIN-NEXT:    addl $28, %esp
 | |
| ; X87_LIN-NEXT:    retl
 | |
|   %r = fptoui fp128 %a to i64
 | |
|   ret i64 %r
 | |
| }
 | |
| 
 | |
| define i64 @t_to_s64(fp128 %a) nounwind {
 | |
| ; AVX512_32_WIN-LABEL: t_to_s64:
 | |
| ; AVX512_32_WIN:       # %bb.0:
 | |
| ; AVX512_32_WIN-NEXT:    subl $16, %esp
 | |
| ; AVX512_32_WIN-NEXT:    vmovups {{[0-9]+}}(%esp), %xmm0
 | |
| ; AVX512_32_WIN-NEXT:    vmovups %xmm0, (%esp)
 | |
| ; AVX512_32_WIN-NEXT:    calll ___fixtfdi
 | |
| ; AVX512_32_WIN-NEXT:    addl $16, %esp
 | |
| ; AVX512_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_32_LIN-LABEL: t_to_s64:
 | |
| ; AVX512_32_LIN:       # %bb.0:
 | |
| ; AVX512_32_LIN-NEXT:    subl $28, %esp
 | |
| ; AVX512_32_LIN-NEXT:    vmovaps {{[0-9]+}}(%esp), %xmm0
 | |
| ; AVX512_32_LIN-NEXT:    vmovups %xmm0, (%esp)
 | |
| ; AVX512_32_LIN-NEXT:    calll __fixtfdi
 | |
| ; AVX512_32_LIN-NEXT:    addl $28, %esp
 | |
| ; AVX512_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; AVX512_64_WIN-LABEL: t_to_s64:
 | |
| ; AVX512_64_WIN:       # %bb.0:
 | |
| ; AVX512_64_WIN-NEXT:    subq $40, %rsp
 | |
| ; AVX512_64_WIN-NEXT:    callq __fixtfdi
 | |
| ; AVX512_64_WIN-NEXT:    addq $40, %rsp
 | |
| ; AVX512_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; AVX512_64_LIN-LABEL: t_to_s64:
 | |
| ; AVX512_64_LIN:       # %bb.0:
 | |
| ; AVX512_64_LIN-NEXT:    pushq %rax
 | |
| ; AVX512_64_LIN-NEXT:    callq __fixtfdi
 | |
| ; AVX512_64_LIN-NEXT:    popq %rcx
 | |
| ; AVX512_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE3_32_WIN-LABEL: t_to_s64:
 | |
| ; SSE3_32_WIN:       # %bb.0:
 | |
| ; SSE3_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_WIN-NEXT:    calll ___fixtfdi
 | |
| ; SSE3_32_WIN-NEXT:    addl $16, %esp
 | |
| ; SSE3_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_32_LIN-LABEL: t_to_s64:
 | |
| ; SSE3_32_LIN:       # %bb.0:
 | |
| ; SSE3_32_LIN-NEXT:    subl $12, %esp
 | |
| ; SSE3_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE3_32_LIN-NEXT:    calll __fixtfdi
 | |
| ; SSE3_32_LIN-NEXT:    addl $28, %esp
 | |
| ; SSE3_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE3_64_WIN-LABEL: t_to_s64:
 | |
| ; SSE3_64_WIN:       # %bb.0:
 | |
| ; SSE3_64_WIN-NEXT:    subq $40, %rsp
 | |
| ; SSE3_64_WIN-NEXT:    callq __fixtfdi
 | |
| ; SSE3_64_WIN-NEXT:    addq $40, %rsp
 | |
| ; SSE3_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE3_64_LIN-LABEL: t_to_s64:
 | |
| ; SSE3_64_LIN:       # %bb.0:
 | |
| ; SSE3_64_LIN-NEXT:    pushq %rax
 | |
| ; SSE3_64_LIN-NEXT:    callq __fixtfdi
 | |
| ; SSE3_64_LIN-NEXT:    popq %rcx
 | |
| ; SSE3_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_32_WIN-LABEL: t_to_s64:
 | |
| ; SSE2_32_WIN:       # %bb.0:
 | |
| ; SSE2_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_WIN-NEXT:    calll ___fixtfdi
 | |
| ; SSE2_32_WIN-NEXT:    addl $16, %esp
 | |
| ; SSE2_32_WIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_32_LIN-LABEL: t_to_s64:
 | |
| ; SSE2_32_LIN:       # %bb.0:
 | |
| ; SSE2_32_LIN-NEXT:    subl $12, %esp
 | |
| ; SSE2_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; SSE2_32_LIN-NEXT:    calll __fixtfdi
 | |
| ; SSE2_32_LIN-NEXT:    addl $28, %esp
 | |
| ; SSE2_32_LIN-NEXT:    retl
 | |
| ;
 | |
| ; SSE2_64_WIN-LABEL: t_to_s64:
 | |
| ; SSE2_64_WIN:       # %bb.0:
 | |
| ; SSE2_64_WIN-NEXT:    subq $40, %rsp
 | |
| ; SSE2_64_WIN-NEXT:    callq __fixtfdi
 | |
| ; SSE2_64_WIN-NEXT:    addq $40, %rsp
 | |
| ; SSE2_64_WIN-NEXT:    retq
 | |
| ;
 | |
| ; SSE2_64_LIN-LABEL: t_to_s64:
 | |
| ; SSE2_64_LIN:       # %bb.0:
 | |
| ; SSE2_64_LIN-NEXT:    pushq %rax
 | |
| ; SSE2_64_LIN-NEXT:    callq __fixtfdi
 | |
| ; SSE2_64_LIN-NEXT:    popq %rcx
 | |
| ; SSE2_64_LIN-NEXT:    retq
 | |
| ;
 | |
| ; X87_WIN-LABEL: t_to_s64:
 | |
| ; X87_WIN:       # %bb.0:
 | |
| ; X87_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_WIN-NEXT:    calll ___fixtfdi
 | |
| ; X87_WIN-NEXT:    addl $16, %esp
 | |
| ; X87_WIN-NEXT:    retl
 | |
| ;
 | |
| ; X87_LIN-LABEL: t_to_s64:
 | |
| ; X87_LIN:       # %bb.0:
 | |
| ; X87_LIN-NEXT:    subl $12, %esp
 | |
| ; X87_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    pushl {{[0-9]+}}(%esp)
 | |
| ; X87_LIN-NEXT:    calll __fixtfdi
 | |
| ; X87_LIN-NEXT:    addl $28, %esp
 | |
| ; X87_LIN-NEXT:    retl
 | |
|   %r = fptosi fp128 %a to i64
 | |
|   ret i64 %r
 | |
| }
 |