[X86] Regenerate test. NFCI.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@313259 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
Simon Pilgrim 2017-09-14 13:00:27 +00:00
parent 2664884ef8
commit da89c08512

View File

@ -1,18 +1,33 @@
; RUN: llc -mtriple=x86_64-apple-macosx -mattr=+sse2 -verify-machineinstrs < %s | FileCheck %s
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-apple-macosx -mattr=+sse2 -verify-machineinstrs | FileCheck %s
; After tail duplication, two copies in an early exit BB can be cancelled out.
; rdar://10640363
define i32 @t1(i32 %a, i32 %b) nounwind {
entry:
; CHECK-LABEL: t1:
; CHECK: je [[LABEL:.*BB.*]]
; CHECK: ## BB#0: ## %entry
; CHECK-NEXT: movl %esi, %edx
; CHECK-NEXT: movl %edi, %eax
; CHECK-NEXT: testl %edx, %edx
; CHECK-NEXT: je LBB0_1
; CHECK-NEXT: .p2align 4, 0x90
; CHECK-NEXT: LBB0_2: ## %while.body
; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
; CHECK-NEXT: movl %edx, %ecx
; CHECK-NEXT: cltd
; CHECK-NEXT: idivl %ecx
; CHECK-NEXT: testl %edx, %edx
; CHECK-NEXT: movl %ecx, %eax
; CHECK-NEXT: jne LBB0_2
; CHECK-NEXT: ## BB#3: ## %while.end
; CHECK-NEXT: movl %ecx, %eax
; CHECK-NEXT: retq
; CHECK-NEXT: LBB0_1:
; CHECK-NEXT: retq
entry:
%cmp1 = icmp eq i32 %b, 0
br i1 %cmp1, label %while.end, label %while.body
; CHECK: [[LABEL]]:
; CHECK-NOT: mov
; CHECK: ret
while.body: ; preds = %entry, %while.body
%a.addr.03 = phi i32 [ %b.addr.02, %while.body ], [ %a, %entry ]
%b.addr.02 = phi i32 [ %rem, %while.body ], [ %b, %entry ]
@ -28,24 +43,42 @@ while.end: ; preds = %while.body, %entry
; Two movdqa (from phi-elimination) in the entry BB cancel out.
; rdar://10428165
define <8 x i16> @t2(<8 x i16> %T0, <8 x i16> %T1) nounwind readnone {
entry:
; CHECK-LABEL: t2:
; CHECK-NOT: movdqa
; CHECK: ## BB#0: ## %entry
; CHECK-NEXT: pshufd {{.*#+}} xmm0 = xmm0[3,1,2,3]
; CHECK-NEXT: pshuflw {{.*#+}} xmm0 = xmm0[0,1,1,2,4,5,6,7]
; CHECK-NEXT: punpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; CHECK-NEXT: retq
entry:
%tmp8 = shufflevector <8 x i16> %T0, <8 x i16> %T1, <8 x i32> < i32 undef, i32 undef, i32 7, i32 2, i32 8, i32 undef, i32 undef , i32 undef >
ret <8 x i16> %tmp8
}
define i32 @t3(i64 %a, i64 %b) nounwind {
entry:
; CHECK-LABEL: t3:
; CHECK: je [[LABEL:.*BB.*]]
; CHECK: ## BB#0: ## %entry
; CHECK-NEXT: movq %rsi, %rdx
; CHECK-NEXT: movq %rdi, %rax
; CHECK-NEXT: testq %rdx, %rdx
; CHECK-NEXT: je LBB2_1
; CHECK-NEXT: .p2align 4, 0x90
; CHECK-NEXT: LBB2_2: ## %while.body
; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
; CHECK-NEXT: movq %rdx, %rcx
; CHECK-NEXT: cqto
; CHECK-NEXT: idivq %rcx
; CHECK-NEXT: testq %rdx, %rdx
; CHECK-NEXT: movq %rcx, %rax
; CHECK-NEXT: jne LBB2_2
; CHECK-NEXT: ## BB#3: ## %while.end
; CHECK-NEXT: movl %ecx, %eax
; CHECK-NEXT: retq
; CHECK-NEXT: LBB2_1:
; CHECK-NEXT: retq
entry:
%cmp1 = icmp eq i64 %b, 0
br i1 %cmp1, label %while.end, label %while.body
; CHECK: [[LABEL]]:
; CHECK-NOT: mov
; CHECK: ret
while.body: ; preds = %entry, %while.body
%a.addr.03 = phi i64 [ %b.addr.02, %while.body ], [ %a, %entry ]
%b.addr.02 = phi i64 [ %rem, %while.body ], [ %b, %entry ]
@ -63,27 +96,123 @@ while.end: ; preds = %while.body, %entry
; dst = copy src <-- do not kill that.
; ... = op1 dst<undef>
; ... = op2 dst <-- this is used here.
;
; CHECK-LABEL: foo:
; CHECK: psllw $7,
; CHECK: psllw $7, [[SRC1:%xmm[0-9]+]]
; CHECK-NEXT: pand {{.*}}(%rip), [[SRC1]]
; CHECK-NEXT: pcmpgtb [[SRC1]], [[SRC2:%xmm[0-9]+]]
; CHECK-NEXT: pand %xmm{{[0-9]+}}, [[SRC2]]
; CHECK-NEXT: movdqa [[SRC2]], [[CPY1:%xmm[0-9]+]]
; CHECK-NEXT: punpcklbw %xmm{{[0-9]+}}, [[CPY1]]
; Check that CPY1 is not redefined.
; CHECK-NOT: , [[CPY1]]
; CHECK: punpckhwd %xmm{{[0-9]+}}, [[CPY1]]
; CHECK-NEXT: pslld $31, [[CPY1]]
; CHECK-NEXT: psrad $31, [[CPY1]]
; CHECK: punpckhbw %xmm{{[0-9]+}}, [[CPY2:%xmm[0-9]+]]
; Check that CPY2 is not redefined.
; CHECK-NOT: , [[CPY2]]
; CHECK: punpckhwd %xmm{{[0-9]+}}, [[CPY2]]
; CHECK-NEXT: pslld $31, [[CPY2]]
; CHECK-NEXT: psrad $31, [[CPY2]]
define <16 x float> @foo(<16 x float> %x) {
; CHECK-LABEL: foo:
; CHECK: ## BB#0: ## %bb
; CHECK-NEXT: movaps %xmm3, %xmm9
; CHECK-NEXT: movaps %xmm1, -{{[0-9]+}}(%rsp) ## 16-byte Spill
; CHECK-NEXT: xorps %xmm3, %xmm3
; CHECK-NEXT: pxor %xmm6, %xmm6
; CHECK-NEXT: pcmpgtd %xmm0, %xmm6
; CHECK-NEXT: pshuflw {{.*#+}} xmm4 = xmm6[0,2,2,0,4,5,6,7]
; CHECK-NEXT: pshufhw {{.*#+}} xmm4 = xmm4[0,1,2,3,4,6,6,4]
; CHECK-NEXT: pshufd {{.*#+}} xmm4 = xmm4[0,3,2,1]
; CHECK-NEXT: pshuflw {{.*#+}} xmm4 = xmm4[0,1,3,2,4,5,6,7]
; CHECK-NEXT: pshufhw {{.*#+}} xmm4 = xmm4[0,1,2,3,7,6,4,5]
; CHECK-NEXT: psllw $15, %xmm4
; CHECK-NEXT: psraw $15, %xmm4
; CHECK-NEXT: pand {{.*}}(%rip), %xmm4
; CHECK-NEXT: packuswb %xmm4, %xmm4
; CHECK-NEXT: psllw $7, %xmm4
; CHECK-NEXT: pand {{.*}}(%rip), %xmm4
; CHECK-NEXT: pxor %xmm15, %xmm15
; CHECK-NEXT: pcmpgtb %xmm4, %xmm15
; CHECK-NEXT: movdqa %xmm0, %xmm12
; CHECK-NEXT: cmpltps %xmm3, %xmm12
; CHECK-NEXT: movdqa %xmm6, %xmm10
; CHECK-NEXT: pxor %xmm12, %xmm10
; CHECK-NEXT: movaps %xmm1, %xmm11
; CHECK-NEXT: cmpltps %xmm3, %xmm11
; CHECK-NEXT: movdqa %xmm6, %xmm4
; CHECK-NEXT: pxor %xmm11, %xmm4
; CHECK-NEXT: cvttps2dq %xmm2, %xmm8
; CHECK-NEXT: cmpltps %xmm3, %xmm2
; CHECK-NEXT: movdqa %xmm6, %xmm7
; CHECK-NEXT: pxor %xmm2, %xmm7
; CHECK-NEXT: cvttps2dq %xmm9, %xmm13
; CHECK-NEXT: cmpltps %xmm3, %xmm9
; CHECK-NEXT: pxor %xmm9, %xmm6
; CHECK-NEXT: movdqa {{.*#+}} xmm14 = [1,1,1,1]
; CHECK-NEXT: pand %xmm14, %xmm6
; CHECK-NEXT: pand %xmm14, %xmm7
; CHECK-NEXT: pand %xmm14, %xmm4
; CHECK-NEXT: pand %xmm14, %xmm10
; CHECK-NEXT: cvtdq2ps %xmm8, %xmm14
; CHECK-NEXT: cvtdq2ps %xmm13, %xmm1
; CHECK-NEXT: movaps %xmm1, -{{[0-9]+}}(%rsp) ## 16-byte Spill
; CHECK-NEXT: xorps %xmm5, %xmm5
; CHECK-NEXT: cmpltps %xmm1, %xmm5
; CHECK-NEXT: pshuflw {{.*#+}} xmm5 = xmm5[0,2,2,3,4,5,6,7]
; CHECK-NEXT: pshufhw {{.*#+}} xmm5 = xmm5[0,1,2,3,4,6,6,7]
; CHECK-NEXT: pshufd {{.*#+}} xmm5 = xmm5[0,2,2,3]
; CHECK-NEXT: xorps %xmm1, %xmm1
; CHECK-NEXT: cmpltps %xmm14, %xmm1
; CHECK-NEXT: pshuflw {{.*#+}} xmm1 = xmm1[0,2,2,3,4,5,6,7]
; CHECK-NEXT: pshufhw {{.*#+}} xmm1 = xmm1[0,1,2,3,4,6,6,7]
; CHECK-NEXT: pshufd {{.*#+}} xmm1 = xmm1[0,2,2,3]
; CHECK-NEXT: punpcklqdq {{.*#+}} xmm1 = xmm1[0],xmm5[0]
; CHECK-NEXT: cvttps2dq -{{[0-9]+}}(%rsp), %xmm5 ## 16-byte Folded Reload
; CHECK-NEXT: cvttps2dq %xmm0, %xmm0
; CHECK-NEXT: cvtdq2ps %xmm0, %xmm8
; CHECK-NEXT: cvtdq2ps %xmm5, %xmm13
; CHECK-NEXT: xorps %xmm0, %xmm0
; CHECK-NEXT: cmpltps %xmm13, %xmm0
; CHECK-NEXT: pshuflw {{.*#+}} xmm0 = xmm0[0,2,2,3,4,5,6,7]
; CHECK-NEXT: pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,4,6,6,7]
; CHECK-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,2,2,3]
; CHECK-NEXT: xorps %xmm5, %xmm5
; CHECK-NEXT: cmpltps %xmm8, %xmm5
; CHECK-NEXT: pshuflw {{.*#+}} xmm5 = xmm5[0,2,2,3,4,5,6,7]
; CHECK-NEXT: pshufhw {{.*#+}} xmm5 = xmm5[0,1,2,3,4,6,6,7]
; CHECK-NEXT: pshufd {{.*#+}} xmm5 = xmm5[0,2,2,3]
; CHECK-NEXT: punpcklqdq {{.*#+}} xmm5 = xmm5[0],xmm0[0]
; CHECK-NEXT: psllw $15, %xmm1
; CHECK-NEXT: psraw $15, %xmm1
; CHECK-NEXT: movdqa {{.*#+}} xmm0 = [255,255,255,255,255,255,255,255]
; CHECK-NEXT: pand %xmm0, %xmm1
; CHECK-NEXT: psllw $15, %xmm5
; CHECK-NEXT: psraw $15, %xmm5
; CHECK-NEXT: pand %xmm0, %xmm5
; CHECK-NEXT: packuswb %xmm1, %xmm5
; CHECK-NEXT: psllw $7, %xmm5
; CHECK-NEXT: pand {{.*}}(%rip), %xmm5
; CHECK-NEXT: pcmpgtb %xmm5, %xmm3
; CHECK-NEXT: pand %xmm15, %xmm3
; CHECK-NEXT: movdqa %xmm3, %xmm1
; CHECK-NEXT: punpcklbw {{.*#+}} xmm1 = xmm1[0],xmm0[0],xmm1[1],xmm0[1],xmm1[2],xmm0[2],xmm1[3],xmm0[3],xmm1[4],xmm0[4],xmm1[5],xmm0[5],xmm1[6],xmm0[6],xmm1[7],xmm0[7]
; CHECK-NEXT: movdqa %xmm1, %xmm0
; CHECK-NEXT: punpcklwd {{.*#+}} xmm0 = xmm0[0,0,1,1,2,2,3,3]
; CHECK-NEXT: pslld $31, %xmm0
; CHECK-NEXT: psrad $31, %xmm0
; CHECK-NEXT: pxor %xmm10, %xmm0
; CHECK-NEXT: pxor %xmm8, %xmm0
; CHECK-NEXT: punpckhwd {{.*#+}} xmm1 = xmm1[4],xmm0[4],xmm1[5],xmm0[5],xmm1[6],xmm0[6],xmm1[7],xmm0[7]
; CHECK-NEXT: pslld $31, %xmm1
; CHECK-NEXT: psrad $31, %xmm1
; CHECK-NEXT: punpckhbw {{.*#+}} xmm3 = xmm3[8],xmm0[8],xmm3[9],xmm0[9],xmm3[10],xmm0[10],xmm3[11],xmm0[11],xmm3[12],xmm0[12],xmm3[13],xmm0[13],xmm3[14],xmm0[14],xmm3[15],xmm0[15]
; CHECK-NEXT: pxor %xmm4, %xmm1
; CHECK-NEXT: pxor %xmm13, %xmm1
; CHECK-NEXT: movdqa %xmm3, %xmm5
; CHECK-NEXT: punpcklwd {{.*#+}} xmm5 = xmm5[0],xmm0[0],xmm5[1],xmm0[1],xmm5[2],xmm0[2],xmm5[3],xmm0[3]
; CHECK-NEXT: pslld $31, %xmm5
; CHECK-NEXT: psrad $31, %xmm5
; CHECK-NEXT: pxor %xmm7, %xmm5
; CHECK-NEXT: pxor %xmm14, %xmm5
; CHECK-NEXT: punpckhwd {{.*#+}} xmm3 = xmm3[4],xmm0[4],xmm3[5],xmm0[5],xmm3[6],xmm0[6],xmm3[7],xmm0[7]
; CHECK-NEXT: pslld $31, %xmm3
; CHECK-NEXT: psrad $31, %xmm3
; CHECK-NEXT: pxor %xmm6, %xmm3
; CHECK-NEXT: pxor -{{[0-9]+}}(%rsp), %xmm3 ## 16-byte Folded Reload
; CHECK-NEXT: pand %xmm9, %xmm3
; CHECK-NEXT: pand %xmm2, %xmm5
; CHECK-NEXT: pand %xmm11, %xmm1
; CHECK-NEXT: pand %xmm12, %xmm0
; CHECK-NEXT: pxor %xmm10, %xmm0
; CHECK-NEXT: pxor %xmm4, %xmm1
; CHECK-NEXT: pxor %xmm7, %xmm5
; CHECK-NEXT: pxor %xmm6, %xmm3
; CHECK-NEXT: movdqa %xmm5, %xmm2
; CHECK-NEXT: retq
bb:
%v3 = icmp slt <16 x i32> undef, zeroinitializer
%v14 = zext <16 x i1> %v3 to <16 x i32>