mirror of
https://github.com/RPCSX/llvm.git
synced 2024-11-27 21:50:40 +00:00
[CostModel][X86] Tidied up checks
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@269770 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
9ae1fd1674
commit
7537c45fbd
@ -1,8 +1,8 @@
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=pentium4 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=SSE2
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=SSE42
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7-avx -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=AVX
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=core-avx2 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=AVX2
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=bdver2 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=XOP -check-prefix=XOPAVX
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=pentium4 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=SSE -check-prefix=SSE2
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=SSE -check-prefix=SSE42
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7-avx -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=AVX -check-prefix=AVX1
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=core-avx2 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=AVX -check-prefix=AVX2
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=bdver2 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=XOP -check-prefix=XOPAVX1
|
||||
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=bdver4 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=XOP -check-prefix=XOPAVX2
|
||||
|
||||
; Verify the cost of vector population count instructions.
|
||||
@ -19,10 +19,8 @@ declare <32 x i8> @llvm.ctpop.v32i8(<32 x i8>)
|
||||
|
||||
define <2 x i64> @var_ctpop_v2i64(<2 x i64> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctpop_v2i64':
|
||||
; SSE2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; SSE42: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; SSE: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; XOP: Found an estimated cost of 2 for instruction: %ctpop
|
||||
%ctpop = call <2 x i64> @llvm.ctpop.v2i64(<2 x i64> %a)
|
||||
ret <2 x i64> %ctpop
|
||||
@ -30,10 +28,8 @@ define <2 x i64> @var_ctpop_v2i64(<2 x i64> %a) {
|
||||
|
||||
define <4 x i64> @var_ctpop_v4i64(<4 x i64> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctpop_v4i64':
|
||||
; SSE2: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; SSE42: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; SSE: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; AVX: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; XOP: Found an estimated cost of 2 for instruction: %ctpop
|
||||
%ctpop = call <4 x i64> @llvm.ctpop.v4i64(<4 x i64> %a)
|
||||
ret <4 x i64> %ctpop
|
||||
@ -41,10 +37,8 @@ define <4 x i64> @var_ctpop_v4i64(<4 x i64> %a) {
|
||||
|
||||
define <4 x i32> @var_ctpop_v4i32(<4 x i32> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctpop_v4i32':
|
||||
; SSE2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; SSE42: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; SSE: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; XOP: Found an estimated cost of 2 for instruction: %ctpop
|
||||
%ctpop = call <4 x i32> @llvm.ctpop.v4i32(<4 x i32> %a)
|
||||
ret <4 x i32> %ctpop
|
||||
@ -52,10 +46,8 @@ define <4 x i32> @var_ctpop_v4i32(<4 x i32> %a) {
|
||||
|
||||
define <8 x i32> @var_ctpop_v8i32(<8 x i32> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctpop_v8i32':
|
||||
; SSE2: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; SSE42: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; SSE: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; AVX: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; XOP: Found an estimated cost of 2 for instruction: %ctpop
|
||||
%ctpop = call <8 x i32> @llvm.ctpop.v8i32(<8 x i32> %a)
|
||||
ret <8 x i32> %ctpop
|
||||
@ -63,10 +55,8 @@ define <8 x i32> @var_ctpop_v8i32(<8 x i32> %a) {
|
||||
|
||||
define <8 x i16> @var_ctpop_v8i16(<8 x i16> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctpop_v8i16':
|
||||
; SSE2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; SSE42: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; SSE: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; XOP: Found an estimated cost of 2 for instruction: %ctpop
|
||||
%ctpop = call <8 x i16> @llvm.ctpop.v8i16(<8 x i16> %a)
|
||||
ret <8 x i16> %ctpop
|
||||
@ -74,10 +64,8 @@ define <8 x i16> @var_ctpop_v8i16(<8 x i16> %a) {
|
||||
|
||||
define <16 x i16> @var_ctpop_v16i16(<16 x i16> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctpop_v16i16':
|
||||
; SSE2: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; SSE42: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; SSE: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; AVX: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; XOP: Found an estimated cost of 2 for instruction: %ctpop
|
||||
%ctpop = call <16 x i16> @llvm.ctpop.v16i16(<16 x i16> %a)
|
||||
ret <16 x i16> %ctpop
|
||||
@ -85,10 +73,8 @@ define <16 x i16> @var_ctpop_v16i16(<16 x i16> %a) {
|
||||
|
||||
define <16 x i8> @var_ctpop_v16i8(<16 x i8> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctpop_v16i8':
|
||||
; SSE2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; SSE42: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; SSE: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; XOP: Found an estimated cost of 2 for instruction: %ctpop
|
||||
%ctpop = call <16 x i8> @llvm.ctpop.v16i8(<16 x i8> %a)
|
||||
ret <16 x i8> %ctpop
|
||||
@ -96,10 +82,8 @@ define <16 x i8> @var_ctpop_v16i8(<16 x i8> %a) {
|
||||
|
||||
define <32 x i8> @var_ctpop_v32i8(<32 x i8> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctpop_v32i8':
|
||||
; SSE2: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; SSE42: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; SSE: Found an estimated cost of 4 for instruction: %ctpop
|
||||
; AVX: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; AVX2: Found an estimated cost of 2 for instruction: %ctpop
|
||||
; XOP: Found an estimated cost of 2 for instruction: %ctpop
|
||||
%ctpop = call <32 x i8> @llvm.ctpop.v32i8(<32 x i8> %a)
|
||||
ret <32 x i8> %ctpop
|
||||
@ -119,10 +103,8 @@ declare <32 x i8> @llvm.ctlz.v32i8(<32 x i8>, i1)
|
||||
|
||||
define <2 x i64> @var_ctlz_v2i64(<2 x i64> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v2i64':
|
||||
; SSE2: Found an estimated cost of 6 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 6 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 6 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 6 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 6 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 6 for instruction: %ctlz
|
||||
%ctlz = call <2 x i64> @llvm.ctlz.v2i64(<2 x i64> %a, i1 0)
|
||||
ret <2 x i64> %ctlz
|
||||
@ -130,10 +112,8 @@ define <2 x i64> @var_ctlz_v2i64(<2 x i64> %a) {
|
||||
|
||||
define <2 x i64> @var_ctlz_v2i64u(<2 x i64> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v2i64u':
|
||||
; SSE2: Found an estimated cost of 6 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 6 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 6 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 6 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 6 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 6 for instruction: %ctlz
|
||||
%ctlz = call <2 x i64> @llvm.ctlz.v2i64(<2 x i64> %a, i1 1)
|
||||
ret <2 x i64> %ctlz
|
||||
@ -141,10 +121,8 @@ define <2 x i64> @var_ctlz_v2i64u(<2 x i64> %a) {
|
||||
|
||||
define <4 x i64> @var_ctlz_v4i64(<4 x i64> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v4i64':
|
||||
; SSE2: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 12 for instruction: %ctlz
|
||||
%ctlz = call <4 x i64> @llvm.ctlz.v4i64(<4 x i64> %a, i1 0)
|
||||
ret <4 x i64> %ctlz
|
||||
@ -152,10 +130,8 @@ define <4 x i64> @var_ctlz_v4i64(<4 x i64> %a) {
|
||||
|
||||
define <4 x i64> @var_ctlz_v4i64u(<4 x i64> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v4i64u':
|
||||
; SSE2: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 12 for instruction: %ctlz
|
||||
%ctlz = call <4 x i64> @llvm.ctlz.v4i64(<4 x i64> %a, i1 1)
|
||||
ret <4 x i64> %ctlz
|
||||
@ -163,10 +139,8 @@ define <4 x i64> @var_ctlz_v4i64u(<4 x i64> %a) {
|
||||
|
||||
define <4 x i32> @var_ctlz_v4i32(<4 x i32> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v4i32':
|
||||
; SSE2: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 12 for instruction: %ctlz
|
||||
%ctlz = call <4 x i32> @llvm.ctlz.v4i32(<4 x i32> %a, i1 0)
|
||||
ret <4 x i32> %ctlz
|
||||
@ -174,10 +148,8 @@ define <4 x i32> @var_ctlz_v4i32(<4 x i32> %a) {
|
||||
|
||||
define <4 x i32> @var_ctlz_v4i32u(<4 x i32> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v4i32u':
|
||||
; SSE2: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 12 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 12 for instruction: %ctlz
|
||||
%ctlz = call <4 x i32> @llvm.ctlz.v4i32(<4 x i32> %a, i1 1)
|
||||
ret <4 x i32> %ctlz
|
||||
@ -185,10 +157,8 @@ define <4 x i32> @var_ctlz_v4i32u(<4 x i32> %a) {
|
||||
|
||||
define <8 x i32> @var_ctlz_v8i32(<8 x i32> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v8i32':
|
||||
; SSE2: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 24 for instruction: %ctlz
|
||||
%ctlz = call <8 x i32> @llvm.ctlz.v8i32(<8 x i32> %a, i1 0)
|
||||
ret <8 x i32> %ctlz
|
||||
@ -196,10 +166,8 @@ define <8 x i32> @var_ctlz_v8i32(<8 x i32> %a) {
|
||||
|
||||
define <8 x i32> @var_ctlz_v8i32u(<8 x i32> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v8i32u':
|
||||
; SSE2: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 24 for instruction: %ctlz
|
||||
%ctlz = call <8 x i32> @llvm.ctlz.v8i32(<8 x i32> %a, i1 1)
|
||||
ret <8 x i32> %ctlz
|
||||
@ -207,10 +175,8 @@ define <8 x i32> @var_ctlz_v8i32u(<8 x i32> %a) {
|
||||
|
||||
define <8 x i16> @var_ctlz_v8i16(<8 x i16> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v8i16':
|
||||
; SSE2: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 24 for instruction: %ctlz
|
||||
%ctlz = call <8 x i16> @llvm.ctlz.v8i16(<8 x i16> %a, i1 0)
|
||||
ret <8 x i16> %ctlz
|
||||
@ -218,10 +184,8 @@ define <8 x i16> @var_ctlz_v8i16(<8 x i16> %a) {
|
||||
|
||||
define <8 x i16> @var_ctlz_v8i16u(<8 x i16> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v8i16u':
|
||||
; SSE2: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 24 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 24 for instruction: %ctlz
|
||||
%ctlz = call <8 x i16> @llvm.ctlz.v8i16(<8 x i16> %a, i1 1)
|
||||
ret <8 x i16> %ctlz
|
||||
@ -229,10 +193,8 @@ define <8 x i16> @var_ctlz_v8i16u(<8 x i16> %a) {
|
||||
|
||||
define <16 x i16> @var_ctlz_v16i16(<16 x i16> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v16i16':
|
||||
; SSE2: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 48 for instruction: %ctlz
|
||||
%ctlz = call <16 x i16> @llvm.ctlz.v16i16(<16 x i16> %a, i1 0)
|
||||
ret <16 x i16> %ctlz
|
||||
@ -240,10 +202,8 @@ define <16 x i16> @var_ctlz_v16i16(<16 x i16> %a) {
|
||||
|
||||
define <16 x i16> @var_ctlz_v16i16u(<16 x i16> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v16i16u':
|
||||
; SSE2: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 48 for instruction: %ctlz
|
||||
%ctlz = call <16 x i16> @llvm.ctlz.v16i16(<16 x i16> %a, i1 1)
|
||||
ret <16 x i16> %ctlz
|
||||
@ -251,10 +211,8 @@ define <16 x i16> @var_ctlz_v16i16u(<16 x i16> %a) {
|
||||
|
||||
define <16 x i8> @var_ctlz_v16i8(<16 x i8> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v16i8':
|
||||
; SSE2: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 48 for instruction: %ctlz
|
||||
%ctlz = call <16 x i8> @llvm.ctlz.v16i8(<16 x i8> %a, i1 0)
|
||||
ret <16 x i8> %ctlz
|
||||
@ -262,10 +220,8 @@ define <16 x i8> @var_ctlz_v16i8(<16 x i8> %a) {
|
||||
|
||||
define <16 x i8> @var_ctlz_v16i8u(<16 x i8> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v16i8u':
|
||||
; SSE2: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 48 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 48 for instruction: %ctlz
|
||||
%ctlz = call <16 x i8> @llvm.ctlz.v16i8(<16 x i8> %a, i1 1)
|
||||
ret <16 x i8> %ctlz
|
||||
@ -273,10 +229,8 @@ define <16 x i8> @var_ctlz_v16i8u(<16 x i8> %a) {
|
||||
|
||||
define <32 x i8> @var_ctlz_v32i8(<32 x i8> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v32i8':
|
||||
; SSE2: Found an estimated cost of 96 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 96 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 96 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 96 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 96 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 96 for instruction: %ctlz
|
||||
%ctlz = call <32 x i8> @llvm.ctlz.v32i8(<32 x i8> %a, i1 0)
|
||||
ret <32 x i8> %ctlz
|
||||
@ -284,10 +238,8 @@ define <32 x i8> @var_ctlz_v32i8(<32 x i8> %a) {
|
||||
|
||||
define <32 x i8> @var_ctlz_v32i8u(<32 x i8> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_ctlz_v32i8u':
|
||||
; SSE2: Found an estimated cost of 96 for instruction: %ctlz
|
||||
; SSE42: Found an estimated cost of 96 for instruction: %ctlz
|
||||
; SSE: Found an estimated cost of 96 for instruction: %ctlz
|
||||
; AVX: Found an estimated cost of 96 for instruction: %ctlz
|
||||
; AVX2: Found an estimated cost of 96 for instruction: %ctlz
|
||||
; XOP: Found an estimated cost of 96 for instruction: %ctlz
|
||||
%ctlz = call <32 x i8> @llvm.ctlz.v32i8(<32 x i8> %a, i1 1)
|
||||
ret <32 x i8> %ctlz
|
||||
@ -307,10 +259,8 @@ declare <32 x i8> @llvm.cttz.v32i8(<32 x i8>, i1)
|
||||
|
||||
define <2 x i64> @var_cttz_v2i64(<2 x i64> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v2i64':
|
||||
; SSE2: Found an estimated cost of 6 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 6 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 6 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 6 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 6 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 6 for instruction: %cttz
|
||||
%cttz = call <2 x i64> @llvm.cttz.v2i64(<2 x i64> %a, i1 0)
|
||||
ret <2 x i64> %cttz
|
||||
@ -318,10 +268,8 @@ define <2 x i64> @var_cttz_v2i64(<2 x i64> %a) {
|
||||
|
||||
define <2 x i64> @var_cttz_v2i64u(<2 x i64> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v2i64u':
|
||||
; SSE2: Found an estimated cost of 6 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 6 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 6 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 6 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 6 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 6 for instruction: %cttz
|
||||
%cttz = call <2 x i64> @llvm.cttz.v2i64(<2 x i64> %a, i1 1)
|
||||
ret <2 x i64> %cttz
|
||||
@ -329,10 +277,8 @@ define <2 x i64> @var_cttz_v2i64u(<2 x i64> %a) {
|
||||
|
||||
define <4 x i64> @var_cttz_v4i64(<4 x i64> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v4i64':
|
||||
; SSE2: Found an estimated cost of 12 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 12 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 12 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 12 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 12 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 12 for instruction: %cttz
|
||||
%cttz = call <4 x i64> @llvm.cttz.v4i64(<4 x i64> %a, i1 0)
|
||||
ret <4 x i64> %cttz
|
||||
@ -340,10 +286,8 @@ define <4 x i64> @var_cttz_v4i64(<4 x i64> %a) {
|
||||
|
||||
define <4 x i64> @var_cttz_v4i64u(<4 x i64> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v4i64u':
|
||||
; SSE2: Found an estimated cost of 12 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 12 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 12 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 12 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 12 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 12 for instruction: %cttz
|
||||
%cttz = call <4 x i64> @llvm.cttz.v4i64(<4 x i64> %a, i1 1)
|
||||
ret <4 x i64> %cttz
|
||||
@ -351,10 +295,8 @@ define <4 x i64> @var_cttz_v4i64u(<4 x i64> %a) {
|
||||
|
||||
define <4 x i32> @var_cttz_v4i32(<4 x i32> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v4i32':
|
||||
; SSE2: Found an estimated cost of 12 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 12 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 12 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 12 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 12 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 12 for instruction: %cttz
|
||||
%cttz = call <4 x i32> @llvm.cttz.v4i32(<4 x i32> %a, i1 0)
|
||||
ret <4 x i32> %cttz
|
||||
@ -362,10 +304,8 @@ define <4 x i32> @var_cttz_v4i32(<4 x i32> %a) {
|
||||
|
||||
define <4 x i32> @var_cttz_v4i32u(<4 x i32> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v4i32u':
|
||||
; SSE2: Found an estimated cost of 12 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 12 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 12 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 12 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 12 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 12 for instruction: %cttz
|
||||
%cttz = call <4 x i32> @llvm.cttz.v4i32(<4 x i32> %a, i1 1)
|
||||
ret <4 x i32> %cttz
|
||||
@ -373,10 +313,8 @@ define <4 x i32> @var_cttz_v4i32u(<4 x i32> %a) {
|
||||
|
||||
define <8 x i32> @var_cttz_v8i32(<8 x i32> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v8i32':
|
||||
; SSE2: Found an estimated cost of 24 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 24 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 24 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 24 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 24 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 24 for instruction: %cttz
|
||||
%cttz = call <8 x i32> @llvm.cttz.v8i32(<8 x i32> %a, i1 0)
|
||||
ret <8 x i32> %cttz
|
||||
@ -384,10 +322,8 @@ define <8 x i32> @var_cttz_v8i32(<8 x i32> %a) {
|
||||
|
||||
define <8 x i32> @var_cttz_v8i32u(<8 x i32> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v8i32u':
|
||||
; SSE2: Found an estimated cost of 24 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 24 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 24 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 24 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 24 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 24 for instruction: %cttz
|
||||
%cttz = call <8 x i32> @llvm.cttz.v8i32(<8 x i32> %a, i1 1)
|
||||
ret <8 x i32> %cttz
|
||||
@ -395,10 +331,8 @@ define <8 x i32> @var_cttz_v8i32u(<8 x i32> %a) {
|
||||
|
||||
define <8 x i16> @var_cttz_v8i16(<8 x i16> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v8i16':
|
||||
; SSE2: Found an estimated cost of 24 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 24 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 24 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 24 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 24 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 24 for instruction: %cttz
|
||||
%cttz = call <8 x i16> @llvm.cttz.v8i16(<8 x i16> %a, i1 0)
|
||||
ret <8 x i16> %cttz
|
||||
@ -406,10 +340,8 @@ define <8 x i16> @var_cttz_v8i16(<8 x i16> %a) {
|
||||
|
||||
define <8 x i16> @var_cttz_v8i16u(<8 x i16> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v8i16u':
|
||||
; SSE2: Found an estimated cost of 24 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 24 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 24 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 24 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 24 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 24 for instruction: %cttz
|
||||
%cttz = call <8 x i16> @llvm.cttz.v8i16(<8 x i16> %a, i1 1)
|
||||
ret <8 x i16> %cttz
|
||||
@ -417,10 +349,8 @@ define <8 x i16> @var_cttz_v8i16u(<8 x i16> %a) {
|
||||
|
||||
define <16 x i16> @var_cttz_v16i16(<16 x i16> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v16i16':
|
||||
; SSE2: Found an estimated cost of 48 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 48 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 48 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 48 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 48 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 48 for instruction: %cttz
|
||||
%cttz = call <16 x i16> @llvm.cttz.v16i16(<16 x i16> %a, i1 0)
|
||||
ret <16 x i16> %cttz
|
||||
@ -428,10 +358,8 @@ define <16 x i16> @var_cttz_v16i16(<16 x i16> %a) {
|
||||
|
||||
define <16 x i16> @var_cttz_v16i16u(<16 x i16> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v16i16u':
|
||||
; SSE2: Found an estimated cost of 48 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 48 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 48 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 48 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 48 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 48 for instruction: %cttz
|
||||
%cttz = call <16 x i16> @llvm.cttz.v16i16(<16 x i16> %a, i1 1)
|
||||
ret <16 x i16> %cttz
|
||||
@ -439,10 +367,8 @@ define <16 x i16> @var_cttz_v16i16u(<16 x i16> %a) {
|
||||
|
||||
define <16 x i8> @var_cttz_v16i8(<16 x i8> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v16i8':
|
||||
; SSE2: Found an estimated cost of 48 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 48 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 48 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 48 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 48 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 48 for instruction: %cttz
|
||||
%cttz = call <16 x i8> @llvm.cttz.v16i8(<16 x i8> %a, i1 0)
|
||||
ret <16 x i8> %cttz
|
||||
@ -450,10 +376,8 @@ define <16 x i8> @var_cttz_v16i8(<16 x i8> %a) {
|
||||
|
||||
define <16 x i8> @var_cttz_v16i8u(<16 x i8> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v16i8u':
|
||||
; SSE2: Found an estimated cost of 48 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 48 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 48 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 48 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 48 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 48 for instruction: %cttz
|
||||
%cttz = call <16 x i8> @llvm.cttz.v16i8(<16 x i8> %a, i1 1)
|
||||
ret <16 x i8> %cttz
|
||||
@ -461,10 +385,8 @@ define <16 x i8> @var_cttz_v16i8u(<16 x i8> %a) {
|
||||
|
||||
define <32 x i8> @var_cttz_v32i8(<32 x i8> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v32i8':
|
||||
; SSE2: Found an estimated cost of 96 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 96 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 96 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 96 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 96 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 96 for instruction: %cttz
|
||||
%cttz = call <32 x i8> @llvm.cttz.v32i8(<32 x i8> %a, i1 0)
|
||||
ret <32 x i8> %cttz
|
||||
@ -472,10 +394,8 @@ define <32 x i8> @var_cttz_v32i8(<32 x i8> %a) {
|
||||
|
||||
define <32 x i8> @var_cttz_v32i8u(<32 x i8> %a) {
|
||||
; CHECK: 'Cost Model Analysis' for function 'var_cttz_v32i8u':
|
||||
; SSE2: Found an estimated cost of 96 for instruction: %cttz
|
||||
; SSE42: Found an estimated cost of 96 for instruction: %cttz
|
||||
; SSE: Found an estimated cost of 96 for instruction: %cttz
|
||||
; AVX: Found an estimated cost of 96 for instruction: %cttz
|
||||
; AVX2: Found an estimated cost of 96 for instruction: %cttz
|
||||
; XOP: Found an estimated cost of 96 for instruction: %cttz
|
||||
%cttz = call <32 x i8> @llvm.cttz.v32i8(<32 x i8> %a, i1 1)
|
||||
ret <32 x i8> %cttz
|
||||
|
Loading…
Reference in New Issue
Block a user