| ; RUN: opt < %s -cost-model -analyze -mtriple=x86_64-apple-macosx10.8.0 -mcpu=corei7-avx | FileCheck --check-prefix=AVX1 %s |
| ; RUN: opt < %s -cost-model -analyze -mtriple=x86_64-apple-macosx10.8.0 -mcpu=core-avx2 | FileCheck --check-prefix=AVX2 %s |
| |
| target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128" |
| target triple = "x86_64-apple-macosx10.8.0" |
| |
| define i32 @cmp(i32 %arg) { |
| ; -- floats -- |
| ;AVX1: cost of 1 {{.*}} fcmp |
| ;AVX2: cost of 1 {{.*}} fcmp |
| %A = fcmp olt <2 x float> undef, undef |
| ;AVX1: cost of 1 {{.*}} fcmp |
| ;AVX2: cost of 1 {{.*}} fcmp |
| %B = fcmp olt <4 x float> undef, undef |
| ;AVX1: cost of 1 {{.*}} fcmp |
| ;AVX2: cost of 1 {{.*}} fcmp |
| %C = fcmp olt <8 x float> undef, undef |
| ;AVX1: cost of 1 {{.*}} fcmp |
| ;AVX2: cost of 1 {{.*}} fcmp |
| %D = fcmp olt <2 x double> undef, undef |
| ;AVX1: cost of 1 {{.*}} fcmp |
| ;AVX2: cost of 1 {{.*}} fcmp |
| %E = fcmp olt <4 x double> undef, undef |
| |
| ; -- integers -- |
| |
| ;AVX1: cost of 1 {{.*}} icmp |
| ;AVX2: cost of 1 {{.*}} icmp |
| %F = icmp eq <16 x i8> undef, undef |
| ;AVX1: cost of 1 {{.*}} icmp |
| ;AVX2: cost of 1 {{.*}} icmp |
| %G = icmp eq <8 x i16> undef, undef |
| ;AVX1: cost of 1 {{.*}} icmp |
| ;AVX2: cost of 1 {{.*}} icmp |
| %H = icmp eq <4 x i32> undef, undef |
| ;AVX1: cost of 1 {{.*}} icmp |
| ;AVX2: cost of 1 {{.*}} icmp |
| %I = icmp eq <2 x i64> undef, undef |
| ;AVX1: cost of 4 {{.*}} icmp |
| ;AVX2: cost of 1 {{.*}} icmp |
| %J = icmp eq <4 x i64> undef, undef |
| ;AVX1: cost of 4 {{.*}} icmp |
| ;AVX2: cost of 1 {{.*}} icmp |
| %K = icmp eq <8 x i32> undef, undef |
| ;AVX1: cost of 4 {{.*}} icmp |
| ;AVX2: cost of 1 {{.*}} icmp |
| %L = icmp eq <16 x i16> undef, undef |
| ;AVX1: cost of 4 {{.*}} icmp |
| ;AVX2: cost of 1 {{.*}} icmp |
| %M = icmp eq <32 x i8> undef, undef |
| |
| ;CHECK: cost of 0 {{.*}} ret |
| ret i32 undef |
| } |
| |
| |