| ; RUN: llc < %s -march=x86-64 -mattr=+ssse3,-avx | FileCheck %s -check-prefix=SSSE3 |
| ; RUN: llc < %s -march=x86-64 -mattr=-ssse3,+avx | FileCheck %s -check-prefix=AVX |
| |
| ; SSSE3: phaddw1: |
| ; SSSE3-NOT: vphaddw |
| ; SSSE3: phaddw |
| ; AVX: phaddw1: |
| ; AVX: vphaddw |
| define <8 x i16> @phaddw1(<8 x i16> %x, <8 x i16> %y) { |
| %a = shufflevector <8 x i16> %x, <8 x i16> %y, <8 x i32> <i32 0, i32 2, i32 4, i32 6, i32 8, i32 10, i32 12, i32 14> |
| %b = shufflevector <8 x i16> %x, <8 x i16> %y, <8 x i32> <i32 1, i32 3, i32 5, i32 7, i32 9, i32 11, i32 13, i32 15> |
| %r = add <8 x i16> %a, %b |
| ret <8 x i16> %r |
| } |
| |
| ; SSSE3: phaddw2: |
| ; SSSE3-NOT: vphaddw |
| ; SSSE3: phaddw |
| ; AVX: phaddw2: |
| ; AVX: vphaddw |
| define <8 x i16> @phaddw2(<8 x i16> %x, <8 x i16> %y) { |
| %a = shufflevector <8 x i16> %x, <8 x i16> %y, <8 x i32> <i32 1, i32 2, i32 5, i32 6, i32 9, i32 10, i32 13, i32 14> |
| %b = shufflevector <8 x i16> %y, <8 x i16> %x, <8 x i32> <i32 8, i32 11, i32 12, i32 15, i32 0, i32 3, i32 4, i32 7> |
| %r = add <8 x i16> %a, %b |
| ret <8 x i16> %r |
| } |
| |
| ; SSSE3: phaddd1: |
| ; SSSE3-NOT: vphaddd |
| ; SSSE3: phaddd |
| ; AVX: phaddd1: |
| ; AVX: vphaddd |
| define <4 x i32> @phaddd1(<4 x i32> %x, <4 x i32> %y) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> %y, <4 x i32> <i32 0, i32 2, i32 4, i32 6> |
| %b = shufflevector <4 x i32> %x, <4 x i32> %y, <4 x i32> <i32 1, i32 3, i32 5, i32 7> |
| %r = add <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |
| |
| ; SSSE3: phaddd2: |
| ; SSSE3-NOT: vphaddd |
| ; SSSE3: phaddd |
| ; AVX: phaddd2: |
| ; AVX: vphaddd |
| define <4 x i32> @phaddd2(<4 x i32> %x, <4 x i32> %y) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> %y, <4 x i32> <i32 1, i32 2, i32 5, i32 6> |
| %b = shufflevector <4 x i32> %y, <4 x i32> %x, <4 x i32> <i32 4, i32 7, i32 0, i32 3> |
| %r = add <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |
| |
| ; SSSE3: phaddd3: |
| ; SSSE3-NOT: vphaddd |
| ; SSSE3: phaddd |
| ; AVX: phaddd3: |
| ; AVX: vphaddd |
| define <4 x i32> @phaddd3(<4 x i32> %x) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 2, i32 4, i32 6> |
| %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 3, i32 5, i32 7> |
| %r = add <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |
| |
| ; SSSE3: phaddd4: |
| ; SSSE3-NOT: vphaddd |
| ; SSSE3: phaddd |
| ; AVX: phaddd4: |
| ; AVX: vphaddd |
| define <4 x i32> @phaddd4(<4 x i32> %x) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 0, i32 2, i32 undef, i32 undef> |
| %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 undef, i32 undef> |
| %r = add <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |
| |
| ; SSSE3: phaddd5: |
| ; SSSE3-NOT: vphaddd |
| ; SSSE3: phaddd |
| ; AVX: phaddd5: |
| ; AVX: vphaddd |
| define <4 x i32> @phaddd5(<4 x i32> %x) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 0, i32 3, i32 undef, i32 undef> |
| %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 undef, i32 undef> |
| %r = add <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |
| |
| ; SSSE3: phaddd6: |
| ; SSSE3-NOT: vphaddd |
| ; SSSE3: phaddd |
| ; AVX: phaddd6: |
| ; AVX: vphaddd |
| define <4 x i32> @phaddd6(<4 x i32> %x) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 0, i32 undef, i32 undef, i32 undef> |
| %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 1, i32 undef, i32 undef, i32 undef> |
| %r = add <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |
| |
| ; SSSE3: phaddd7: |
| ; SSSE3-NOT: vphaddd |
| ; SSSE3: phaddd |
| ; AVX: phaddd7: |
| ; AVX: vphaddd |
| define <4 x i32> @phaddd7(<4 x i32> %x) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 3, i32 undef, i32 undef> |
| %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 2, i32 undef, i32 undef> |
| %r = add <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |
| |
| ; SSSE3: phsubw1: |
| ; SSSE3-NOT: vphsubw |
| ; SSSE3: phsubw |
| ; AVX: phsubw1: |
| ; AVX: vphsubw |
| define <8 x i16> @phsubw1(<8 x i16> %x, <8 x i16> %y) { |
| %a = shufflevector <8 x i16> %x, <8 x i16> %y, <8 x i32> <i32 0, i32 2, i32 4, i32 6, i32 8, i32 10, i32 12, i32 14> |
| %b = shufflevector <8 x i16> %x, <8 x i16> %y, <8 x i32> <i32 1, i32 3, i32 5, i32 7, i32 9, i32 11, i32 13, i32 15> |
| %r = sub <8 x i16> %a, %b |
| ret <8 x i16> %r |
| } |
| |
| ; SSSE3: phsubd1: |
| ; SSSE3-NOT: vphsubd |
| ; SSSE3: phsubd |
| ; AVX: phsubd1: |
| ; AVX: vphsubd |
| define <4 x i32> @phsubd1(<4 x i32> %x, <4 x i32> %y) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> %y, <4 x i32> <i32 0, i32 2, i32 4, i32 6> |
| %b = shufflevector <4 x i32> %x, <4 x i32> %y, <4 x i32> <i32 1, i32 3, i32 5, i32 7> |
| %r = sub <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |
| |
| ; SSSE3: phsubd2: |
| ; SSSE3-NOT: vphsubd |
| ; SSSE3: phsubd |
| ; AVX: phsubd2: |
| ; AVX: vphsubd |
| define <4 x i32> @phsubd2(<4 x i32> %x) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 2, i32 4, i32 6> |
| %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 undef, i32 3, i32 5, i32 7> |
| %r = sub <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |
| |
| ; SSSE3: phsubd3: |
| ; SSSE3-NOT: vphsubd |
| ; SSSE3: phsubd |
| ; AVX: phsubd3: |
| ; AVX: vphsubd |
| define <4 x i32> @phsubd3(<4 x i32> %x) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 0, i32 2, i32 undef, i32 undef> |
| %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 undef, i32 undef> |
| %r = sub <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |
| |
| ; SSSE3: phsubd4: |
| ; SSSE3-NOT: vphsubd |
| ; SSSE3: phsubd |
| ; AVX: phsubd4: |
| ; AVX: vphsubd |
| define <4 x i32> @phsubd4(<4 x i32> %x) { |
| %a = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 0, i32 undef, i32 undef, i32 undef> |
| %b = shufflevector <4 x i32> %x, <4 x i32> undef, <4 x i32> <i32 1, i32 undef, i32 undef, i32 undef> |
| %r = sub <4 x i32> %a, %b |
| ret <4 x i32> %r |
| } |