X-Git-Url: http://plrg.eecs.uci.edu/git/?a=blobdiff_plain;ds=sidebyside;f=test%2FCodeGen%2FX86%2Fviabs.ll;h=fe528fd4ea24f982c98932a4cc3aa9415b7be95b;hb=90c9a16dbfa347016977fa49b0cfe0db438a9504;hp=f748a14836c8f5086605d26bd68521edaa77cb48;hpb=fdfdd4cf8257c1a0ba0eec3d08f4e73f61c9cf62;p=oota-llvm.git diff --git a/test/CodeGen/X86/viabs.ll b/test/CodeGen/X86/viabs.ll index f748a14836c..fe528fd4ea2 100644 --- a/test/CodeGen/X86/viabs.ll +++ b/test/CodeGen/X86/viabs.ll @@ -1,22 +1,27 @@ -; RUN: llc < %s -march=x86-64 -mcpu=x86-64 | FileCheck %s -check-prefix=SSE2 -; RUN: llc < %s -march=x86-64 -mcpu=corei7 | FileCheck %s -check-prefix=SSSE3 -; RUN: llc < %s -march=x86-64 -mcpu=core-avx2 | FileCheck %s -check-prefix=AVX2 +; RUN: llc < %s -march=x86-64 -mattr=sse2 | FileCheck %s -check-prefix=SSE2 +; RUN: llc < %s -march=x86-64 -mattr=ssse3 | FileCheck %s -check-prefix=SSSE3 +; RUN: llc < %s -march=x86-64 -mattr=avx2 | FileCheck %s -check-prefix=AVX2 +; RUN: llc < %s -march=x86-64 -mattr=avx512f | FileCheck %s -check-prefix=AVX512 define <4 x i32> @test1(<4 x i32> %a) nounwind { -; SSE2: test1: +; SSE2-LABEL: test1: ; SSE2: movdqa ; SSE2: psrad $31 ; SSE2-NEXT: padd ; SSE2-NEXT: pxor ; SSE2-NEXT: ret -; SSSE3: test1: +; SSSE3-LABEL: test1: ; SSSE3: pabsd ; SSSE3-NEXT: ret -; AVX2: test1: +; AVX2-LABEL: test1: ; AVX2: vpabsd ; AVX2-NEXT: ret + +; AVX512-LABEL: test1: +; AVX512: vpabsd +; AVX512-NEXT: ret %tmp1neg = sub <4 x i32> zeroinitializer, %a %b = icmp sgt <4 x i32> %a, %abs = select <4 x i1> %b, <4 x i32> %a, <4 x i32> %tmp1neg @@ -24,20 +29,24 @@ define <4 x i32> @test1(<4 x i32> %a) nounwind { } define <4 x i32> @test2(<4 x i32> %a) nounwind { -; SSE2: test2: +; SSE2-LABEL: test2: ; SSE2: movdqa ; SSE2: psrad $31 ; SSE2-NEXT: padd ; SSE2-NEXT: pxor ; SSE2-NEXT: ret -; SSSE3: test2: +; SSSE3-LABEL: test2: ; SSSE3: pabsd ; SSSE3-NEXT: ret -; AVX2: test2: +; AVX2-LABEL: test2: ; AVX2: vpabsd ; AVX2-NEXT: ret + +; AVX512-LABEL: test2: +; AVX512: vpabsd +; AVX512-NEXT: ret %tmp1neg = sub <4 x i32> zeroinitializer, %a %b = icmp sge <4 x i32> %a, zeroinitializer %abs = select <4 x i1> %b, <4 x i32> %a, <4 x i32> %tmp1neg @@ -45,20 +54,24 @@ define <4 x i32> @test2(<4 x i32> %a) nounwind { } define <8 x i16> @test3(<8 x i16> %a) nounwind { -; SSE2: test3: +; SSE2-LABEL: test3: ; SSE2: movdqa ; SSE2: psraw $15 ; SSE2-NEXT: padd ; SSE2-NEXT: pxor ; SSE2-NEXT: ret -; SSSE3: test3: +; SSSE3-LABEL: test3: ; SSSE3: pabsw ; SSSE3-NEXT: ret -; AVX2: test3: +; AVX2-LABEL: test3: ; AVX2: vpabsw ; AVX2-NEXT: ret + +; AVX512-LABEL: test3: +; AVX512: vpabsw +; AVX512-NEXT: ret %tmp1neg = sub <8 x i16> zeroinitializer, %a %b = icmp sgt <8 x i16> %a, zeroinitializer %abs = select <8 x i1> %b, <8 x i16> %a, <8 x i16> %tmp1neg @@ -66,20 +79,24 @@ define <8 x i16> @test3(<8 x i16> %a) nounwind { } define <16 x i8> @test4(<16 x i8> %a) nounwind { -; SSE2: test4: +; SSE2-LABEL: test4: ; SSE2: pxor ; SSE2: pcmpgtb ; SSE2-NEXT: padd ; SSE2-NEXT: pxor ; SSE2-NEXT: ret -; SSSE3: test4: +; SSSE3-LABEL: test4: ; SSSE3: pabsb ; SSSE3-NEXT: ret -; AVX2: test4: +; AVX2-LABEL: test4: ; AVX2: vpabsb ; AVX2-NEXT: ret + +; AVX512-LABEL: test4: +; AVX512: vpabsb +; AVX512-NEXT: ret %tmp1neg = sub <16 x i8> zeroinitializer, %a %b = icmp slt <16 x i8> %a, zeroinitializer %abs = select <16 x i1> %b, <16 x i8> %tmp1neg, <16 x i8> %a @@ -87,20 +104,24 @@ define <16 x i8> @test4(<16 x i8> %a) nounwind { } define <4 x i32> @test5(<4 x i32> %a) nounwind { -; SSE2: test5: +; SSE2-LABEL: test5: ; SSE2: movdqa ; SSE2: psrad $31 ; SSE2-NEXT: padd ; SSE2-NEXT: pxor ; SSE2-NEXT: ret -; SSSE3: test5: +; SSSE3-LABEL: test5: ; SSSE3: pabsd ; SSSE3-NEXT: ret -; AVX2: test5: +; AVX2-LABEL: test5: ; AVX2: vpabsd ; AVX2-NEXT: ret + +; AVX512-LABEL: test5: +; AVX512: vpabsd +; AVX512-NEXT: ret %tmp1neg = sub <4 x i32> zeroinitializer, %a %b = icmp sle <4 x i32> %a, zeroinitializer %abs = select <4 x i1> %b, <4 x i32> %tmp1neg, <4 x i32> %a @@ -108,14 +129,18 @@ define <4 x i32> @test5(<4 x i32> %a) nounwind { } define <8 x i32> @test6(<8 x i32> %a) nounwind { -; SSSE3: test6: +; SSSE3-LABEL: test6: ; SSSE3: pabsd ; SSSE3: pabsd ; SSSE3-NEXT: ret -; AVX2: test6: +; AVX2-LABEL: test6: ; AVX2: vpabsd {{.*}}%ymm ; AVX2-NEXT: ret + +; AVX512-LABEL: test6: +; AVX512: vpabsd {{.*}}%ymm +; AVX512-NEXT: ret %tmp1neg = sub <8 x i32> zeroinitializer, %a %b = icmp sgt <8 x i32> %a, %abs = select <8 x i1> %b, <8 x i32> %a, <8 x i32> %tmp1neg @@ -123,14 +148,18 @@ define <8 x i32> @test6(<8 x i32> %a) nounwind { } define <8 x i32> @test7(<8 x i32> %a) nounwind { -; SSSE3: test7: +; SSSE3-LABEL: test7: ; SSSE3: pabsd ; SSSE3: pabsd ; SSSE3-NEXT: ret -; AVX2: test7: +; AVX2-LABEL: test7: ; AVX2: vpabsd {{.*}}%ymm ; AVX2-NEXT: ret + +; AVX512-LABEL: test7: +; AVX512: vpabsd {{.*}}%ymm +; AVX512-NEXT: ret %tmp1neg = sub <8 x i32> zeroinitializer, %a %b = icmp sge <8 x i32> %a, zeroinitializer %abs = select <8 x i1> %b, <8 x i32> %a, <8 x i32> %tmp1neg @@ -138,14 +167,18 @@ define <8 x i32> @test7(<8 x i32> %a) nounwind { } define <16 x i16> @test8(<16 x i16> %a) nounwind { -; SSSE3: test8: +; SSSE3-LABEL: test8: ; SSSE3: pabsw ; SSSE3: pabsw ; SSSE3-NEXT: ret -; AVX2: test8: +; AVX2-LABEL: test8: ; AVX2: vpabsw {{.*}}%ymm ; AVX2-NEXT: ret + +; AVX512-LABEL: test8: +; AVX512: vpabsw {{.*}}%ymm +; AVX512-NEXT: ret %tmp1neg = sub <16 x i16> zeroinitializer, %a %b = icmp sgt <16 x i16> %a, zeroinitializer %abs = select <16 x i1> %b, <16 x i16> %a, <16 x i16> %tmp1neg @@ -153,14 +186,18 @@ define <16 x i16> @test8(<16 x i16> %a) nounwind { } define <32 x i8> @test9(<32 x i8> %a) nounwind { -; SSSE3: test9: +; SSSE3-LABEL: test9: ; SSSE3: pabsb ; SSSE3: pabsb ; SSSE3-NEXT: ret -; AVX2: test9: +; AVX2-LABEL: test9: ; AVX2: vpabsb {{.*}}%ymm ; AVX2-NEXT: ret + +; AVX512-LABEL: test9: +; AVX512: vpabsb {{.*}}%ymm +; AVX512-NEXT: ret %tmp1neg = sub <32 x i8> zeroinitializer, %a %b = icmp slt <32 x i8> %a, zeroinitializer %abs = select <32 x i1> %b, <32 x i8> %tmp1neg, <32 x i8> %a @@ -168,16 +205,66 @@ define <32 x i8> @test9(<32 x i8> %a) nounwind { } define <8 x i32> @test10(<8 x i32> %a) nounwind { -; SSSE3: test10: +; SSSE3-LABEL: test10: ; SSSE3: pabsd ; SSSE3: pabsd ; SSSE3-NEXT: ret -; AVX2: test10: +; AVX2-LABEL: test10: ; AVX2: vpabsd {{.*}}%ymm ; AVX2-NEXT: ret + +; AVX512-LABEL: test10: +; AVX512: vpabsd {{.*}}%ymm +; AVX512-NEXT: ret %tmp1neg = sub <8 x i32> zeroinitializer, %a %b = icmp sle <8 x i32> %a, zeroinitializer %abs = select <8 x i1> %b, <8 x i32> %tmp1neg, <8 x i32> %a ret <8 x i32> %abs } + +define <16 x i32> @test11(<16 x i32> %a) nounwind { +; AVX2-LABEL: test11: +; AVX2: vpabsd +; AVX2: vpabsd +; AVX2-NEXT: ret + +; AVX512-LABEL: test11: +; AVX512: vpabsd {{.*}}%zmm +; AVX512-NEXT: ret + %tmp1neg = sub <16 x i32> zeroinitializer, %a + %b = icmp sle <16 x i32> %a, zeroinitializer + %abs = select <16 x i1> %b, <16 x i32> %tmp1neg, <16 x i32> %a + ret <16 x i32> %abs +} + +define <8 x i64> @test12(<8 x i64> %a) nounwind { +; AVX2-LABEL: test12: +; AVX2: vpxor +; AVX2: vpxor +; AVX2-NEXT: ret + +; AVX512-LABEL: test12: +; AVX512: vpabsq {{.*}}%zmm +; AVX512-NEXT: ret + %tmp1neg = sub <8 x i64> zeroinitializer, %a + %b = icmp sle <8 x i64> %a, zeroinitializer + %abs = select <8 x i1> %b, <8 x i64> %tmp1neg, <8 x i64> %a + ret <8 x i64> %abs +} + +define <8 x i64> @test13(<8 x i64>* %a.ptr) nounwind { +; AVX2-LABEL: test13: +; AVX2: vpxor +; AVX2: vpxor +; AVX2-NEXT: ret + +; AVX512-LABEL: test13: +; AVX512: vpabsq (% +; AVX512-NEXT: ret + %a = load <8 x i64>, <8 x i64>* %a.ptr, align 8 + %tmp1neg = sub <8 x i64> zeroinitializer, %a + %b = icmp sle <8 x i64> %a, zeroinitializer + %abs = select <8 x i1> %b, <8 x i64> %tmp1neg, <8 x i64> %a + ret <8 x i64> %abs +}