X-Git-Url: http://plrg.eecs.uci.edu/git/?a=blobdiff_plain;f=test%2FCodeGen%2FX86%2Ffast-isel-x86-64.ll;h=d748cba2f8f80e9aa4027b3587e72067b38ad3ad;hb=3791d56da63baf5072fa6ecaa872ace6adbc6892;hp=d45a54fb1423a21aac8309684c8d25b53dd27d67;hpb=b686af053e6544191420978f6a3adc7e74ab0192;p=oota-llvm.git diff --git a/test/CodeGen/X86/fast-isel-x86-64.ll b/test/CodeGen/X86/fast-isel-x86-64.ll index d45a54fb142..d748cba2f8f 100644 --- a/test/CodeGen/X86/fast-isel-x86-64.ll +++ b/test/CodeGen/X86/fast-isel-x86-64.ll @@ -1,4 +1,5 @@ -; RUN: llc < %s -fast-isel -O0 -regalloc=fast -asm-verbose=0 -fast-isel-abort | FileCheck %s +; RUN: llc < %s -mattr=-avx -fast-isel -mcpu=core2 -O0 -regalloc=fast -asm-verbose=0 -fast-isel-abort=1 | FileCheck %s +; RUN: llc < %s -mattr=+avx -fast-isel -mcpu=core2 -O0 -regalloc=fast -asm-verbose=0 -fast-isel-abort=1 | FileCheck %s --check-prefix=AVX target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64" target triple = "x86_64-apple-darwin10.0.0" @@ -10,7 +11,7 @@ define i32 @test1(i32 %i) nounwind ssp { ret i32 %and } -; CHECK: test1: +; CHECK-LABEL: test1: ; CHECK: andl $8, @@ -19,7 +20,7 @@ define void @test2(i64 %x) nounwind ssp { entry: %x.addr = alloca i64, align 8 store i64 %x, i64* %x.addr, align 8 - %tmp = load i64* %x.addr, align 8 + %tmp = load i64, i64* %x.addr, align 8 %cmp = icmp sgt i64 %tmp, 42 br i1 %cmp, label %if.then, label %if.end @@ -28,7 +29,7 @@ if.then: ; preds = %entry if.end: ; preds = %if.then, %entry ret void -; CHECK: test2: +; CHECK-LABEL: test2: ; CHECK: movq %rdi, -8(%rsp) ; CHECK: cmpq $42, -8(%rsp) } @@ -40,7 +41,7 @@ if.end: ; preds = %if.then, %entry define i64 @test3() nounwind { %A = ptrtoint i32* @G to i64 ret i64 %A -; CHECK: test3: +; CHECK-LABEL: test3: ; CHECK: movq _G@GOTPCREL(%rip), %rax ; CHECK-NEXT: ret } @@ -51,12 +52,12 @@ define i64 @test3() nounwind { @rtx_length = external global [153 x i8] define i32 @test4(i64 %idxprom9) nounwind { - %arrayidx10 = getelementptr inbounds [153 x i8]* @rtx_length, i32 0, i64 %idxprom9 - %tmp11 = load i8* %arrayidx10, align 1 + %arrayidx10 = getelementptr inbounds [153 x i8], [153 x i8]* @rtx_length, i32 0, i64 %idxprom9 + %tmp11 = load i8, i8* %arrayidx10, align 1 %conv = zext i8 %tmp11 to i32 ret i32 %conv -; CHECK: test4: +; CHECK-LABEL: test4: ; CHECK: movq _rtx_length@GOTPCREL(%rip), %rax ; CHECK-NEXT: movzbl (%rax,%rdi), %eax ; CHECK-NEXT: ret @@ -69,7 +70,7 @@ define void @test5(i32 %x, i32* %p) nounwind { store i32 %y, i32* %p ret void -; CHECK: test5: +; CHECK-LABEL: test5: ; CHECK: movl $50000, %ecx ; CHECK: sarl %cl, %edi ; CHECK: ret @@ -81,16 +82,16 @@ entry: %mul = mul nsw i64 %x, 8 ret i64 %mul -; CHECK: test6: -; CHECK: leaq (,%rdi,8), %rax +; CHECK-LABEL: test6: +; CHECK: shlq $3, %rdi } define i32 @test7(i32 %x) nounwind ssp { entry: %mul = mul nsw i32 %x, 8 ret i32 %mul -; CHECK: test7: -; CHECK: leal (,%rdi,8), %eax +; CHECK-LABEL: test7: +; CHECK: shll $3, %edi } @@ -100,7 +101,7 @@ entry: %add = add nsw i64 %x, 7 ret i64 %add -; CHECK: test8: +; CHECK-LABEL: test8: ; CHECK: addq $7, %rdi } @@ -108,7 +109,7 @@ define i64 @test9(i64 %x) nounwind ssp { entry: %add = mul nsw i64 %x, 7 ret i64 %add -; CHECK: test9: +; CHECK-LABEL: test9: ; CHECK: imulq $7, %rdi, %rax } @@ -116,14 +117,14 @@ entry: define i32 @test10(i32 %X) nounwind { %Y = udiv i32 %X, 8 ret i32 %Y -; CHECK: test10: +; CHECK-LABEL: test10: ; CHECK: shrl $3, } define i32 @test11(i32 %X) nounwind { %Y = sdiv exact i32 %X, 8 ret i32 %Y -; CHECK: test11: +; CHECK-LABEL: test11: ; CHECK: sarl $3, } @@ -140,10 +141,10 @@ if.then: ; preds = %entry if.end: ; preds = %if.then, %entry ret void -; CHECK: test12: +; CHECK-LABEL: test12: ; CHECK: testb $1, ; CHECK-NEXT: je L -; CHECK-NEXT: movl $0, %edi +; CHECK-NEXT: xorl %edi, %edi ; CHECK-NEXT: callq } @@ -152,8 +153,8 @@ declare void @test13f(i1 %X) define void @test13() nounwind { call void @test13f(i1 0) ret void -; CHECK: test13: -; CHECK: movl $0, %edi +; CHECK-LABEL: test13: +; CHECK: xorl %edi, %edi ; CHECK-NEXT: callq } @@ -165,7 +166,7 @@ entry: %tobool = trunc i8 %tmp to i1 call void @test13f(i1 zeroext %tobool) noredzone ret void -; CHECK: test14: +; CHECK-LABEL: test14: ; CHECK: andb $1, ; CHECK: callq } @@ -176,7 +177,7 @@ declare void @llvm.memcpy.p0i8.p0i8.i64(i8*, i8*, i64, i32, i1) define void @test15(i8* %a, i8* %b) nounwind { call void @llvm.memcpy.p0i8.p0i8.i64(i8* %a, i8* %b, i64 4, i32 4, i1 false) ret void -; CHECK: test15: +; CHECK-LABEL: test15: ; CHECK-NEXT: movl (%rsi), %eax ; CHECK-NEXT: movl %eax, (%rdi) ; CHECK-NEXT: ret @@ -185,19 +186,22 @@ define void @test15(i8* %a, i8* %b) nounwind { ; Handling for varargs calls declare void @test16callee(...) nounwind define void @test16() nounwind { -; CHECK: test16: +; CHECK-LABEL: test16: ; CHECK: movl $1, %edi ; CHECK: movb $0, %al ; CHECK: callq _test16callee - call void (...)* @test16callee(i32 1) + call void (...) @test16callee(i32 1) br label %block2 block2: -; CHECK: movabsq $1 -; CHECK: cvtsi2sdq {{.*}} %xmm0 +; CHECK: movsd LCP{{.*}}_{{.*}}(%rip), %xmm0 ; CHECK: movb $1, %al ; CHECK: callq _test16callee - call void (...)* @test16callee(double 1.000000e+00) + +; AVX: vmovsd LCP{{.*}}_{{.*}}(%rip), %xmm0 +; AVX: movb $1, %al +; AVX: callq _test16callee + call void (...) @test16callee(double 1.000000e+00) ret void } @@ -208,7 +212,7 @@ declare void @foo() unnamed_addr ssp align 2 ; w.r.t. the call. define i32 @test17(i32 *%P) ssp nounwind { entry: - %tmp = load i32* %P + %tmp = load i32, i32* %P %cmp = icmp ne i32 %tmp, 5 call void @foo() br i1 %cmp, label %if.then, label %if.else @@ -218,10 +222,93 @@ if.then: ; preds = %entry if.else: ; preds = %entry ret i32 2 -; CHECK: test17: +; CHECK-LABEL: test17: ; CHECK: movl (%rdi), %eax ; CHECK: callq _foo ; CHECK: cmpl $5, %eax ; CHECK-NEXT: je } +; Check that 0.0 is materialized using xorps +define void @test18(float* %p1) { + store float 0.0, float* %p1 + ret void +; CHECK-LABEL: test18: +; CHECK: xorps +} + +; Without any type hints, doubles use the smaller xorps instead of xorpd. +define void @test19(double* %p1) { + store double 0.0, double* %p1 + ret void +; CHECK-LABEL: test19: +; CHECK: xorps +} + +; Check that we fast-isel sret +%struct.a = type { i64, i64, i64 } +define void @test20() nounwind ssp { +entry: + %tmp = alloca %struct.a, align 8 + call void @test20sret(%struct.a* sret %tmp) + ret void +; CHECK-LABEL: test20: +; CHECK: leaq (%rsp), %rdi +; CHECK: callq _test20sret +} +declare void @test20sret(%struct.a* sret) + +; Check that -0.0 is not materialized using xor +define void @test21(double* %p1) { + store double -0.0, double* %p1 + ret void +; CHECK-LABEL: test21: +; CHECK-NOT: xor +; CHECK: movsd LCPI +} + +; Check that immediate arguments to a function +; do not cause massive spilling and are used +; as immediates just before the call. +define void @test22() nounwind { +entry: + call void @foo22(i32 0) + call void @foo22(i32 1) + call void @foo22(i32 2) + call void @foo22(i32 3) + ret void +; CHECK-LABEL: test22: +; CHECK: xorl %edi, %edi +; CHECK: callq _foo22 +; CHECK: movl $1, %edi +; CHECK: callq _foo22 +; CHECK: movl $2, %edi +; CHECK: callq _foo22 +; CHECK: movl $3, %edi +; CHECK: callq _foo22 +} + +declare void @foo22(i32) + +; PR13563 +define void @test23(i8* noalias sret %result) { + %a = alloca i8 + %b = call i8* @foo23() + ret void +; CHECK-LABEL: test23: +; CHECK: call +; CHECK: movq %rdi, %rax +; CHECK: ret +} + +declare i8* @foo23() + +declare void @takesi32ptr(i32* %arg) + +; CHECK-LABEL: allocamaterialize +define void @allocamaterialize() { + %a = alloca i32 +; CHECK: leaq {{.*}}, %rdi + call void @takesi32ptr(i32* %a) + ret void +}