X-Git-Url: http://plrg.eecs.uci.edu/git/?a=blobdiff_plain;f=test%2FCodeGen%2FAArch64%2Farm64-xaluo.ll;h=71300c4dd2c2634d819e969714d4763d1add83d8;hb=506ed4d4a5ed65f40e1b2d4b68b5f79883c8c3fa;hp=6cffbdeef8a109f784e30668de46cbb9899edc5d;hpb=29f94c72014eaa5d0d3b920686e689e79759cacb;p=oota-llvm.git diff --git a/test/CodeGen/AArch64/arm64-xaluo.ll b/test/CodeGen/AArch64/arm64-xaluo.ll index 6cffbdeef8a..71300c4dd2c 100644 --- a/test/CodeGen/AArch64/arm64-xaluo.ll +++ b/test/CodeGen/AArch64/arm64-xaluo.ll @@ -1,13 +1,14 @@ -; RUN: llc < %s -march=arm64 | FileCheck %s +; RUN: llc -march=arm64 -aarch64-atomic-cfg-tidy=0 < %s | FileCheck %s +; RUN: llc -march=arm64 -aarch64-atomic-cfg-tidy=0 -fast-isel -fast-isel-abort < %s | FileCheck %s ; ; Get the actual value of the overflow bit. ; -define i1 @saddo.i32(i32 %v1, i32 %v2, i32* %res) { +define zeroext i1 @saddo1.i32(i32 %v1, i32 %v2, i32* %res) { entry: -; CHECK-LABEL: saddo.i32 -; CHECK: adds w8, w0, w1 -; CHECK-NEXT: cset w0, vs +; CHECK-LABEL: saddo1.i32 +; CHECK: adds {{w[0-9]+}}, w0, w1 +; CHECK-NEXT: cset {{w[0-9]+}}, vs %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 %v2) %val = extractvalue {i32, i1} %t, 0 %obit = extractvalue {i32, i1} %t, 1 @@ -15,11 +16,64 @@ entry: ret i1 %obit } -define i1 @saddo.i64(i64 %v1, i64 %v2, i64* %res) { +; Test the immediate version. +define zeroext i1 @saddo2.i32(i32 %v1, i32* %res) { entry: -; CHECK-LABEL: saddo.i64 -; CHECK: adds x8, x0, x1 -; CHECK-NEXT: cset w0, vs +; CHECK-LABEL: saddo2.i32 +; CHECK: adds {{w[0-9]+}}, w0, #4 +; CHECK-NEXT: cset {{w[0-9]+}}, vs + %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 4) + %val = extractvalue {i32, i1} %t, 0 + %obit = extractvalue {i32, i1} %t, 1 + store i32 %val, i32* %res + ret i1 %obit +} + +; Test negative immediates. +define zeroext i1 @saddo3.i32(i32 %v1, i32* %res) { +entry: +; CHECK-LABEL: saddo3.i32 +; CHECK: subs {{w[0-9]+}}, w0, #4 +; CHECK-NEXT: cset {{w[0-9]+}}, vs + %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 -4) + %val = extractvalue {i32, i1} %t, 0 + %obit = extractvalue {i32, i1} %t, 1 + store i32 %val, i32* %res + ret i1 %obit +} + +; Test immediates that are too large to be encoded. +define zeroext i1 @saddo4.i32(i32 %v1, i32* %res) { +entry: +; CHECK-LABEL: saddo4.i32 +; CHECK: adds {{w[0-9]+}}, w0, {{w[0-9]+}} +; CHECK-NEXT: cset {{w[0-9]+}}, vs + %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 16777215) + %val = extractvalue {i32, i1} %t, 0 + %obit = extractvalue {i32, i1} %t, 1 + store i32 %val, i32* %res + ret i1 %obit +} + +; Test shift folding. +define zeroext i1 @saddo5.i32(i32 %v1, i32 %v2, i32* %res) { +entry: +; CHECK-LABEL: saddo5.i32 +; CHECK: adds {{w[0-9]+}}, w0, w1 +; CHECK-NEXT: cset {{w[0-9]+}}, vs + %lsl = shl i32 %v2, 16 + %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 %lsl) + %val = extractvalue {i32, i1} %t, 0 + %obit = extractvalue {i32, i1} %t, 1 + store i32 %val, i32* %res + ret i1 %obit +} + +define zeroext i1 @saddo1.i64(i64 %v1, i64 %v2, i64* %res) { +entry: +; CHECK-LABEL: saddo1.i64 +; CHECK: adds {{x[0-9]+}}, x0, x1 +; CHECK-NEXT: cset {{w[0-9]+}}, vs %t = call {i64, i1} @llvm.sadd.with.overflow.i64(i64 %v1, i64 %v2) %val = extractvalue {i64, i1} %t, 0 %obit = extractvalue {i64, i1} %t, 1 @@ -27,11 +81,35 @@ entry: ret i1 %obit } -define i1 @uaddo.i32(i32 %v1, i32 %v2, i32* %res) { +define zeroext i1 @saddo2.i64(i64 %v1, i64* %res) { +entry: +; CHECK-LABEL: saddo2.i64 +; CHECK: adds {{x[0-9]+}}, x0, #4 +; CHECK-NEXT: cset {{w[0-9]+}}, vs + %t = call {i64, i1} @llvm.sadd.with.overflow.i64(i64 %v1, i64 4) + %val = extractvalue {i64, i1} %t, 0 + %obit = extractvalue {i64, i1} %t, 1 + store i64 %val, i64* %res + ret i1 %obit +} + +define zeroext i1 @saddo3.i64(i64 %v1, i64* %res) { +entry: +; CHECK-LABEL: saddo3.i64 +; CHECK: subs {{x[0-9]+}}, x0, #4 +; CHECK-NEXT: cset {{w[0-9]+}}, vs + %t = call {i64, i1} @llvm.sadd.with.overflow.i64(i64 %v1, i64 -4) + %val = extractvalue {i64, i1} %t, 0 + %obit = extractvalue {i64, i1} %t, 1 + store i64 %val, i64* %res + ret i1 %obit +} + +define zeroext i1 @uaddo.i32(i32 %v1, i32 %v2, i32* %res) { entry: ; CHECK-LABEL: uaddo.i32 -; CHECK: adds w8, w0, w1 -; CHECK-NEXT: cset w0, hs +; CHECK: adds {{w[0-9]+}}, w0, w1 +; CHECK-NEXT: cset {{w[0-9]+}}, hs %t = call {i32, i1} @llvm.uadd.with.overflow.i32(i32 %v1, i32 %v2) %val = extractvalue {i32, i1} %t, 0 %obit = extractvalue {i32, i1} %t, 1 @@ -39,11 +117,11 @@ entry: ret i1 %obit } -define i1 @uaddo.i64(i64 %v1, i64 %v2, i64* %res) { +define zeroext i1 @uaddo.i64(i64 %v1, i64 %v2, i64* %res) { entry: ; CHECK-LABEL: uaddo.i64 -; CHECK: adds x8, x0, x1 -; CHECK-NEXT: cset w0, hs +; CHECK: adds {{x[0-9]+}}, x0, x1 +; CHECK-NEXT: cset {{w[0-9]+}}, hs %t = call {i64, i1} @llvm.uadd.with.overflow.i64(i64 %v1, i64 %v2) %val = extractvalue {i64, i1} %t, 0 %obit = extractvalue {i64, i1} %t, 1 @@ -51,11 +129,11 @@ entry: ret i1 %obit } -define i1 @ssubo.i32(i32 %v1, i32 %v2, i32* %res) { +define zeroext i1 @ssubo1.i32(i32 %v1, i32 %v2, i32* %res) { entry: -; CHECK-LABEL: ssubo.i32 -; CHECK: subs w8, w0, w1 -; CHECK-NEXT: cset w0, vs +; CHECK-LABEL: ssubo1.i32 +; CHECK: subs {{w[0-9]+}}, w0, w1 +; CHECK-NEXT: cset {{w[0-9]+}}, vs %t = call {i32, i1} @llvm.ssub.with.overflow.i32(i32 %v1, i32 %v2) %val = extractvalue {i32, i1} %t, 0 %obit = extractvalue {i32, i1} %t, 1 @@ -63,11 +141,23 @@ entry: ret i1 %obit } -define i1 @ssubo.i64(i64 %v1, i64 %v2, i64* %res) { +define zeroext i1 @ssubo2.i32(i32 %v1, i32* %res) { +entry: +; CHECK-LABEL: ssubo2.i32 +; CHECK: adds {{w[0-9]+}}, w0, #4 +; CHECK-NEXT: cset {{w[0-9]+}}, vs + %t = call {i32, i1} @llvm.ssub.with.overflow.i32(i32 %v1, i32 -4) + %val = extractvalue {i32, i1} %t, 0 + %obit = extractvalue {i32, i1} %t, 1 + store i32 %val, i32* %res + ret i1 %obit +} + +define zeroext i1 @ssubo.i64(i64 %v1, i64 %v2, i64* %res) { entry: ; CHECK-LABEL: ssubo.i64 -; CHECK: subs x8, x0, x1 -; CHECK-NEXT: cset w0, vs +; CHECK: subs {{x[0-9]+}}, x0, x1 +; CHECK-NEXT: cset {{w[0-9]+}}, vs %t = call {i64, i1} @llvm.ssub.with.overflow.i64(i64 %v1, i64 %v2) %val = extractvalue {i64, i1} %t, 0 %obit = extractvalue {i64, i1} %t, 1 @@ -75,11 +165,11 @@ entry: ret i1 %obit } -define i1 @usubo.i32(i32 %v1, i32 %v2, i32* %res) { +define zeroext i1 @usubo.i32(i32 %v1, i32 %v2, i32* %res) { entry: ; CHECK-LABEL: usubo.i32 -; CHECK: subs w8, w0, w1 -; CHECK-NEXT: cset w0, lo +; CHECK: subs {{w[0-9]+}}, w0, w1 +; CHECK-NEXT: cset {{w[0-9]+}}, lo %t = call {i32, i1} @llvm.usub.with.overflow.i32(i32 %v1, i32 %v2) %val = extractvalue {i32, i1} %t, 0 %obit = extractvalue {i32, i1} %t, 1 @@ -87,11 +177,11 @@ entry: ret i1 %obit } -define i1 @usubo.i64(i64 %v1, i64 %v2, i64* %res) { +define zeroext i1 @usubo.i64(i64 %v1, i64 %v2, i64* %res) { entry: ; CHECK-LABEL: usubo.i64 -; CHECK: subs x8, x0, x1 -; CHECK-NEXT: cset w0, lo +; CHECK: subs {{x[0-9]+}}, x0, x1 +; CHECK-NEXT: cset {{w[0-9]+}}, lo %t = call {i64, i1} @llvm.usub.with.overflow.i64(i64 %v1, i64 %v2) %val = extractvalue {i64, i1} %t, 0 %obit = extractvalue {i64, i1} %t, 1 @@ -99,13 +189,13 @@ entry: ret i1 %obit } -define i1 @smulo.i32(i32 %v1, i32 %v2, i32* %res) { +define zeroext i1 @smulo.i32(i32 %v1, i32 %v2, i32* %res) { entry: ; CHECK-LABEL: smulo.i32 -; CHECK: smull x8, w0, w1 -; CHECK-NEXT: lsr x9, x8, #32 -; CHECK-NEXT: cmp w9, w8, asr #31 -; CHECK-NEXT: cset w0, ne +; CHECK: smull x[[MREG:[0-9]+]], w0, w1 +; CHECK-NEXT: lsr x[[SREG:[0-9]+]], x[[MREG]], #32 +; CHECK-NEXT: cmp w[[SREG]], w[[MREG]], asr #31 +; CHECK-NEXT: cset {{w[0-9]+}}, ne %t = call {i32, i1} @llvm.smul.with.overflow.i32(i32 %v1, i32 %v2) %val = extractvalue {i32, i1} %t, 0 %obit = extractvalue {i32, i1} %t, 1 @@ -113,13 +203,13 @@ entry: ret i1 %obit } -define i1 @smulo.i64(i64 %v1, i64 %v2, i64* %res) { +define zeroext i1 @smulo.i64(i64 %v1, i64 %v2, i64* %res) { entry: ; CHECK-LABEL: smulo.i64 -; CHECK: mul x8, x0, x1 -; CHECK-NEXT: smulh x9, x0, x1 -; CHECK-NEXT: cmp x9, x8, asr #63 -; CHECK-NEXT: cset w0, ne +; CHECK: mul [[MREG:x[0-9]+]], x0, x1 +; CHECK-NEXT: smulh [[HREG:x[0-9]+]], x0, x1 +; CHECK-NEXT: cmp [[HREG]], [[MREG]], asr #63 +; CHECK-NEXT: cset {{w[0-9]+}}, ne %t = call {i64, i1} @llvm.smul.with.overflow.i64(i64 %v1, i64 %v2) %val = extractvalue {i64, i1} %t, 0 %obit = extractvalue {i64, i1} %t, 1 @@ -127,12 +217,12 @@ entry: ret i1 %obit } -define i1 @umulo.i32(i32 %v1, i32 %v2, i32* %res) { +define zeroext i1 @umulo.i32(i32 %v1, i32 %v2, i32* %res) { entry: ; CHECK-LABEL: umulo.i32 -; CHECK: umull x8, w0, w1 -; CHECK-NEXT: cmp xzr, x8, lsr #32 -; CHECK-NEXT: cset w0, ne +; CHECK: umull [[MREG:x[0-9]+]], w0, w1 +; CHECK-NEXT: cmp xzr, [[MREG]], lsr #32 +; CHECK-NEXT: cset {{w[0-9]+}}, ne %t = call {i32, i1} @llvm.umul.with.overflow.i32(i32 %v1, i32 %v2) %val = extractvalue {i32, i1} %t, 0 %obit = extractvalue {i32, i1} %t, 1 @@ -140,13 +230,12 @@ entry: ret i1 %obit } -define i1 @umulo.i64(i64 %v1, i64 %v2, i64* %res) { +define zeroext i1 @umulo.i64(i64 %v1, i64 %v2, i64* %res) { entry: ; CHECK-LABEL: umulo.i64 -; CHECK: umulh x8, x0, x1 -; CHECK-NEXT: cmp xzr, x8 -; CHECK-NEXT: cset w8, ne -; CHECK-NEXT: mul x9, x0, x1 +; CHECK: umulh [[MREG:x[0-9]+]], x0, x1 +; CHECK-NEXT: cmp xzr, [[MREG]] +; CHECK-NEXT: cset {{w[0-9]+}}, ne %t = call {i64, i1} @llvm.umul.with.overflow.i64(i64 %v1, i64 %v2) %val = extractvalue {i64, i1} %t, 0 %obit = extractvalue {i64, i1} %t, 1 @@ -249,9 +338,9 @@ entry: define i32 @smulo.select.i32(i32 %v1, i32 %v2) { entry: ; CHECK-LABEL: smulo.select.i32 -; CHECK: smull x8, w0, w1 -; CHECK-NEXT: lsr x9, x8, #32 -; CHECK-NEXT: cmp w9, w8, asr #31 +; CHECK: smull x[[MREG:[0-9]+]], w0, w1 +; CHECK-NEXT: lsr x[[SREG:[0-9]+]], x[[MREG]], #32 +; CHECK-NEXT: cmp w[[SREG]], w[[MREG]], asr #31 ; CHECK-NEXT: csel w0, w0, w1, ne %t = call {i32, i1} @llvm.smul.with.overflow.i32(i32 %v1, i32 %v2) %obit = extractvalue {i32, i1} %t, 1 @@ -262,9 +351,9 @@ entry: define i64 @smulo.select.i64(i64 %v1, i64 %v2) { entry: ; CHECK-LABEL: smulo.select.i64 -; CHECK: mul x8, x0, x1 -; CHECK-NEXT: smulh x9, x0, x1 -; CHECK-NEXT: cmp x9, x8, asr #63 +; CHECK: mul [[MREG:x[0-9]+]], x0, x1 +; CHECK-NEXT: smulh [[HREG:x[0-9]+]], x0, x1 +; CHECK-NEXT: cmp [[HREG]], [[MREG]], asr #63 ; CHECK-NEXT: csel x0, x0, x1, ne %t = call {i64, i1} @llvm.smul.with.overflow.i64(i64 %v1, i64 %v2) %obit = extractvalue {i64, i1} %t, 1 @@ -275,8 +364,8 @@ entry: define i32 @umulo.select.i32(i32 %v1, i32 %v2) { entry: ; CHECK-LABEL: umulo.select.i32 -; CHECK: umull x8, w0, w1 -; CHECK-NEXT: cmp xzr, x8, lsr #32 +; CHECK: umull [[MREG:x[0-9]+]], w0, w1 +; CHECK-NEXT: cmp xzr, [[MREG]], lsr #32 ; CHECK-NEXT: csel w0, w0, w1, ne %t = call {i32, i1} @llvm.umul.with.overflow.i32(i32 %v1, i32 %v2) %obit = extractvalue {i32, i1} %t, 1 @@ -287,8 +376,8 @@ entry: define i64 @umulo.select.i64(i64 %v1, i64 %v2) { entry: ; CHECK-LABEL: umulo.select.i64 -; CHECK: umulh x8, x0, x1 -; CHECK-NEXT: cmp xzr, x8 +; CHECK: umulh [[MREG:x[0-9]+]], x0, x1 +; CHECK-NEXT: cmp xzr, [[MREG]] ; CHECK-NEXT: csel x0, x0, x1, ne %t = call {i64, i1} @llvm.umul.with.overflow.i64(i64 %v1, i64 %v2) %obit = extractvalue {i64, i1} %t, 1 @@ -300,7 +389,7 @@ entry: ; ; Check the use of the overflow bit in combination with a branch instruction. ; -define i1 @saddo.br.i32(i32 %v1, i32 %v2) { +define zeroext i1 @saddo.br.i32(i32 %v1, i32 %v2) { entry: ; CHECK-LABEL: saddo.br.i32 ; CHECK: cmn w0, w1 @@ -317,7 +406,7 @@ continue: ret i1 true } -define i1 @saddo.br.i64(i64 %v1, i64 %v2) { +define zeroext i1 @saddo.br.i64(i64 %v1, i64 %v2) { entry: ; CHECK-LABEL: saddo.br.i64 ; CHECK: cmn x0, x1 @@ -334,7 +423,7 @@ continue: ret i1 true } -define i1 @uaddo.br.i32(i32 %v1, i32 %v2) { +define zeroext i1 @uaddo.br.i32(i32 %v1, i32 %v2) { entry: ; CHECK-LABEL: uaddo.br.i32 ; CHECK: cmn w0, w1 @@ -351,7 +440,7 @@ continue: ret i1 true } -define i1 @uaddo.br.i64(i64 %v1, i64 %v2) { +define zeroext i1 @uaddo.br.i64(i64 %v1, i64 %v2) { entry: ; CHECK-LABEL: uaddo.br.i64 ; CHECK: cmn x0, x1 @@ -368,7 +457,7 @@ continue: ret i1 true } -define i1 @ssubo.br.i32(i32 %v1, i32 %v2) { +define zeroext i1 @ssubo.br.i32(i32 %v1, i32 %v2) { entry: ; CHECK-LABEL: ssubo.br.i32 ; CHECK: cmp w0, w1 @@ -385,7 +474,7 @@ continue: ret i1 true } -define i1 @ssubo.br.i64(i64 %v1, i64 %v2) { +define zeroext i1 @ssubo.br.i64(i64 %v1, i64 %v2) { entry: ; CHECK-LABEL: ssubo.br.i64 ; CHECK: cmp x0, x1 @@ -402,7 +491,7 @@ continue: ret i1 true } -define i1 @usubo.br.i32(i32 %v1, i32 %v2) { +define zeroext i1 @usubo.br.i32(i32 %v1, i32 %v2) { entry: ; CHECK-LABEL: usubo.br.i32 ; CHECK: cmp w0, w1 @@ -419,7 +508,7 @@ continue: ret i1 true } -define i1 @usubo.br.i64(i64 %v1, i64 %v2) { +define zeroext i1 @usubo.br.i64(i64 %v1, i64 %v2) { entry: ; CHECK-LABEL: usubo.br.i64 ; CHECK: cmp x0, x1 @@ -436,12 +525,12 @@ continue: ret i1 true } -define i1 @smulo.br.i32(i32 %v1, i32 %v2) { +define zeroext i1 @smulo.br.i32(i32 %v1, i32 %v2) { entry: ; CHECK-LABEL: smulo.br.i32 -; CHECK: smull x8, w0, w1 -; CHECK-NEXT: lsr x9, x8, #32 -; CHECK-NEXT: cmp w9, w8, asr #31 +; CHECK: smull x[[MREG:[0-9]+]], w0, w1 +; CHECK-NEXT: lsr x[[SREG:[0-9]+]], x8, #32 +; CHECK-NEXT: cmp w[[SREG]], w[[MREG]], asr #31 ; CHECK-NEXT: b.eq %t = call {i32, i1} @llvm.smul.with.overflow.i32(i32 %v1, i32 %v2) %val = extractvalue {i32, i1} %t, 0 @@ -455,12 +544,12 @@ continue: ret i1 true } -define i1 @smulo.br.i64(i64 %v1, i64 %v2) { +define zeroext i1 @smulo.br.i64(i64 %v1, i64 %v2) { entry: ; CHECK-LABEL: smulo.br.i64 -; CHECK: mul x8, x0, x1 -; CHECK-NEXT: smulh x9, x0, x1 -; CHECK-NEXT: cmp x9, x8, asr #63 +; CHECK: mul [[MREG:x[0-9]+]], x0, x1 +; CHECK-NEXT: smulh [[HREG:x[0-9]+]], x0, x1 +; CHECK-NEXT: cmp [[HREG]], [[MREG]], asr #63 ; CHECK-NEXT: b.eq %t = call {i64, i1} @llvm.smul.with.overflow.i64(i64 %v1, i64 %v2) %val = extractvalue {i64, i1} %t, 0 @@ -474,11 +563,11 @@ continue: ret i1 true } -define i1 @umulo.br.i32(i32 %v1, i32 %v2) { +define zeroext i1 @umulo.br.i32(i32 %v1, i32 %v2) { entry: ; CHECK-LABEL: umulo.br.i32 -; CHECK: umull x8, w0, w1 -; CHECK-NEXT: cmp xzr, x8, lsr #32 +; CHECK: umull [[MREG:x[0-9]+]], w0, w1 +; CHECK-NEXT: cmp xzr, [[MREG]], lsr #32 ; CHECK-NEXT: b.eq %t = call {i32, i1} @llvm.umul.with.overflow.i32(i32 %v1, i32 %v2) %val = extractvalue {i32, i1} %t, 0 @@ -492,11 +581,11 @@ continue: ret i1 true } -define i1 @umulo.br.i64(i64 %v1, i64 %v2) { +define zeroext i1 @umulo.br.i64(i64 %v1, i64 %v2) { entry: ; CHECK-LABEL: umulo.br.i64 -; CHECK: umulh x8, x0, x1 -; CHECK-NEXT: cbz +; CHECK: umulh [[REG:x[0-9]+]], x0, x1 +; CHECK-NEXT: {{cbz|cmp}} %t = call {i64, i1} @llvm.umul.with.overflow.i64(i64 %v1, i64 %v2) %val = extractvalue {i64, i1} %t, 0 %obit = extractvalue {i64, i1} %t, 1