diff options
-rw-r--r-- | llvm/test/Transforms/InstCombine/intrinsics.ll | 303 | ||||
-rw-r--r-- | llvm/test/Transforms/InstCombine/with_overflow.ll | 347 |
2 files changed, 347 insertions, 303 deletions
diff --git a/llvm/test/Transforms/InstCombine/intrinsics.ll b/llvm/test/Transforms/InstCombine/intrinsics.ll index 8de892fd81b..157c14bbd95 100644 --- a/llvm/test/Transforms/InstCombine/intrinsics.ll +++ b/llvm/test/Transforms/InstCombine/intrinsics.ll @@ -1,18 +1,6 @@ ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py ; RUN: opt -instcombine -S < %s | FileCheck %s -%overflow.result = type {i8, i1} -%ov.result.32 = type { i32, i1 } - - -declare %overflow.result @llvm.uadd.with.overflow.i8(i8, i8) nounwind readnone -declare %overflow.result @llvm.umul.with.overflow.i8(i8, i8) nounwind readnone -declare %ov.result.32 @llvm.sadd.with.overflow.i32(i32, i32) nounwind readnone -declare %ov.result.32 @llvm.uadd.with.overflow.i32(i32, i32) nounwind readnone -declare %ov.result.32 @llvm.ssub.with.overflow.i32(i32, i32) nounwind readnone -declare %ov.result.32 @llvm.usub.with.overflow.i32(i32, i32) nounwind readnone -declare %ov.result.32 @llvm.smul.with.overflow.i32(i32, i32) nounwind readnone -declare %ov.result.32 @llvm.umul.with.overflow.i32(i32, i32) nounwind readnone declare double @llvm.powi.f64(double, i32) nounwind readonly declare i32 @llvm.cttz.i32(i32, i1) nounwind readnone declare i32 @llvm.ctlz.i32(i32, i1) nounwind readnone @@ -32,232 +20,6 @@ declare double @llvm.trunc.f64(double %Val) nounwind readonly declare double @llvm.rint.f64(double %Val) nounwind readonly declare double @llvm.nearbyint.f64(double %Val) nounwind readonly -define i8 @uaddtest1(i8 %A, i8 %B) { - %x = call %overflow.result @llvm.uadd.with.overflow.i8(i8 %A, i8 %B) - %y = extractvalue %overflow.result %x, 0 - ret i8 %y -; CHECK-LABEL: @uaddtest1( -; CHECK-NEXT: %y = add i8 %A, %B -; CHECK-NEXT: ret i8 %y -} - -define i8 @uaddtest2(i8 %A, i8 %B, i1* %overflowPtr) { - %and.A = and i8 %A, 127 - %and.B = and i8 %B, 127 - %x = call %overflow.result @llvm.uadd.with.overflow.i8(i8 %and.A, i8 %and.B) - %y = extractvalue %overflow.result %x, 0 - %z = extractvalue %overflow.result %x, 1 - store i1 %z, i1* %overflowPtr - ret i8 %y -; CHECK-LABEL: @uaddtest2( -; CHECK-NEXT: %and.A = and i8 %A, 127 -; CHECK-NEXT: %and.B = and i8 %B, 127 -; CHECK-NEXT: %x = add nuw i8 %and.A, %and.B -; CHECK-NEXT: store i1 false, i1* %overflowPtr -; CHECK-NEXT: ret i8 %x -} - -define i8 @uaddtest3(i8 %A, i8 %B, i1* %overflowPtr) { - %or.A = or i8 %A, -128 - %or.B = or i8 %B, -128 - %x = call %overflow.result @llvm.uadd.with.overflow.i8(i8 %or.A, i8 %or.B) - %y = extractvalue %overflow.result %x, 0 - %z = extractvalue %overflow.result %x, 1 - store i1 %z, i1* %overflowPtr - ret i8 %y -; CHECK-LABEL: @uaddtest3( -; CHECK-NEXT: %or.A = or i8 %A, -128 -; CHECK-NEXT: %or.B = or i8 %B, -128 -; CHECK-NEXT: %x = add i8 %or.A, %or.B -; CHECK-NEXT: store i1 true, i1* %overflowPtr -; CHECK-NEXT: ret i8 %x -} - -define i8 @uaddtest4(i8 %A, i1* %overflowPtr) { - %x = call %overflow.result @llvm.uadd.with.overflow.i8(i8 undef, i8 %A) - %y = extractvalue %overflow.result %x, 0 - %z = extractvalue %overflow.result %x, 1 - store i1 %z, i1* %overflowPtr - ret i8 %y -; CHECK-LABEL: @uaddtest4( -; CHECK-NEXT: ret i8 undef -} - -define i8 @uaddtest5(i8 %A, i1* %overflowPtr) { - %x = call %overflow.result @llvm.uadd.with.overflow.i8(i8 0, i8 %A) - %y = extractvalue %overflow.result %x, 0 - %z = extractvalue %overflow.result %x, 1 - store i1 %z, i1* %overflowPtr - ret i8 %y -; CHECK-LABEL: @uaddtest5( -; CHECK: ret i8 %A -} - -define i1 @uaddtest6(i8 %A, i8 %B) { - %x = call %overflow.result @llvm.uadd.with.overflow.i8(i8 %A, i8 -4) - %z = extractvalue %overflow.result %x, 1 - ret i1 %z -; CHECK-LABEL: @uaddtest6( -; CHECK-NEXT: %z = icmp ugt i8 %A, 3 -; CHECK-NEXT: ret i1 %z -} - -define i8 @uaddtest7(i8 %A, i8 %B) { - %x = call %overflow.result @llvm.uadd.with.overflow.i8(i8 %A, i8 %B) - %z = extractvalue %overflow.result %x, 0 - ret i8 %z -; CHECK-LABEL: @uaddtest7( -; CHECK-NEXT: %z = add i8 %A, %B -; CHECK-NEXT: ret i8 %z -} - -; PR20194 -define %ov.result.32 @saddtest_nsw(i8 %a, i8 %b) { - %A = sext i8 %a to i32 - %B = sext i8 %b to i32 - %x = call %ov.result.32 @llvm.sadd.with.overflow.i32(i32 %A, i32 %B) - ret %ov.result.32 %x -; CHECK-LABEL: @saddtest_nsw -; CHECK: %x = add nsw i32 %A, %B -; CHECK-NEXT: %1 = insertvalue %ov.result.32 { i32 undef, i1 false }, i32 %x, 0 -; CHECK-NEXT: ret %ov.result.32 %1 -} - -define %ov.result.32 @uaddtest_nuw(i32 %a, i32 %b) { - %A = and i32 %a, 2147483647 - %B = and i32 %b, 2147483647 - %x = call %ov.result.32 @llvm.uadd.with.overflow.i32(i32 %A, i32 %B) - ret %ov.result.32 %x -; CHECK-LABEL: @uaddtest_nuw -; CHECK: %x = add nuw i32 %A, %B -; CHECK-NEXT: %1 = insertvalue %ov.result.32 { i32 undef, i1 false }, i32 %x, 0 -; CHECK-NEXT: ret %ov.result.32 %1 -} - -define %ov.result.32 @ssubtest_nsw(i8 %a, i8 %b) { - %A = sext i8 %a to i32 - %B = sext i8 %b to i32 - %x = call %ov.result.32 @llvm.ssub.with.overflow.i32(i32 %A, i32 %B) - ret %ov.result.32 %x -; CHECK-LABEL: @ssubtest_nsw -; CHECK: %x = sub nsw i32 %A, %B -; CHECK-NEXT: %1 = insertvalue %ov.result.32 { i32 undef, i1 false }, i32 %x, 0 -; CHECK-NEXT: ret %ov.result.32 %1 -} - -define %ov.result.32 @usubtest_nuw(i32 %a, i32 %b) { - %A = or i32 %a, 2147483648 - %B = and i32 %b, 2147483647 - %x = call %ov.result.32 @llvm.usub.with.overflow.i32(i32 %A, i32 %B) - ret %ov.result.32 %x -; CHECK-LABEL: @usubtest_nuw -; CHECK: %x = sub nuw i32 %A, %B -; CHECK-NEXT: %1 = insertvalue %ov.result.32 { i32 undef, i1 false }, i32 %x, 0 -; CHECK-NEXT: ret %ov.result.32 %1 -} - -define %ov.result.32 @smultest1_nsw(i32 %a, i32 %b) { - %A = and i32 %a, 4095 ; 0xfff - %B = and i32 %b, 524287; 0x7ffff - %x = call %ov.result.32 @llvm.smul.with.overflow.i32(i32 %A, i32 %B) - ret %ov.result.32 %x -; CHECK-LABEL: @smultest1_nsw -; CHECK: %x = mul nuw nsw i32 %A, %B -; CHECK-NEXT: %1 = insertvalue %ov.result.32 { i32 undef, i1 false }, i32 %x, 0 -; CHECK-NEXT: ret %ov.result.32 %1 -} - -define %ov.result.32 @smultest2_nsw(i32 %a, i32 %b) { - %A = ashr i32 %a, 16 - %B = ashr i32 %b, 16 - %x = call %ov.result.32 @llvm.smul.with.overflow.i32(i32 %A, i32 %B) - ret %ov.result.32 %x -; CHECK-LABEL: @smultest2_nsw -; CHECK: %x = mul nsw i32 %A, %B -; CHECK-NEXT: %1 = insertvalue %ov.result.32 { i32 undef, i1 false }, i32 %x, 0 -; CHECK-NEXT: ret %ov.result.32 %1 -} - -define %ov.result.32 @smultest3_sw(i32 %a, i32 %b) { - %A = ashr i32 %a, 16 - %B = ashr i32 %b, 15 - %x = call %ov.result.32 @llvm.smul.with.overflow.i32(i32 %A, i32 %B) - ret %ov.result.32 %x -; CHECK-LABEL: @smultest3_sw -; CHECK: %x = call %ov.result.32 @llvm.smul.with.overflow.i32(i32 %A, i32 %B) -; CHECK-NEXT: ret %ov.result.32 %x -} - -define %ov.result.32 @umultest_nuw(i32 %a, i32 %b) { - %A = and i32 %a, 65535 ; 0xffff - %B = and i32 %b, 65535 ; 0xffff - %x = call %ov.result.32 @llvm.umul.with.overflow.i32(i32 %A, i32 %B) - ret %ov.result.32 %x -; CHECK-LABEL: @umultest_nuw -; CHECK: %x = mul nuw i32 %A, %B -; CHECK-NEXT: %1 = insertvalue %ov.result.32 { i32 undef, i1 false }, i32 %x, 0 -; CHECK-NEXT: ret %ov.result.32 %1 -} - -define i8 @umultest1(i8 %A, i1* %overflowPtr) { - %x = call %overflow.result @llvm.umul.with.overflow.i8(i8 0, i8 %A) - %y = extractvalue %overflow.result %x, 0 - %z = extractvalue %overflow.result %x, 1 - store i1 %z, i1* %overflowPtr - ret i8 %y -; CHECK-LABEL: @umultest1( -; CHECK-NEXT: store i1 false, i1* %overflowPtr -; CHECK-NEXT: ret i8 0 -} - -define i8 @umultest2(i8 %A, i1* %overflowPtr) { - %x = call %overflow.result @llvm.umul.with.overflow.i8(i8 1, i8 %A) - %y = extractvalue %overflow.result %x, 0 - %z = extractvalue %overflow.result %x, 1 - store i1 %z, i1* %overflowPtr - ret i8 %y -; CHECK-LABEL: @umultest2( -; CHECK-NEXT: store i1 false, i1* %overflowPtr -; CHECK-NEXT: ret i8 %A -} - -define i32 @umultest3(i32 %n) nounwind { - %shr = lshr i32 %n, 2 - %mul = call %ov.result.32 @llvm.umul.with.overflow.i32(i32 %shr, i32 3) - %ov = extractvalue %ov.result.32 %mul, 1 - %res = extractvalue %ov.result.32 %mul, 0 - %ret = select i1 %ov, i32 -1, i32 %res - ret i32 %ret -; CHECK-LABEL: @umultest3( -; CHECK-NEXT: shr -; CHECK-NEXT: mul nuw -; CHECK-NEXT: ret -} - -define i32 @umultest4(i32 %n) nounwind { - %shr = lshr i32 %n, 1 - %mul = call %ov.result.32 @llvm.umul.with.overflow.i32(i32 %shr, i32 4) - %ov = extractvalue %ov.result.32 %mul, 1 - %res = extractvalue %ov.result.32 %mul, 0 - %ret = select i1 %ov, i32 -1, i32 %res - ret i32 %ret -; CHECK-LABEL: @umultest4( -; CHECK: umul.with.overflow -} - -define %ov.result.32 @umultest5(i32 %x, i32 %y) nounwind { - %or_x = or i32 %x, 2147483648 - %or_y = or i32 %y, 2147483648 - %mul = call %ov.result.32 @llvm.umul.with.overflow.i32(i32 %or_x, i32 %or_y) - ret %ov.result.32 %mul -; CHECK-LABEL: @umultest5( -; CHECK-NEXT: %[[or_x:.*]] = or i32 %x, -2147483648 -; CHECK-NEXT: %[[or_y:.*]] = or i32 %y, -2147483648 -; CHECK-NEXT: %[[mul:.*]] = mul i32 %[[or_x]], %[[or_y]] -; CHECK-NEXT: %[[ret:.*]] = insertvalue %ov.result.32 { i32 undef, i1 true }, i32 %[[mul]], 0 -; CHECK-NEXT: ret %ov.result.32 %[[ret]] -} - define void @powi(double %V, double *%P) { %A = tail call double @llvm.powi.f64(double %V, i32 -1) nounwind store volatile double %A, double* %P @@ -574,71 +336,6 @@ define <2 x i32> @cttz_select_vec(<2 x i32> %Value) nounwind { ret <2 x i32> %s } -define i1 @overflow_div_add(i32 %v1, i32 %v2) nounwind { -; CHECK-LABEL: @overflow_div_add( -; CHECK-NEXT: ret i1 false -; - %div = sdiv i32 %v1, 2 - %t = call %ov.result.32 @llvm.sadd.with.overflow.i32(i32 %div, i32 1) - %obit = extractvalue %ov.result.32 %t, 1 - ret i1 %obit -} - -define i1 @overflow_div_sub(i32 %v1, i32 %v2) nounwind { - ; Check cases where the known sign bits are larger than the word size. -; CHECK-LABEL: @overflow_div_sub( -; CHECK-NEXT: ret i1 false -; - %a = ashr i32 %v1, 18 - %div = sdiv i32 %a, 65536 - %t = call %ov.result.32 @llvm.ssub.with.overflow.i32(i32 %div, i32 1) - %obit = extractvalue %ov.result.32 %t, 1 - ret i1 %obit -} - -define i1 @overflow_mod_mul(i32 %v1, i32 %v2) nounwind { -; CHECK-LABEL: @overflow_mod_mul( -; CHECK-NEXT: ret i1 false -; - %rem = srem i32 %v1, 1000 - %t = call %ov.result.32 @llvm.smul.with.overflow.i32(i32 %rem, i32 %rem) - %obit = extractvalue %ov.result.32 %t, 1 - ret i1 %obit -} - -define i1 @overflow_mod_overflow_mul(i32 %v1, i32 %v2) nounwind { -; CHECK-LABEL: @overflow_mod_overflow_mul( -; CHECK-NEXT: [[REM:%.*]] = srem i32 %v1, 65537 -; CHECK-NEXT: [[T:%.*]] = call %ov.result.32 @llvm.smul.with.overflow.i32(i32 [[REM]], i32 [[REM]]) -; CHECK-NEXT: [[OBIT:%.*]] = extractvalue %ov.result.32 [[T]], 1 -; CHECK-NEXT: ret i1 [[OBIT]] -; - %rem = srem i32 %v1, 65537 - ; This may overflow because the result of the mul operands may be greater than 16bits - ; and the result greater than 32. - %t = call %ov.result.32 @llvm.smul.with.overflow.i32(i32 %rem, i32 %rem) - %obit = extractvalue %ov.result.32 %t, 1 - ret i1 %obit -} - -define %ov.result.32 @ssubtest_reorder(i8 %a) { - %A = sext i8 %a to i32 - %x = call %ov.result.32 @llvm.ssub.with.overflow.i32(i32 0, i32 %A) - ret %ov.result.32 %x -; CHECK-LABEL: @ssubtest_reorder -; CHECK: %x = sub nsw i32 0, %A -; CHECK-NEXT: %1 = insertvalue %ov.result.32 { i32 undef, i1 false }, i32 %x, 0 -; CHECK-NEXT: ret %ov.result.32 %1 -} - -define %ov.result.32 @never_overflows_ssub_test0(i32 %a) { - %x = call %ov.result.32 @llvm.ssub.with.overflow.i32(i32 %a, i32 0) - ret %ov.result.32 %x -; CHECK-LABEL: @never_overflows_ssub_test0 -; CHECK-NEXT: %[[x:.*]] = insertvalue %ov.result.32 { i32 undef, i1 false }, i32 %a, 0 -; CHECK-NEXT: ret %ov.result.32 %[[x]] -} - define void @cos(double *%P) { ; CHECK-LABEL: @cos( ; CHECK-NEXT: store volatile double 1.000000e+00, double* %P, align 8 diff --git a/llvm/test/Transforms/InstCombine/with_overflow.ll b/llvm/test/Transforms/InstCombine/with_overflow.ll new file mode 100644 index 00000000000..13339c392e7 --- /dev/null +++ b/llvm/test/Transforms/InstCombine/with_overflow.ll @@ -0,0 +1,347 @@ +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py +; RUN: opt -instcombine -S < %s | FileCheck %s + +declare { i8, i1 } @llvm.uadd.with.overflow.i8(i8, i8) nounwind readnone +declare { i8, i1 } @llvm.umul.with.overflow.i8(i8, i8) nounwind readnone +declare { i32, i1 } @llvm.sadd.with.overflow.i32(i32, i32) nounwind readnone +declare { i32, i1 } @llvm.uadd.with.overflow.i32(i32, i32) nounwind readnone +declare { i32, i1 } @llvm.ssub.with.overflow.i32(i32, i32) nounwind readnone +declare { i32, i1 } @llvm.usub.with.overflow.i32(i32, i32) nounwind readnone +declare { i32, i1 } @llvm.smul.with.overflow.i32(i32, i32) nounwind readnone +declare { i32, i1 } @llvm.umul.with.overflow.i32(i32, i32) nounwind readnone + +define i8 @uaddtest1(i8 %A, i8 %B) { +; CHECK-LABEL: @uaddtest1( +; CHECK-NEXT: [[Y:%.*]] = add i8 [[A:%.*]], [[B:%.*]] +; CHECK-NEXT: ret i8 [[Y]] +; + %x = call { i8, i1 } @llvm.uadd.with.overflow.i8(i8 %A, i8 %B) + %y = extractvalue { i8, i1 } %x, 0 + ret i8 %y +} + +define i8 @uaddtest2(i8 %A, i8 %B, i1* %overflowPtr) { +; CHECK-LABEL: @uaddtest2( +; CHECK-NEXT: [[AND_A:%.*]] = and i8 [[A:%.*]], 127 +; CHECK-NEXT: [[AND_B:%.*]] = and i8 [[B:%.*]], 127 +; CHECK-NEXT: [[X:%.*]] = add nuw i8 [[AND_A]], [[AND_B]] +; CHECK-NEXT: store i1 false, i1* [[OVERFLOWPTR:%.*]], align 1 +; CHECK-NEXT: ret i8 [[X]] +; + %and.A = and i8 %A, 127 + %and.B = and i8 %B, 127 + %x = call { i8, i1 } @llvm.uadd.with.overflow.i8(i8 %and.A, i8 %and.B) + %y = extractvalue { i8, i1 } %x, 0 + %z = extractvalue { i8, i1 } %x, 1 + store i1 %z, i1* %overflowPtr + ret i8 %y +} + +define i8 @uaddtest3(i8 %A, i8 %B, i1* %overflowPtr) { +; CHECK-LABEL: @uaddtest3( +; CHECK-NEXT: [[OR_A:%.*]] = or i8 [[A:%.*]], -128 +; CHECK-NEXT: [[OR_B:%.*]] = or i8 [[B:%.*]], -128 +; CHECK-NEXT: [[X:%.*]] = add i8 [[OR_A]], [[OR_B]] +; CHECK-NEXT: store i1 true, i1* [[OVERFLOWPTR:%.*]], align 1 +; CHECK-NEXT: ret i8 [[X]] +; + %or.A = or i8 %A, -128 + %or.B = or i8 %B, -128 + %x = call { i8, i1 } @llvm.uadd.with.overflow.i8(i8 %or.A, i8 %or.B) + %y = extractvalue { i8, i1 } %x, 0 + %z = extractvalue { i8, i1 } %x, 1 + store i1 %z, i1* %overflowPtr + ret i8 %y +} + +define i8 @uaddtest4(i8 %A, i1* %overflowPtr) { +; CHECK-LABEL: @uaddtest4( +; CHECK-NEXT: ret i8 undef +; + %x = call { i8, i1 } @llvm.uadd.with.overflow.i8(i8 undef, i8 %A) + %y = extractvalue { i8, i1 } %x, 0 + %z = extractvalue { i8, i1 } %x, 1 + store i1 %z, i1* %overflowPtr + ret i8 %y +} + +define i8 @uaddtest5(i8 %A, i1* %overflowPtr) { +; CHECK-LABEL: @uaddtest5( +; CHECK-NEXT: store i1 false, i1* [[OVERFLOWPTR:%.*]], align 1 +; CHECK-NEXT: ret i8 [[A:%.*]] +; + %x = call { i8, i1 } @llvm.uadd.with.overflow.i8(i8 0, i8 %A) + %y = extractvalue { i8, i1 } %x, 0 + %z = extractvalue { i8, i1 } %x, 1 + store i1 %z, i1* %overflowPtr + ret i8 %y +} + +define i1 @uaddtest6(i8 %A, i8 %B) { +; CHECK-LABEL: @uaddtest6( +; CHECK-NEXT: [[Z:%.*]] = icmp ugt i8 [[A:%.*]], 3 +; CHECK-NEXT: ret i1 [[Z]] +; + %x = call { i8, i1 } @llvm.uadd.with.overflow.i8(i8 %A, i8 -4) + %z = extractvalue { i8, i1 } %x, 1 + ret i1 %z +} + +define i8 @uaddtest7(i8 %A, i8 %B) { +; CHECK-LABEL: @uaddtest7( +; CHECK-NEXT: [[Z:%.*]] = add i8 [[A:%.*]], [[B:%.*]] +; CHECK-NEXT: ret i8 [[Z]] +; + %x = call { i8, i1 } @llvm.uadd.with.overflow.i8(i8 %A, i8 %B) + %z = extractvalue { i8, i1 } %x, 0 + ret i8 %z +} + +; PR20194 +define { i32, i1 } @saddtest_nsw(i8 %a, i8 %b) { +; CHECK-LABEL: @saddtest_nsw( +; CHECK-NEXT: [[AA:%.*]] = sext i8 [[A:%.*]] to i32 +; CHECK-NEXT: [[BB:%.*]] = sext i8 [[B:%.*]] to i32 +; CHECK-NEXT: [[X:%.*]] = add nsw i32 [[AA]], [[BB]] +; CHECK-NEXT: [[TMP1:%.*]] = insertvalue { i32, i1 } { i32 undef, i1 false }, i32 [[X]], 0 +; CHECK-NEXT: ret { i32, i1 } [[TMP1]] +; + %aa = sext i8 %a to i32 + %bb = sext i8 %b to i32 + %x = call { i32, i1 } @llvm.sadd.with.overflow.i32(i32 %aa, i32 %bb) + ret { i32, i1 } %x +} + +define { i32, i1 } @uaddtest_nuw(i32 %a, i32 %b) { +; CHECK-LABEL: @uaddtest_nuw( +; CHECK-NEXT: [[AA:%.*]] = and i32 [[A:%.*]], 2147483647 +; CHECK-NEXT: [[BB:%.*]] = and i32 [[B:%.*]], 2147483647 +; CHECK-NEXT: [[X:%.*]] = add nuw i32 [[AA]], [[BB]] +; CHECK-NEXT: [[TMP1:%.*]] = insertvalue { i32, i1 } { i32 undef, i1 false }, i32 [[X]], 0 +; CHECK-NEXT: ret { i32, i1 } [[TMP1]] +; + %aa = and i32 %a, 2147483647 + %bb = and i32 %b, 2147483647 + %x = call { i32, i1 } @llvm.uadd.with.overflow.i32(i32 %aa, i32 %bb) + ret { i32, i1 } %x +} + +define { i32, i1 } @ssubtest_nsw(i8 %a, i8 %b) { +; CHECK-LABEL: @ssubtest_nsw( +; CHECK-NEXT: [[AA:%.*]] = sext i8 [[A:%.*]] to i32 +; CHECK-NEXT: [[BB:%.*]] = sext i8 [[B:%.*]] to i32 +; CHECK-NEXT: [[X:%.*]] = sub nsw i32 [[AA]], [[BB]] +; CHECK-NEXT: [[TMP1:%.*]] = insertvalue { i32, i1 } { i32 undef, i1 false }, i32 [[X]], 0 +; CHECK-NEXT: ret { i32, i1 } [[TMP1]] +; + %aa = sext i8 %a to i32 + %bb = sext i8 %b to i32 + %x = call { i32, i1 } @llvm.ssub.with.overflow.i32(i32 %aa, i32 %bb) + ret { i32, i1 } %x +} + +define { i32, i1 } @usubtest_nuw(i32 %a, i32 %b) { +; CHECK-LABEL: @usubtest_nuw( +; CHECK-NEXT: [[AA:%.*]] = or i32 [[A:%.*]], -2147483648 +; CHECK-NEXT: [[BB:%.*]] = and i32 [[B:%.*]], 2147483647 +; CHECK-NEXT: [[X:%.*]] = sub nuw i32 [[AA]], [[BB]] +; CHECK-NEXT: [[TMP1:%.*]] = insertvalue { i32, i1 } { i32 undef, i1 false }, i32 [[X]], 0 +; CHECK-NEXT: ret { i32, i1 } [[TMP1]] +; + %aa = or i32 %a, 2147483648 + %bb = and i32 %b, 2147483647 + %x = call { i32, i1 } @llvm.usub.with.overflow.i32(i32 %aa, i32 %bb) + ret { i32, i1 } %x +} + +define { i32, i1 } @smultest1_nsw(i32 %a, i32 %b) { +; CHECK-LABEL: @smultest1_nsw( +; CHECK-NEXT: [[AA:%.*]] = and i32 [[A:%.*]], 4095 +; CHECK-NEXT: [[BB:%.*]] = and i32 [[B:%.*]], 524287 +; CHECK-NEXT: [[X:%.*]] = mul nuw nsw i32 [[AA]], [[BB]] +; CHECK-NEXT: [[TMP1:%.*]] = insertvalue { i32, i1 } { i32 undef, i1 false }, i32 [[X]], 0 +; CHECK-NEXT: ret { i32, i1 } [[TMP1]] +; + %aa = and i32 %a, 4095 ; 0xfff + %bb = and i32 %b, 524287; 0x7ffff + %x = call { i32, i1 } @llvm.smul.with.overflow.i32(i32 %aa, i32 %bb) + ret { i32, i1 } %x +} + +define { i32, i1 } @smultest2_nsw(i32 %a, i32 %b) { +; CHECK-LABEL: @smultest2_nsw( +; CHECK-NEXT: [[AA:%.*]] = ashr i32 [[A:%.*]], 16 +; CHECK-NEXT: [[BB:%.*]] = ashr i32 [[B:%.*]], 16 +; CHECK-NEXT: [[X:%.*]] = mul nsw i32 [[AA]], [[BB]] +; CHECK-NEXT: [[TMP1:%.*]] = insertvalue { i32, i1 } { i32 undef, i1 false }, i32 [[X]], 0 +; CHECK-NEXT: ret { i32, i1 } [[TMP1]] +; + %aa = ashr i32 %a, 16 + %bb = ashr i32 %b, 16 + %x = call { i32, i1 } @llvm.smul.with.overflow.i32(i32 %aa, i32 %bb) + ret { i32, i1 } %x +} + +define { i32, i1 } @smultest3_sw(i32 %a, i32 %b) { +; CHECK-LABEL: @smultest3_sw( +; CHECK-NEXT: [[AA:%.*]] = ashr i32 [[A:%.*]], 16 +; CHECK-NEXT: [[BB:%.*]] = ashr i32 [[B:%.*]], 15 +; CHECK-NEXT: [[X:%.*]] = call { i32, i1 } @llvm.smul.with.overflow.i32(i32 [[AA]], i32 [[BB]]) +; CHECK-NEXT: ret { i32, i1 } [[X]] +; + %aa = ashr i32 %a, 16 + %bb = ashr i32 %b, 15 + %x = call { i32, i1 } @llvm.smul.with.overflow.i32(i32 %aa, i32 %bb) + ret { i32, i1 } %x +} + +define { i32, i1 } @umultest_nuw(i32 %a, i32 %b) { +; CHECK-LABEL: @umultest_nuw( +; CHECK-NEXT: [[AA:%.*]] = and i32 [[A:%.*]], 65535 +; CHECK-NEXT: [[BB:%.*]] = and i32 [[B:%.*]], 65535 +; CHECK-NEXT: [[X:%.*]] = mul nuw i32 [[AA]], [[BB]] +; CHECK-NEXT: [[TMP1:%.*]] = insertvalue { i32, i1 } { i32 undef, i1 false }, i32 [[X]], 0 +; CHECK-NEXT: ret { i32, i1 } [[TMP1]] +; + %aa = and i32 %a, 65535 ; 0xffff + %bb = and i32 %b, 65535 ; 0xffff + %x = call { i32, i1 } @llvm.umul.with.overflow.i32(i32 %aa, i32 %bb) + ret { i32, i1 } %x +} + +define i8 @umultest1(i8 %A, i1* %overflowPtr) { +; CHECK-LABEL: @umultest1( +; CHECK-NEXT: store i1 false, i1* [[OVERFLOWPTR:%.*]], align 1 +; CHECK-NEXT: ret i8 0 +; + %x = call { i8, i1 } @llvm.umul.with.overflow.i8(i8 0, i8 %A) + %y = extractvalue { i8, i1 } %x, 0 + %z = extractvalue { i8, i1 } %x, 1 + store i1 %z, i1* %overflowPtr + ret i8 %y +} + +define i8 @umultest2(i8 %A, i1* %overflowPtr) { +; CHECK-LABEL: @umultest2( +; CHECK-NEXT: store i1 false, i1* [[OVERFLOWPTR:%.*]], align 1 +; CHECK-NEXT: ret i8 [[A:%.*]] +; + %x = call { i8, i1 } @llvm.umul.with.overflow.i8(i8 1, i8 %A) + %y = extractvalue { i8, i1 } %x, 0 + %z = extractvalue { i8, i1 } %x, 1 + store i1 %z, i1* %overflowPtr + ret i8 %y +} + +define i32 @umultest3(i32 %n) nounwind { +; CHECK-LABEL: @umultest3( +; CHECK-NEXT: [[SHR:%.*]] = lshr i32 [[N:%.*]], 2 +; CHECK-NEXT: [[MUL:%.*]] = mul nuw i32 [[SHR]], 3 +; CHECK-NEXT: ret i32 [[MUL]] +; + %shr = lshr i32 %n, 2 + %mul = call { i32, i1 } @llvm.umul.with.overflow.i32(i32 %shr, i32 3) + %ov = extractvalue { i32, i1 } %mul, 1 + %res = extractvalue { i32, i1 } %mul, 0 + %ret = select i1 %ov, i32 -1, i32 %res + ret i32 %ret +} + +define i32 @umultest4(i32 %n) nounwind { +; CHECK-LABEL: @umultest4( +; CHECK-NEXT: [[SHR:%.*]] = lshr i32 [[N:%.*]], 1 +; CHECK-NEXT: [[MUL:%.*]] = call { i32, i1 } @llvm.umul.with.overflow.i32(i32 [[SHR]], i32 4) +; CHECK-NEXT: [[OV:%.*]] = extractvalue { i32, i1 } [[MUL]], 1 +; CHECK-NEXT: [[RES:%.*]] = extractvalue { i32, i1 } [[MUL]], 0 +; CHECK-NEXT: [[RET:%.*]] = select i1 [[OV]], i32 -1, i32 [[RES]] +; CHECK-NEXT: ret i32 [[RET]] +; + %shr = lshr i32 %n, 1 + %mul = call { i32, i1 } @llvm.umul.with.overflow.i32(i32 %shr, i32 4) + %ov = extractvalue { i32, i1 } %mul, 1 + %res = extractvalue { i32, i1 } %mul, 0 + %ret = select i1 %ov, i32 -1, i32 %res + ret i32 %ret +} + +define { i32, i1 } @umultest5(i32 %x, i32 %y) nounwind { +; CHECK-LABEL: @umultest5( +; CHECK-NEXT: [[OR_X:%.*]] = or i32 [[X:%.*]], -2147483648 +; CHECK-NEXT: [[OR_Y:%.*]] = or i32 [[Y:%.*]], -2147483648 +; CHECK-NEXT: [[MUL:%.*]] = mul i32 [[OR_X]], [[OR_Y]] +; CHECK-NEXT: [[TMP1:%.*]] = insertvalue { i32, i1 } { i32 undef, i1 true }, i32 [[MUL]], 0 +; CHECK-NEXT: ret { i32, i1 } [[TMP1]] +; + %or_x = or i32 %x, 2147483648 + %or_y = or i32 %y, 2147483648 + %mul = call { i32, i1 } @llvm.umul.with.overflow.i32(i32 %or_x, i32 %or_y) + ret { i32, i1 } %mul +} + +define i1 @overflow_div_add(i32 %v1, i32 %v2) nounwind { +; CHECK-LABEL: @overflow_div_add( +; CHECK-NEXT: ret i1 false +; + %div = sdiv i32 %v1, 2 + %t = call { i32, i1 } @llvm.sadd.with.overflow.i32(i32 %div, i32 1) + %obit = extractvalue { i32, i1 } %t, 1 + ret i1 %obit +} + +define i1 @overflow_div_sub(i32 %v1, i32 %v2) nounwind { + ; Check cases where the known sign bits are larger than the word size. +; CHECK-LABEL: @overflow_div_sub( +; CHECK-NEXT: ret i1 false +; + %a = ashr i32 %v1, 18 + %div = sdiv i32 %a, 65536 + %t = call { i32, i1 } @llvm.ssub.with.overflow.i32(i32 %div, i32 1) + %obit = extractvalue { i32, i1 } %t, 1 + ret i1 %obit +} + +define i1 @overflow_mod_mul(i32 %v1, i32 %v2) nounwind { +; CHECK-LABEL: @overflow_mod_mul( +; CHECK-NEXT: ret i1 false +; + %rem = srem i32 %v1, 1000 + %t = call { i32, i1 } @llvm.smul.with.overflow.i32(i32 %rem, i32 %rem) + %obit = extractvalue { i32, i1 } %t, 1 + ret i1 %obit +} + +define i1 @overflow_mod_overflow_mul(i32 %v1, i32 %v2) nounwind { +; CHECK-LABEL: @overflow_mod_overflow_mul( +; CHECK-NEXT: [[REM:%.*]] = srem i32 [[V1:%.*]], 65537 +; CHECK-NEXT: [[T:%.*]] = call { i32, i1 } @llvm.smul.with.overflow.i32(i32 [[REM]], i32 [[REM]]) +; CHECK-NEXT: [[OBIT:%.*]] = extractvalue { i32, i1 } [[T]], 1 +; CHECK-NEXT: ret i1 [[OBIT]] +; + %rem = srem i32 %v1, 65537 + ; This may overflow because the result of the mul operands may be greater than 16bits + ; and the result greater than 32. + %t = call { i32, i1 } @llvm.smul.with.overflow.i32(i32 %rem, i32 %rem) + %obit = extractvalue { i32, i1 } %t, 1 + ret i1 %obit +} + +define { i32, i1 } @ssubtest_reorder(i8 %a) { +; CHECK-LABEL: @ssubtest_reorder( +; CHECK-NEXT: [[AA:%.*]] = sext i8 [[A:%.*]] to i32 +; CHECK-NEXT: [[X:%.*]] = sub nsw i32 0, [[AA]] +; CHECK-NEXT: [[TMP1:%.*]] = insertvalue { i32, i1 } { i32 undef, i1 false }, i32 [[X]], 0 +; CHECK-NEXT: ret { i32, i1 } [[TMP1]] +; + %aa = sext i8 %a to i32 + %x = call { i32, i1 } @llvm.ssub.with.overflow.i32(i32 0, i32 %aa) + ret { i32, i1 } %x +} + +define { i32, i1 } @never_overflows_ssub_test0(i32 %a) { +; CHECK-LABEL: @never_overflows_ssub_test0( +; CHECK-NEXT: [[X:%.*]] = insertvalue { i32, i1 } { i32 undef, i1 false }, i32 [[A:%.*]], 0 +; CHECK-NEXT: ret { i32, i1 } [[X]] +; + %x = call { i32, i1 } @llvm.ssub.with.overflow.i32(i32 %a, i32 0) + ret { i32, i1 } %x +} |