[IndVarSimplify] Ensure fp values can be represented as consecutive integers #166649

antoniofrighetto · 2025-11-05T21:56:18Z

When transforming floating-point induction variables into integer ones, make sure we stay within the bounds of fp values that can be represented as integers without gaps, i.e., 2^24 and 2^53 for IEEE-754 single and double precision respectively (both on negative and positive side).

Fixes: #166496.

llvmbot · 2025-11-05T21:56:54Z

@llvm/pr-subscribers-llvm-transforms

Author: Antonio Frighetto (antoniofrighetto)

Changes

When transforming floating-point induction variables into integer ones, make sure we stay within the bounds of fp values that can be represented as integers without gaps, i.e., 2^24 and 2^53 for IEEE-754 single and double precision respectively (both on negative and positive side).

Fixes: #166496.

Full diff: https://github.com/llvm/llvm-project/pull/166649.diff

2 Files Affected:

(modified) llvm/lib/Transforms/Scalar/IndVarSimplify.cpp (+27)
(modified) llvm/test/Transforms/IndVarSimplify/floating-point-iv.ll (+83)

diff --git a/llvm/lib/Transforms/Scalar/IndVarSimplify.cpp b/llvm/lib/Transforms/Scalar/IndVarSimplify.cpp
index 4ba4ba3850e58..0df8670942212 100644
--- a/llvm/lib/Transforms/Scalar/IndVarSimplify.cpp
+++ b/llvm/lib/Transforms/Scalar/IndVarSimplify.cpp
@@ -228,6 +228,21 @@ bool IndVarSimplify::handleFloatingPointIV(Loop *L, PHINode *PN) {
       !ConvertToSInt(IncValueVal->getValueAPF(), IncValue))
     return false;
 
+  // Ensure we stay within the bounds of fp values that can be represented
+  // as integers without gaps, i.e., 2^24 and 2^53 for IEEE-754 single and
+  // double precision respectively (both on negative and positive side).
+  const auto &SVFltSema = InitValueVal->getValueAPF().getSemantics();
+  if (!APFloat::isIEEELikeFP(SVFltSema))
+    return false;
+
+  uint64_t StartValPrecision = APFloat::semanticsPrecision(SVFltSema);
+  if (StartValPrecision >= 64)
+    return false;
+
+  uint64_t StartValIntegerLimit = 1LL << StartValPrecision;
+  if (uint64_t(std::abs(InitValue)) > StartValIntegerLimit)
+    return false;
+
   // Check Incr uses. One user is PN and the other user is an exit condition
   // used by the conditional terminator.
   Value::user_iterator IncrUse = Incr->user_begin();
@@ -265,6 +280,18 @@ bool IndVarSimplify::handleFloatingPointIV(Loop *L, PHINode *PN) {
       !ConvertToSInt(ExitValueVal->getValueAPF(), ExitValue))
     return false;
 
+  const auto &EVFltSema = ExitValueVal->getValueAPF().getSemantics();
+  if (!APFloat::isIEEELikeFP(EVFltSema))
+    return false;
+
+  uint64_t ExitValPrecision = APFloat::semanticsPrecision(EVFltSema);
+  if (ExitValPrecision >= 64)
+    return false;
+
+  uint64_t ExitValIntegerLimit = 1LL << ExitValPrecision;
+  if (uint64_t(std::abs(ExitValue)) > ExitValIntegerLimit)
+    return false;
+
   // Find new predicate for integer comparison.
   CmpInst::Predicate NewPred = CmpInst::BAD_ICMP_PREDICATE;
   switch (Compare->getPredicate()) {
diff --git a/llvm/test/Transforms/IndVarSimplify/floating-point-iv.ll b/llvm/test/Transforms/IndVarSimplify/floating-point-iv.ll
index b1ef50382c070..e3e6f5e1d2a6f 100644
--- a/llvm/test/Transforms/IndVarSimplify/floating-point-iv.ll
+++ b/llvm/test/Transforms/IndVarSimplify/floating-point-iv.ll
@@ -417,3 +417,86 @@ loop:
 exit:
   ret void
 }
+
+define void @test_fp_to_int_irrealizable_initval() {
+; CHECK-LABEL: @test_fp_to_int_irrealizable_initval(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    br label [[LOOP:%.*]]
+; CHECK:       loop:
+; CHECK-NEXT:    [[IV:%.*]] = phi float [ 1.000000e+08, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
+; CHECK-NEXT:    call void @opaque()
+; CHECK-NEXT:    [[IV_NEXT]] = fadd float [[IV]], -1.700000e+01
+; CHECK-NEXT:    [[CMP:%.*]] = fcmp ult float [[IV_NEXT]], 2.500000e+01
+; CHECK-NEXT:    br i1 [[CMP]], label [[EXIT:%.*]], label [[LOOP]]
+; CHECK:       exit:
+; CHECK-NEXT:    ret void
+;
+entry:
+  br label %loop
+
+loop:
+  %iv = phi float [ 1.000000e+08, %entry ], [ %iv.next, %loop ]
+  call void @opaque()
+  %iv.next = fadd float %iv, -1.700000e+01
+  %cmp = fcmp ult float %iv.next, 2.500000e+01
+  br i1 %cmp, label %exit, label %loop
+
+exit:
+  ret void
+}
+
+define void @test_fp_to_int_irrealizable_exitval() {
+; CHECK-LABEL: @test_fp_to_int_irrealizable_exitval(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    br label [[LOOP:%.*]]
+; CHECK:       loop:
+; CHECK-NEXT:    [[IV:%.*]] = phi float [ 2.500000e+01, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
+; CHECK-NEXT:    call void @opaque()
+; CHECK-NEXT:    [[IV_NEXT]] = fadd float [[IV]], 1.700000e+01
+; CHECK-NEXT:    [[CMP:%.*]] = fcmp ugt float [[IV_NEXT]], 1.000000e+08
+; CHECK-NEXT:    br i1 [[CMP]], label [[EXIT:%.*]], label [[LOOP]]
+; CHECK:       exit:
+; CHECK-NEXT:    ret void
+;
+entry:
+  br label %loop
+
+loop:
+  %iv = phi float [ 2.500000e+01, %entry ], [ %iv.next, %loop ]
+  call void @opaque()
+  %iv.next = fadd float %iv, 1.700000e+01
+  %cmp = fcmp ugt float %iv.next, 1.000000e+08
+  br i1 %cmp, label %exit, label %loop
+
+exit:
+  ret void
+}
+
+define void @test_fp_to_int_irrealizable_negative_exitval() {
+; CHECK-LABEL: @test_fp_to_int_irrealizable_negative_exitval(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    br label [[LOOP:%.*]]
+; CHECK:       loop:
+; CHECK-NEXT:    [[IV:%.*]] = phi float [ -2.500000e+01, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
+; CHECK-NEXT:    call void @opaque()
+; CHECK-NEXT:    [[IV_NEXT]] = fadd float [[IV]], -1.700000e+01
+; CHECK-NEXT:    [[CMP:%.*]] = fcmp ult float [[IV_NEXT]], -1.000000e+08
+; CHECK-NEXT:    br i1 [[CMP]], label [[EXIT:%.*]], label [[LOOP]]
+; CHECK:       exit:
+; CHECK-NEXT:    ret void
+;
+entry:
+  br label %loop
+
+loop:
+  %iv = phi float [ -2.500000e+01, %entry ], [ %iv.next, %loop ]
+  call void @opaque()
+  %iv.next = fadd float %iv, -1.700000e+01
+  %cmp = fcmp ult float %iv.next, -1.000000e+08
+  br i1 %cmp, label %exit, label %loop
+
+exit:
+  ret void
+}
+
+declare void @opaque()

pinskia · 2025-11-06T00:57:56Z

llvm/lib/Transforms/Scalar/IndVarSimplify.cpp

+    return false;
+
+  uint64_t ExitValIntegerLimit = 1LL << ExitValPrecision;
+  if (uint64_t(std::abs(ExitValue)) > ExitValIntegerLimit)


Can ExitValue be INT64_MIN? If so, there would be undefined behavior here. I don't think it can be, but it definitely deserves a comment.

No, INT64_MIN is properly filtered out.

IEEE-754 stores the fractional component as its absolute value with a separate sign bit. It is made signed by typical two's-complement negation. In addition to the fraction, there is an implicit 1 (for normal values) or 0 (for subnormal values) to the left of the binary point. The number of bits in the fraction plus the implicit digit is the precision field, which is 53 for f64 or 24 for f32.

To get ExitValue == INT64_MIN from ConvertToSInt, it must be normal (implicit 1) with 63 zeros in the fraction. Such a float would have a semantics with precision of 64, which is filtered out by ExitValPrecision >= 64. ExitValPrecision > 64 implies !ConvertToSInt, so that's redundant, but okay to keep.

And the reason that uint64_t(std::abs(ExitValue)) > (1LL << ExitValPrecision) is appropriate, as opposed to an asymmetric range where there's one more negative value allowed, is because the sign bit means there's exactly as many negative floats as positive.

However, I believe the test should be uint64_t(std::abs(ExitValue)) >= (1LL << ExitValPrecision), as equality would allow for two values (positive and negative) with precision ExitValPrecision+1.

The only float semantics with precision==64 is semX87DoubleExtended, but it's !isIEEELikeFP, so it doesn't matter that any floats which take exactly 64 bits to represent are forbidden.

Looks good, besides the >=.

It turns out that ConvertToSInt() would indeed convert the IEEE-754 double-precision representation of INT64_MIN (i.e., 0xC3E0000000000000) into the integer INT64_MIN, which makes the std::abs call UB. Switched to llvm::AbsoluteValue, which should be well-defined for all inputs, and added a test.

However, I believe the test should be uint64_t(std::abs(ExitValue)) >= (1LL << ExitValPrecision), as equality would allow for two values (positive and negative) with precision ExitValPrecision+1.

The endpoints (-2^24 and 2^24 for single precision) are the largest-magnitude values up to which a floating-point type can represent integers without gaps, so allowing them to be converted to integers should be fine. That said, this case is currently blocked later on by the !isInt<32>(InitValue) check.

thaliaarchi

Looks good to me, aside from >/>=.

When John reported the miscompilation, I drafted an approach which computes a closed form solution for the trip count with finite floats, taking into account precision loss. But it's more complex than this and should not block this PR. I may still contribute it later.

thaliaarchi · 2025-11-06T04:50:29Z

llvm/lib/Transforms/Scalar/IndVarSimplify.cpp

+    return false;
+
+  uint64_t ExitValIntegerLimit = 1LL << ExitValPrecision;
+  if (uint64_t(std::abs(ExitValue)) > ExitValIntegerLimit)


No, INT64_MIN is properly filtered out.

IEEE-754 stores the fractional component as its absolute value with a separate sign bit. It is made signed by typical two's-complement negation. In addition to the fraction, there is an implicit 1 (for normal values) or 0 (for subnormal values) to the left of the binary point. The number of bits in the fraction plus the implicit digit is the precision field, which is 53 for f64 or 24 for f32.

To get ExitValue == INT64_MIN from ConvertToSInt, it must be normal (implicit 1) with 63 zeros in the fraction. Such a float would have a semantics with precision of 64, which is filtered out by ExitValPrecision >= 64. ExitValPrecision > 64 implies !ConvertToSInt, so that's redundant, but okay to keep.

And the reason that uint64_t(std::abs(ExitValue)) > (1LL << ExitValPrecision) is appropriate, as opposed to an asymmetric range where there's one more negative value allowed, is because the sign bit means there's exactly as many negative floats as positive.

However, I believe the test should be uint64_t(std::abs(ExitValue)) >= (1LL << ExitValPrecision), as equality would allow for two values (positive and negative) with precision ExitValPrecision+1.

The only float semantics with precision==64 is semX87DoubleExtended, but it's !isIEEELikeFP, so it doesn't matter that any floats which take exactly 64 bits to represent are forbidden.

Looks good, besides the >=.

pinskia · 2025-11-06T05:23:54Z

The only float semantics with precision==64 is semX87DoubleExtended, but it's !isIEEELikeFP, so it doesn't matter that any floats which take exactly 64 bits to represent are forbidden.

Wait, semX87DoubleExtended is !isIEEELikeFP? That seems wrong to me, but what do I know about the LLVM internals. I just looked and, yes, LLVM says semX87DoubleExtended is not isIEEELikeFP. I wonder how much fallout there would be if that were corrected :).

dtcxzyw

This constraint is still not enough.
Consider the following case:

#include <cstdio>
#include <cstdlib>
// Reproducer: counts the iterations of a loop driven by a float induction
// variable whose upper bound is 2^24, and prints the count if the loop ends.
int main() {
  // Upper bound: the unsigned value 2^24 converted to float.
  float end = 1U << 24;
  float beg = 0.0;
  unsigned count = 0;
  // In single precision 2^24 + 1.0f rounds back to 2^24, so once i reaches
  // `end` the increment no longer changes it and `i <= end` stays true.
  for (float i = beg; i <= end; i++) {
    // Guard: terminate with a failing status once the counter exceeds 2^26,
    // i.e. when the loop has not stopped on its own.
    if (count > (1U << 26))  exit(1);
    ++count;
  }
  // Only reached if the loop condition became false.
  printf("%u\n", count);
  return 0;
}

Note that (float)(1U << 24) + 1.0f == (float)(1U << 24). So the program should call exit(1) instead of exiting the loop.
LLVM IR:

target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128"
target triple = "x86_64-pc-linux-gnu"

@.str = private unnamed_addr constant [4 x i8] c"%u\0A\00", align 1

; Reproducer: a loop carrying an i32 counter (%2) next to a float induction
; variable (%3) that starts at 0.0 and is advanced by 1.0 per iteration.
define dso_local noundef i32 @main() {
  br label %1

; Loop header. Leaves the loop for block %5 when the float IV compares
; unordered-or-greater-than 0x4170000000000000 (2^24 = 16777216.0).
1:                                                ; preds = %10, %0
  %2 = phi i32 [ 0, %0 ], [ %11, %10 ]
  %3 = phi float [ 0.000000e+00, %0 ], [ %12, %10 ]
  %4 = fcmp ugt float %3, 0x4170000000000000
  br i1 %4, label %5, label %7

; Loop exit: print the integer counter and return 0.
5:                                                ; preds = %1
  %6 = call i32 (ptr, ...) @printf(ptr noundef nonnull dereferenceable(1) @.str, i32 noundef %2)
  ret i32 0

; Guard: branch to the exit() call once the counter exceeds 67108864 (2^26).
7:                                                ; preds = %1
  %8 = icmp samesign ugt i32 %2, 67108864
  br i1 %8, label %9, label %10

; Guard taken: call exit with status 13; control does not continue past it.
9:                                                ; preds = %7
  call void @exit(i32 noundef 13) #3
  unreachable

; Latch: increment the counter by 1 and the float IV by 1.0, then loop back.
10:                                               ; preds = %7
  %11 = add nuw nsw i32 %2, 1
  %12 = fadd float %3, 1.000000e+00
  br label %1, !llvm.loop !9
}

declare void @exit(i32 noundef) local_unnamed_addr
declare noundef i32 @printf(ptr noundef readonly captures(none), ...)

!9 = distinct !{!9, !10}
!10 = !{!"llvm.loop.mustprogress"}

After opt -O3 with your patch:

define dso_local noundef i32 @main() local_unnamed_addr #0 {
  %1 = tail call i32 (ptr, ...) @printf(ptr noundef nonnull dereferenceable(1) @.str, i32 noundef 16777217)
  ret i32 0
}

antoniofrighetto · 2025-11-10T10:41:52Z

This constraint is still not enough. Consider the following case:

Thanks, good catch. While the integers in $[0, 2^{24}]$ can indeed all be represented in single precision, $2^{24} + 1$ gets rounded to the nearest representable float, making the fp -> int transformation imprecise. Now bailing out when the value is >= the limit; also refactored the code.

dtcxzyw

LGTM. Thanks!

llvm/lib/Transforms/Scalar/IndVarSimplify.cpp

When transforming floating-point induction variables into integer ones, make sure we stay within the bounds of fp values that can be represented as integers without gaps, i.e., 2^24 and 2^53 for IEEE-754 single and double precision respectively (both on negative and positive side). Fixes: llvm#166496.

antoniofrighetto requested review from dtcxzyw, efriedma-quic, fhahn and nikic November 5, 2025 21:56

llvmbot added the llvm:transforms label Nov 5, 2025

pinskia reviewed Nov 6, 2025

View reviewed changes

thaliaarchi reviewed Nov 6, 2025

View reviewed changes

dtcxzyw reviewed Nov 7, 2025

View reviewed changes

antoniofrighetto force-pushed the feature/indvars-fps-to-representable-int branch from d43a6c7 to f60d26d Compare November 10, 2025 10:41

dtcxzyw approved these changes Nov 10, 2025

View reviewed changes

llvm/lib/Transforms/Scalar/IndVarSimplify.cpp Outdated Show resolved Hide resolved

antoniofrighetto added 2 commits November 11, 2025 10:30

[IndVarSimplify] Precommit tests for PR166649 (NFC)

9100001

antoniofrighetto force-pushed the feature/indvars-fps-to-representable-int branch from f60d26d to eaf3a91 Compare November 11, 2025 09:31

antoniofrighetto merged commit eaf3a91 into llvm:main Nov 11, 2025
5 of 9 checks passed

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

[IndVarSimplify] Ensure fp values can be represented as consecutive integers #166649

[IndVarSimplify] Ensure fp values can be represented as consecutive integers #166649

Uh oh!

antoniofrighetto commented Nov 5, 2025

Uh oh!

llvmbot commented Nov 5, 2025

Uh oh!

pinskia Nov 6, 2025

Uh oh!

thaliaarchi Nov 6, 2025 •

edited

Loading

Uh oh!

antoniofrighetto Nov 6, 2025 •

edited

Loading

Uh oh!

thaliaarchi left a comment •

edited

Loading

Uh oh!

thaliaarchi Nov 6, 2025 •

edited

Loading

Uh oh!

pinskia commented Nov 6, 2025

Uh oh!

dtcxzyw left a comment

Uh oh!

antoniofrighetto commented Nov 10, 2025

Uh oh!

dtcxzyw left a comment

Uh oh!

Uh oh!

Uh oh!

Reviewers

Assignees

Labels

Projects

Milestone

Development

Uh oh!

5 participants

[IndVarSimplify] Ensure fp values can be represented as consecutive integers #166649

[IndVarSimplify] Ensure fp values can be represented as consecutive integers #166649

Uh oh!

Conversation

antoniofrighetto commented Nov 5, 2025

Uh oh!

llvmbot commented Nov 5, 2025

Uh oh!

pinskia Nov 6, 2025

Choose a reason for hiding this comment

Uh oh!

thaliaarchi Nov 6, 2025 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Choose a reason for hiding this comment

Uh oh!

antoniofrighetto Nov 6, 2025 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Choose a reason for hiding this comment

Uh oh!

thaliaarchi left a comment • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Choose a reason for hiding this comment

Uh oh!

thaliaarchi Nov 6, 2025 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Choose a reason for hiding this comment

Uh oh!

pinskia commented Nov 6, 2025

Uh oh!

dtcxzyw left a comment

Choose a reason for hiding this comment

Uh oh!

antoniofrighetto commented Nov 10, 2025

Uh oh!

dtcxzyw left a comment

Choose a reason for hiding this comment

Uh oh!

Uh oh!

Uh oh!

Reviewers

Assignees

Labels

Projects

Milestone

Development

Uh oh!

5 participants

thaliaarchi Nov 6, 2025 •

edited

Loading

antoniofrighetto Nov 6, 2025 •

edited

Loading

thaliaarchi left a comment •

edited

Loading

thaliaarchi Nov 6, 2025 •

edited

Loading