llvm · bababuck · Aug 25, 2025 · Aug 25, 2025 · dtcxzyw · Oct 2, 2025
@@ -5416,6 +5416,45 @@ Instruction *InstCombinerImpl::foldICmpBinOp(ICmpInst &I,
   if (B && D && B == D && NoOp0WrapProblem && NoOp1WrapProblem)
     return new ICmpInst(Pred, A, C);
 
+  // icmp (A-B), (C-B) -> icmp A, C for comparisons of pointer subtractions,
+  // that is, if A, B and C are all pointers converted to integers.
+  //
+  // Tricky case because pointers are effectively unsigned integers, but the
+  // result of their subtraction is signed. Also, these subtractions ought to
+  // have NSW semantics, except we cannot give that to them because the results
+  // are considered signed, but if we optimize away the subtraction, the
+  // underlying pointers need to be treated as unsigned, thus special handling
+  // is required. In this scenario, we must ensure that the comparison is
+  // unsigned after removing the subtraction operations.
+  if (B && D && B == D && isa<PtrToIntOperator>(A) &&
+      isa<PtrToIntOperator>(B) && isa<PtrToIntOperator>(C)) {
+    CmpInst::Predicate UnsignedPred;
+    switch (Pred) {
+    default:
+      // Equality and unsigned predicates land here. An already-unsigned
+      // compare implies an explicit cast from ptr to unsigned, so we cannot
+      // optimize.
+      UnsignedPred = CmpInst::BAD_ICMP_PREDICATE;
+      break;
+    case ICmpInst::ICMP_SGT:
+      UnsignedPred = ICmpInst::ICMP_UGT;
+      break;
+    case ICmpInst::ICMP_SLT:
+      UnsignedPred = ICmpInst::ICMP_ULT;
+      break;
+    case ICmpInst::ICMP_SGE:
+      UnsignedPred = ICmpInst::ICMP_UGE;
+      break;
+    case ICmpInst::ICMP_SLE:
+      UnsignedPred = ICmpInst::ICMP_ULE;
+      break;
+    }
+    if (UnsignedPred != CmpInst::BAD_ICMP_PREDICATE) {
+      PtrToIntOperator *AOp = dyn_cast<PtrToIntOperator>(A);
+      PtrToIntOperator *COp = dyn_cast<PtrToIntOperator>(C);
+      return new ICmpInst(UnsignedPred, AOp->getOperand(0), COp->getOperand(0));
+    }
+  }
+
   // icmp (A-B), (A-D) -> icmp D, B for equalities or if there is no overflow.
   if (A && C && A == C && NoOp0WrapProblem && NoOp1WrapProblem)
     return new ICmpInst(Pred, D, B);

diff --git a/llvm/test/Transforms/InstCombine/icmp-ptrdiff.ll b/llvm/test/Transforms/InstCombine/icmp-ptrdiff.ll
@@ -0,0 +1,109 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt < %s -passes=instcombine -S | FileCheck %s
+
+define ptr @icmp_ptrdiff_gt(ptr %0, ptr %1, ptr %2) {
 // Otherwise, this is a pointer subtraction. 
 // Do the raw subtraction part. 
 llvm::Value *LHS 
   = Builder.CreatePtrToInt(op.LHS, CGF.PtrDiffTy, "sub.ptr.lhs.cast"); 
 llvm::Value *RHS 
   = Builder.CreatePtrToInt(op.RHS, CGF.PtrDiffTy, "sub.ptr.rhs.cast"); 
 Value *diffInChars = Builder.CreateSub(LHS, RHS, "sub.ptr.sub"); 
 // Okay, figure out the element size. 
 const BinaryOperator *expr = cast<BinaryOperator>(op.E); 
 QualType elementType = expr->getLHS()->getType()->getPointeeType(); 
 llvm::Value *divisor = nullptr; 
 // For a variable-length array, this is going to be non-constant. 
 if (const VariableArrayType *vla 
       = CGF.getContext().getAsVariableArrayType(elementType)) { 
   auto VlaSize = CGF.getVLASize(vla); 
   elementType = VlaSize.Type; 
   divisor = VlaSize.NumElts; 
   // Scale the number of non-VLA elements by the non-VLA element size. 
   CharUnits eltSize = CGF.getContext().getTypeSizeInChars(elementType); 
   if (!eltSize.isOne()) 
     divisor = CGF.Builder.CreateNUWMul(CGF.CGM.getSize(eltSize), divisor); 
 // For everything else, we can just compute it, safe in the 
 // assumption that Sema won't let anything through that we can't 
 // safely compute the size of. 
 } else { 
   CharUnits elementSize; 
   // Handle GCC extension for pointer arithmetic on void* and 
   // function pointer types. 
   if (elementType->isVoidType() || elementType->isFunctionType()) 
     elementSize = CharUnits::One(); 
   else 
     elementSize = CGF.getContext().getTypeSizeInChars(elementType); 
   // Don't even emit the divide for element size of 1. 
   if (elementSize.isOne()) 
     return diffInChars; 
   divisor = CGF.CGM.getSize(elementSize); 
 } 
 // Otherwise, do a full sdiv. This uses the "exact" form of sdiv, since 
 // pointer difference in C is only defined in the case where both operands 
 // are pointing to elements of an array. 
 return Builder.CreateExactSDiv(diffInChars, divisor, "sub.ptr.div"); 
 // Otherwise, this is a pointer subtraction. 
  
 // Do the raw subtraction part. 
 llvm::Value *LHS 
   = Builder.CreatePtrToInt(op.LHS, CGF.PtrDiffTy, "sub.ptr.lhs.cast"); 
 llvm::Value *RHS 
   = Builder.CreatePtrToInt(op.RHS, CGF.PtrDiffTy, "sub.ptr.rhs.cast"); 
 Value *diffInChars = Builder.CreateSub(LHS, RHS, "sub.ptr.sub"); 
  
 // Okay, figure out the element size. 
 const BinaryOperator *expr = cast<BinaryOperator>(op.E); 
 QualType elementType = expr->getLHS()->getType()->getPointeeType(); 
  
 llvm::Value *divisor = nullptr; 
  
 // For a variable-length array, this is going to be non-constant. 
 if (const VariableArrayType *vla 
       = CGF.getContext().getAsVariableArrayType(elementType)) { 
   auto VlaSize = CGF.getVLASize(vla); 
   elementType = VlaSize.Type; 
   divisor = VlaSize.NumElts; 
  
   // Scale the number of non-VLA elements by the non-VLA element size. 
   CharUnits eltSize = CGF.getContext().getTypeSizeInChars(elementType); 
   if (!eltSize.isOne()) 
     divisor = CGF.Builder.CreateNUWMul(CGF.CGM.getSize(eltSize), divisor); 
  
 // For everything else, we can just compute it, safe in the 
 // assumption that Sema won't let anything through that we can't 
 // safely compute the size of. 
 } else { 
   CharUnits elementSize; 
   // Handle GCC extension for pointer arithmetic on void* and 
   // function pointer types. 
   if (elementType->isVoidType() || elementType->isFunctionType()) 
     elementSize = CharUnits::One(); 
   else 
     elementSize = CGF.getContext().getTypeSizeInChars(elementType); 
  
   // Don't even emit the divide for element size of 1. 
   if (elementSize.isOne()) 
     return diffInChars; 
  
   divisor = CGF.CGM.getSize(elementSize); 
 } 
  
 // Otherwise, do a full sdiv. This uses the "exact" form of sdiv, since 
 // pointer difference in C is only defined in the case where both operands 
 // are pointing to elements of an array. 
 return Builder.CreateExactSDiv(diffInChars, divisor, "sub.ptr.div"); 
+; CHECK-LABEL: @icmp_ptrdiff_gt(
+; CHECK-NEXT:    [[TMP4:%.*]] = getelementptr inbounds nuw i8, ptr [[TMP0:%.*]], i64 1
+; CHECK-NEXT:    [[TMP10:%.*]] = icmp ugt ptr [[TMP4]], [[TMP2:%.*]]
+; CHECK-NEXT:    [[TMP11:%.*]] = select i1 [[TMP10]], ptr [[TMP2]], ptr [[TMP4]]
+; CHECK-NEXT:    ret ptr [[TMP11]]
+;
+  %4 = getelementptr inbounds nuw i8, ptr %0, i64 1
+  %5 = ptrtoint ptr %4 to i64
+  %6 = ptrtoint ptr %1 to i64
+  %7 = sub i64 %5, %6
+  %8 = ptrtoint ptr %2 to i64
+  %9 = sub i64 %8, %6
+  %10 = icmp sgt i64 %7, %9
+  %11 = select i1 %10, ptr %2, ptr %4
+  ret ptr %11
+}
+
+; Signed less-than between two pointer differences, (ptrtoint(%4) - ptrtoint(%1))
+; and (ptrtoint(%2) - ptrtoint(%1)), which share the subtrahend %1. The CHECK
+; lines expect the subtractions to be removed and the compare to become an
+; unsigned `icmp ult` directly on the pointers.
+define ptr @icmp_ptrdiff_lt(ptr %0, ptr %1, ptr %2) {
+; CHECK-LABEL: @icmp_ptrdiff_lt(
+; CHECK-NEXT:    [[TMP4:%.*]] = getelementptr inbounds nuw i8, ptr [[TMP0:%.*]], i64 1
+; CHECK-NEXT:    [[TMP10:%.*]] = icmp ult ptr [[TMP4]], [[TMP2:%.*]]
+; CHECK-NEXT:    [[TMP11:%.*]] = select i1 [[TMP10]], ptr [[TMP2]], ptr [[TMP4]]
+; CHECK-NEXT:    ret ptr [[TMP11]]
+;
+  %4 = getelementptr inbounds nuw i8, ptr %0, i64 1
+  %5 = ptrtoint ptr %4 to i64
+  %6 = ptrtoint ptr %1 to i64
+  %7 = sub i64 %5, %6
+  %8 = ptrtoint ptr %2 to i64
+  %9 = sub i64 %8, %6
+  %10 = icmp slt i64 %7, %9
+  %11 = select i1 %10, ptr %2, ptr %4
+  ret ptr %11
+}
+
+; Signed greater-or-equal variant of the pointer-difference compare in which
+; both subtractions share the subtrahend %1. The CHECK lines expect an unsigned
+; compare directly on the pointers, emitted in its inverted form (`icmp ult`)
+; with the select arms swapped.
+define ptr @icmp_ptrdiff_ge(ptr %0, ptr %1, ptr %2) {
+; CHECK-LABEL: @icmp_ptrdiff_ge(
+; CHECK-NEXT:    [[TMP4:%.*]] = getelementptr inbounds nuw i8, ptr [[TMP0:%.*]], i64 1
+; CHECK-NEXT:    [[DOTNOT:%.*]] = icmp ult ptr [[TMP4]], [[TMP2:%.*]]
+; CHECK-NEXT:    [[TMP10:%.*]] = select i1 [[DOTNOT]], ptr [[TMP4]], ptr [[TMP2]]
+; CHECK-NEXT:    ret ptr [[TMP10]]
+;
+  %4 = getelementptr inbounds nuw i8, ptr %0, i64 1
+  %5 = ptrtoint ptr %4 to i64
+  %6 = ptrtoint ptr %1 to i64
+  %7 = sub i64 %5, %6
+  %8 = ptrtoint ptr %2 to i64
+  %9 = sub i64 %8, %6
+  %10 = icmp sge i64 %7, %9
+  %11 = select i1 %10, ptr %2, ptr %4
+  ret ptr %11
+}
+
+; Signed less-or-equal variant of the pointer-difference compare in which both
+; subtractions share the subtrahend %1. The CHECK lines expect an unsigned
+; compare directly on the pointers, emitted in its inverted form (`icmp ugt`)
+; with the select arms swapped.
+define ptr @icmp_ptrdiff_le(ptr %0, ptr %1, ptr %2) {
+; CHECK-LABEL: @icmp_ptrdiff_le(
+; CHECK-NEXT:    [[TMP4:%.*]] = getelementptr inbounds nuw i8, ptr [[TMP0:%.*]], i64 1
+; CHECK-NEXT:    [[DOTNOT:%.*]] = icmp ugt ptr [[TMP4]], [[TMP2:%.*]]
+; CHECK-NEXT:    [[TMP10:%.*]] = select i1 [[DOTNOT]], ptr [[TMP4]], ptr [[TMP2]]
+; CHECK-NEXT:    ret ptr [[TMP10]]
+;
+  %4 = getelementptr inbounds nuw i8, ptr %0, i64 1
+  %5 = ptrtoint ptr %4 to i64
+  %6 = ptrtoint ptr %1 to i64
+  %7 = sub i64 %5, %6
+  %8 = ptrtoint ptr %2 to i64
+  %9 = sub i64 %8, %6
+  %10 = icmp sle i64 %7, %9
+  %11 = select i1 %10, ptr %2, ptr %4
+  ret ptr %11
+}
+
+; Equality variant of the pointer-difference compare in which both subtractions
+; share the subtrahend %1. The CHECK lines expect both the compare and the
+; select to fold away, leaving only the GEP result to be returned.
+define ptr @icmp_ptrdiff_eq(ptr %0, ptr %1, ptr %2) {
+; CHECK-LABEL: @icmp_ptrdiff_eq(
+; CHECK-NEXT:    [[TMP4:%.*]] = getelementptr inbounds nuw i8, ptr [[TMP0:%.*]], i64 1
+; CHECK-NEXT:    ret ptr [[TMP4]]
+;
+  %4 = getelementptr inbounds nuw i8, ptr %0, i64 1
+  %5 = ptrtoint ptr %4 to i64
+  %6 = ptrtoint ptr %1 to i64
+  %7 = sub i64 %5, %6
+  %8 = ptrtoint ptr %2 to i64
+  %9 = sub i64 %8, %6
+  %10 = icmp eq i64 %7, %9
+  %11 = select i1 %10, ptr %2, ptr %4
+  ret ptr %11
+}
+
+; Inequality variant of the pointer-difference compare in which both
+; subtractions share the subtrahend %1. The CHECK lines expect the subtractions
+; to be removed, with an `icmp eq` directly on the pointers and the select arms
+; swapped.
+define ptr @icmp_ptrdiff_ne(ptr %0, ptr %1, ptr %2) {
+; CHECK-LABEL: @icmp_ptrdiff_ne(
+; CHECK-NEXT:    [[TMP4:%.*]] = getelementptr inbounds nuw i8, ptr [[TMP0:%.*]], i64 1
+; CHECK-NEXT:    [[DOTNOT:%.*]] = icmp eq ptr [[TMP4]], [[TMP2:%.*]]
+; CHECK-NEXT:    [[TMP5:%.*]] = select i1 [[DOTNOT]], ptr [[TMP4]], ptr [[TMP2]]
+; CHECK-NEXT:    ret ptr [[TMP5]]
+;
+  %4 = getelementptr inbounds nuw i8, ptr %0, i64 1
+  %5 = ptrtoint ptr %4 to i64
+  %6 = ptrtoint ptr %1 to i64
+  %7 = sub i64 %5, %6
+  %8 = ptrtoint ptr %2 to i64
+  %9 = sub i64 %8, %6
+  %10 = icmp ne i64 %7, %9
+  %11 = select i1 %10, ptr %2, ptr %4
+  ret ptr %11
+}
+