xref: /freebsd-src/contrib/llvm-project/clang/lib/StaticAnalyzer/Core/RangedConstraintManager.cpp (revision 81ad626541db97eb356e2c1d4a20eb2a26a766ab)
10b57cec5SDimitry Andric //== RangedConstraintManager.cpp --------------------------------*- C++ -*--==//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric //  This file defines RangedConstraintManager, a class that provides a
100b57cec5SDimitry Andric //  range-based constraint manager interface.
110b57cec5SDimitry Andric //
120b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
130b57cec5SDimitry Andric 
140b57cec5SDimitry Andric #include "clang/StaticAnalyzer/Core/PathSensitive/ProgramState.h"
150b57cec5SDimitry Andric #include "clang/StaticAnalyzer/Core/PathSensitive/RangedConstraintManager.h"
160b57cec5SDimitry Andric 
170b57cec5SDimitry Andric namespace clang {
180b57cec5SDimitry Andric 
190b57cec5SDimitry Andric namespace ento {
200b57cec5SDimitry Andric 
~RangedConstraintManager()210b57cec5SDimitry Andric RangedConstraintManager::~RangedConstraintManager() {}
220b57cec5SDimitry Andric 
assumeSym(ProgramStateRef State,SymbolRef Sym,bool Assumption)230b57cec5SDimitry Andric ProgramStateRef RangedConstraintManager::assumeSym(ProgramStateRef State,
240b57cec5SDimitry Andric                                                    SymbolRef Sym,
250b57cec5SDimitry Andric                                                    bool Assumption) {
26fe6060f1SDimitry Andric   Sym = simplify(State, Sym);
27fe6060f1SDimitry Andric 
280b57cec5SDimitry Andric   // Handle SymbolData.
29fe6060f1SDimitry Andric   if (isa<SymbolData>(Sym))
300b57cec5SDimitry Andric     return assumeSymUnsupported(State, Sym, Assumption);
310b57cec5SDimitry Andric 
320b57cec5SDimitry Andric   // Handle symbolic expression.
33fe6060f1SDimitry Andric   if (const SymIntExpr *SIE = dyn_cast<SymIntExpr>(Sym)) {
340b57cec5SDimitry Andric     // We can only simplify expressions whose RHS is an integer.
350b57cec5SDimitry Andric 
360b57cec5SDimitry Andric     BinaryOperator::Opcode op = SIE->getOpcode();
370b57cec5SDimitry Andric     if (BinaryOperator::isComparisonOp(op) && op != BO_Cmp) {
380b57cec5SDimitry Andric       if (!Assumption)
390b57cec5SDimitry Andric         op = BinaryOperator::negateComparisonOp(op);
400b57cec5SDimitry Andric 
410b57cec5SDimitry Andric       return assumeSymRel(State, SIE->getLHS(), op, SIE->getRHS());
420b57cec5SDimitry Andric     }
430b57cec5SDimitry Andric 
44349cc55cSDimitry Andric     // Handle adjustment with non-comparison ops.
45349cc55cSDimitry Andric     const llvm::APSInt &Zero = getBasicVals().getValue(0, SIE->getType());
46349cc55cSDimitry Andric     return assumeSymRel(State, SIE, (Assumption ? BO_NE : BO_EQ), Zero);
47349cc55cSDimitry Andric   }
48349cc55cSDimitry Andric 
49349cc55cSDimitry Andric   if (const auto *SSE = dyn_cast<SymSymExpr>(Sym)) {
50e8d8bef9SDimitry Andric     BinaryOperator::Opcode Op = SSE->getOpcode();
51*81ad6265SDimitry Andric     if (BinaryOperator::isComparisonOp(Op)) {
52e8d8bef9SDimitry Andric 
53e8d8bef9SDimitry Andric       // We convert equality operations for pointers only.
54e8d8bef9SDimitry Andric       if (Loc::isLocType(SSE->getLHS()->getType()) &&
55e8d8bef9SDimitry Andric           Loc::isLocType(SSE->getRHS()->getType())) {
560b57cec5SDimitry Andric         // Translate "a != b" to "(b - a) != 0".
570b57cec5SDimitry Andric         // We invert the order of the operands as a heuristic for how loop
580b57cec5SDimitry Andric         // conditions are usually written ("begin != end") as compared to length
59*81ad6265SDimitry Andric         // calculations ("end - begin"). The more correct thing to do would be
60*81ad6265SDimitry Andric         // to canonicalize "a - b" and "b - a", which would allow us to treat
610b57cec5SDimitry Andric         // "a != b" and "b != a" the same.
620b57cec5SDimitry Andric 
63e8d8bef9SDimitry Andric         SymbolManager &SymMgr = getSymbolManager();
640b57cec5SDimitry Andric         QualType DiffTy = SymMgr.getContext().getPointerDiffType();
650b57cec5SDimitry Andric         SymbolRef Subtraction =
660b57cec5SDimitry Andric             SymMgr.getSymSymExpr(SSE->getRHS(), BO_Sub, SSE->getLHS(), DiffTy);
670b57cec5SDimitry Andric 
680b57cec5SDimitry Andric         const llvm::APSInt &Zero = getBasicVals().getValue(0, DiffTy);
690b57cec5SDimitry Andric         Op = BinaryOperator::reverseComparisonOp(Op);
700b57cec5SDimitry Andric         if (!Assumption)
710b57cec5SDimitry Andric           Op = BinaryOperator::negateComparisonOp(Op);
720b57cec5SDimitry Andric         return assumeSymRel(State, Subtraction, Op, Zero);
730b57cec5SDimitry Andric       }
74e8d8bef9SDimitry Andric 
75e8d8bef9SDimitry Andric       if (BinaryOperator::isEqualityOp(Op)) {
76e8d8bef9SDimitry Andric         SymbolManager &SymMgr = getSymbolManager();
77e8d8bef9SDimitry Andric 
78e8d8bef9SDimitry Andric         QualType ExprType = SSE->getType();
79e8d8bef9SDimitry Andric         SymbolRef CanonicalEquality =
80e8d8bef9SDimitry Andric             SymMgr.getSymSymExpr(SSE->getLHS(), BO_EQ, SSE->getRHS(), ExprType);
81e8d8bef9SDimitry Andric 
82e8d8bef9SDimitry Andric         bool WasEqual = SSE->getOpcode() == BO_EQ;
83e8d8bef9SDimitry Andric         bool IsExpectedEqual = WasEqual == Assumption;
84e8d8bef9SDimitry Andric 
85e8d8bef9SDimitry Andric         const llvm::APSInt &Zero = getBasicVals().getValue(0, ExprType);
86e8d8bef9SDimitry Andric 
87e8d8bef9SDimitry Andric         if (IsExpectedEqual) {
88e8d8bef9SDimitry Andric           return assumeSymNE(State, CanonicalEquality, Zero, Zero);
89e8d8bef9SDimitry Andric         }
90e8d8bef9SDimitry Andric 
91e8d8bef9SDimitry Andric         return assumeSymEQ(State, CanonicalEquality, Zero, Zero);
92e8d8bef9SDimitry Andric       }
930b57cec5SDimitry Andric     }
94*81ad6265SDimitry Andric   }
950b57cec5SDimitry Andric 
960b57cec5SDimitry Andric   // If we get here, there's nothing else we can do but treat the symbol as
970b57cec5SDimitry Andric   // opaque.
980b57cec5SDimitry Andric   return assumeSymUnsupported(State, Sym, Assumption);
990b57cec5SDimitry Andric }
1000b57cec5SDimitry Andric 
assumeSymInclusiveRange(ProgramStateRef State,SymbolRef Sym,const llvm::APSInt & From,const llvm::APSInt & To,bool InRange)1010b57cec5SDimitry Andric ProgramStateRef RangedConstraintManager::assumeSymInclusiveRange(
1020b57cec5SDimitry Andric     ProgramStateRef State, SymbolRef Sym, const llvm::APSInt &From,
1030b57cec5SDimitry Andric     const llvm::APSInt &To, bool InRange) {
104fe6060f1SDimitry Andric 
105fe6060f1SDimitry Andric   Sym = simplify(State, Sym);
106fe6060f1SDimitry Andric 
1070b57cec5SDimitry Andric   // Get the type used for calculating wraparound.
1080b57cec5SDimitry Andric   BasicValueFactory &BVF = getBasicVals();
1090b57cec5SDimitry Andric   APSIntType WraparoundType = BVF.getAPSIntType(Sym->getType());
1100b57cec5SDimitry Andric 
1110b57cec5SDimitry Andric   llvm::APSInt Adjustment = WraparoundType.getZeroValue();
1120b57cec5SDimitry Andric   SymbolRef AdjustedSym = Sym;
1130b57cec5SDimitry Andric   computeAdjustment(AdjustedSym, Adjustment);
1140b57cec5SDimitry Andric 
1150b57cec5SDimitry Andric   // Convert the right-hand side integer as necessary.
1160b57cec5SDimitry Andric   APSIntType ComparisonType = std::max(WraparoundType, APSIntType(From));
1170b57cec5SDimitry Andric   llvm::APSInt ConvertedFrom = ComparisonType.convert(From);
1180b57cec5SDimitry Andric   llvm::APSInt ConvertedTo = ComparisonType.convert(To);
1190b57cec5SDimitry Andric 
1200b57cec5SDimitry Andric   // Prefer unsigned comparisons.
1210b57cec5SDimitry Andric   if (ComparisonType.getBitWidth() == WraparoundType.getBitWidth() &&
1220b57cec5SDimitry Andric       ComparisonType.isUnsigned() && !WraparoundType.isUnsigned())
1230b57cec5SDimitry Andric     Adjustment.setIsSigned(false);
1240b57cec5SDimitry Andric 
1250b57cec5SDimitry Andric   if (InRange)
1260b57cec5SDimitry Andric     return assumeSymWithinInclusiveRange(State, AdjustedSym, ConvertedFrom,
1270b57cec5SDimitry Andric                                          ConvertedTo, Adjustment);
1280b57cec5SDimitry Andric   return assumeSymOutsideInclusiveRange(State, AdjustedSym, ConvertedFrom,
1290b57cec5SDimitry Andric                                         ConvertedTo, Adjustment);
1300b57cec5SDimitry Andric }
1310b57cec5SDimitry Andric 
1320b57cec5SDimitry Andric ProgramStateRef
assumeSymUnsupported(ProgramStateRef State,SymbolRef Sym,bool Assumption)1330b57cec5SDimitry Andric RangedConstraintManager::assumeSymUnsupported(ProgramStateRef State,
1340b57cec5SDimitry Andric                                               SymbolRef Sym, bool Assumption) {
135fe6060f1SDimitry Andric   Sym = simplify(State, Sym);
136fe6060f1SDimitry Andric 
1370b57cec5SDimitry Andric   BasicValueFactory &BVF = getBasicVals();
1380b57cec5SDimitry Andric   QualType T = Sym->getType();
1390b57cec5SDimitry Andric 
1400b57cec5SDimitry Andric   // Non-integer types are not supported.
1410b57cec5SDimitry Andric   if (!T->isIntegralOrEnumerationType())
1420b57cec5SDimitry Andric     return State;
1430b57cec5SDimitry Andric 
1440b57cec5SDimitry Andric   // Reverse the operation and add directly to state.
1450b57cec5SDimitry Andric   const llvm::APSInt &Zero = BVF.getValue(0, T);
1460b57cec5SDimitry Andric   if (Assumption)
1470b57cec5SDimitry Andric     return assumeSymNE(State, Sym, Zero, Zero);
1480b57cec5SDimitry Andric   else
1490b57cec5SDimitry Andric     return assumeSymEQ(State, Sym, Zero, Zero);
1500b57cec5SDimitry Andric }
1510b57cec5SDimitry Andric 
assumeSymRel(ProgramStateRef State,SymbolRef Sym,BinaryOperator::Opcode Op,const llvm::APSInt & Int)1520b57cec5SDimitry Andric ProgramStateRef RangedConstraintManager::assumeSymRel(ProgramStateRef State,
1530b57cec5SDimitry Andric                                                       SymbolRef Sym,
1540b57cec5SDimitry Andric                                                       BinaryOperator::Opcode Op,
1550b57cec5SDimitry Andric                                                       const llvm::APSInt &Int) {
1560b57cec5SDimitry Andric   assert(BinaryOperator::isComparisonOp(Op) &&
1570b57cec5SDimitry Andric          "Non-comparison ops should be rewritten as comparisons to zero.");
1580b57cec5SDimitry Andric 
1590b57cec5SDimitry Andric   // Simplification: translate an assume of a constraint of the form
1600b57cec5SDimitry Andric   // "(exp comparison_op expr) != 0" to true into an assume of
1610b57cec5SDimitry Andric   // "exp comparison_op expr" to true. (And similarly, an assume of the form
1620b57cec5SDimitry Andric   // "(exp comparison_op expr) == 0" to true into an assume of
1630b57cec5SDimitry Andric   // "exp comparison_op expr" to false.)
1640b57cec5SDimitry Andric   if (Int == 0 && (Op == BO_EQ || Op == BO_NE)) {
1650b57cec5SDimitry Andric     if (const BinarySymExpr *SE = dyn_cast<BinarySymExpr>(Sym))
1660b57cec5SDimitry Andric       if (BinaryOperator::isComparisonOp(SE->getOpcode()))
1670b57cec5SDimitry Andric         return assumeSym(State, Sym, (Op == BO_NE ? true : false));
1680b57cec5SDimitry Andric   }
1690b57cec5SDimitry Andric 
1700b57cec5SDimitry Andric   // Get the type used for calculating wraparound.
1710b57cec5SDimitry Andric   BasicValueFactory &BVF = getBasicVals();
1720b57cec5SDimitry Andric   APSIntType WraparoundType = BVF.getAPSIntType(Sym->getType());
1730b57cec5SDimitry Andric 
1740b57cec5SDimitry Andric   // We only handle simple comparisons of the form "$sym == constant"
1750b57cec5SDimitry Andric   // or "($sym+constant1) == constant2".
1760b57cec5SDimitry Andric   // The adjustment is "constant1" in the above expression. It's used to
1770b57cec5SDimitry Andric   // "slide" the solution range around for modular arithmetic. For example,
1780b57cec5SDimitry Andric   // x < 4 has the solution [0, 3]. x+2 < 4 has the solution [0-2, 3-2], which
1790b57cec5SDimitry Andric   // in modular arithmetic is [0, 1] U [UINT_MAX-1, UINT_MAX]. It's up to
1800b57cec5SDimitry Andric   // the subclasses of SimpleConstraintManager to handle the adjustment.
1810b57cec5SDimitry Andric   llvm::APSInt Adjustment = WraparoundType.getZeroValue();
1820b57cec5SDimitry Andric   computeAdjustment(Sym, Adjustment);
1830b57cec5SDimitry Andric 
1840b57cec5SDimitry Andric   // Convert the right-hand side integer as necessary.
1850b57cec5SDimitry Andric   APSIntType ComparisonType = std::max(WraparoundType, APSIntType(Int));
1860b57cec5SDimitry Andric   llvm::APSInt ConvertedInt = ComparisonType.convert(Int);
1870b57cec5SDimitry Andric 
1880b57cec5SDimitry Andric   // Prefer unsigned comparisons.
1890b57cec5SDimitry Andric   if (ComparisonType.getBitWidth() == WraparoundType.getBitWidth() &&
1900b57cec5SDimitry Andric       ComparisonType.isUnsigned() && !WraparoundType.isUnsigned())
1910b57cec5SDimitry Andric     Adjustment.setIsSigned(false);
1920b57cec5SDimitry Andric 
1930b57cec5SDimitry Andric   switch (Op) {
1940b57cec5SDimitry Andric   default:
1950b57cec5SDimitry Andric     llvm_unreachable("invalid operation not caught by assertion above");
1960b57cec5SDimitry Andric 
1970b57cec5SDimitry Andric   case BO_EQ:
1980b57cec5SDimitry Andric     return assumeSymEQ(State, Sym, ConvertedInt, Adjustment);
1990b57cec5SDimitry Andric 
2000b57cec5SDimitry Andric   case BO_NE:
2010b57cec5SDimitry Andric     return assumeSymNE(State, Sym, ConvertedInt, Adjustment);
2020b57cec5SDimitry Andric 
2030b57cec5SDimitry Andric   case BO_GT:
2040b57cec5SDimitry Andric     return assumeSymGT(State, Sym, ConvertedInt, Adjustment);
2050b57cec5SDimitry Andric 
2060b57cec5SDimitry Andric   case BO_GE:
2070b57cec5SDimitry Andric     return assumeSymGE(State, Sym, ConvertedInt, Adjustment);
2080b57cec5SDimitry Andric 
2090b57cec5SDimitry Andric   case BO_LT:
2100b57cec5SDimitry Andric     return assumeSymLT(State, Sym, ConvertedInt, Adjustment);
2110b57cec5SDimitry Andric 
2120b57cec5SDimitry Andric   case BO_LE:
2130b57cec5SDimitry Andric     return assumeSymLE(State, Sym, ConvertedInt, Adjustment);
2140b57cec5SDimitry Andric   } // end switch
2150b57cec5SDimitry Andric }
2160b57cec5SDimitry Andric 
computeAdjustment(SymbolRef & Sym,llvm::APSInt & Adjustment)2170b57cec5SDimitry Andric void RangedConstraintManager::computeAdjustment(SymbolRef &Sym,
2180b57cec5SDimitry Andric                                                 llvm::APSInt &Adjustment) {
2190b57cec5SDimitry Andric   // Is it a "($sym+constant1)" expression?
2200b57cec5SDimitry Andric   if (const SymIntExpr *SE = dyn_cast<SymIntExpr>(Sym)) {
2210b57cec5SDimitry Andric     BinaryOperator::Opcode Op = SE->getOpcode();
2220b57cec5SDimitry Andric     if (Op == BO_Add || Op == BO_Sub) {
2230b57cec5SDimitry Andric       Sym = SE->getLHS();
2240b57cec5SDimitry Andric       Adjustment = APSIntType(Adjustment).convert(SE->getRHS());
2250b57cec5SDimitry Andric 
2260b57cec5SDimitry Andric       // Don't forget to negate the adjustment if it's being subtracted.
2270b57cec5SDimitry Andric       // This should happen /after/ promotion, in case the value being
2280b57cec5SDimitry Andric       // subtracted is, say, CHAR_MIN, and the promoted type is 'int'.
2290b57cec5SDimitry Andric       if (Op == BO_Sub)
2300b57cec5SDimitry Andric         Adjustment = -Adjustment;
2310b57cec5SDimitry Andric     }
2320b57cec5SDimitry Andric   }
2330b57cec5SDimitry Andric }
2340b57cec5SDimitry Andric 
simplifyToSVal(ProgramStateRef State,SymbolRef Sym)235349cc55cSDimitry Andric SVal simplifyToSVal(ProgramStateRef State, SymbolRef Sym) {
236fe6060f1SDimitry Andric   SValBuilder &SVB = State->getStateManager().getSValBuilder();
237349cc55cSDimitry Andric   return SVB.simplifySVal(State, SVB.makeSymbolVal(Sym));
238349cc55cSDimitry Andric }
239349cc55cSDimitry Andric 
simplify(ProgramStateRef State,SymbolRef Sym)240349cc55cSDimitry Andric SymbolRef simplify(ProgramStateRef State, SymbolRef Sym) {
241349cc55cSDimitry Andric   SVal SimplifiedVal = simplifyToSVal(State, Sym);
242fe6060f1SDimitry Andric   if (SymbolRef SimplifiedSym = SimplifiedVal.getAsSymbol())
243fe6060f1SDimitry Andric     return SimplifiedSym;
244fe6060f1SDimitry Andric   return Sym;
245fe6060f1SDimitry Andric }
2460b57cec5SDimitry Andric 
247fe6060f1SDimitry Andric } // end of namespace ento
2480b57cec5SDimitry Andric } // end of namespace clang
249