blob: 4fd06f24c5bc6f1228015f29874a84fe6dc9e458 [file] [log] [blame]
// MallocOverflowSecurityChecker.cpp - Check for malloc overflows -*- C++ -*-=//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This checker detects a common memory allocation security flaw.
// Suppose 'unsigned int n' comes from an untrusted source. If the
// code looks like 'malloc (n * 4)', and an attacker can make 'n' be
// say MAX_UINT/4+2, then instead of allocating the correct 'n' 4-byte
// elements, this will actually allocate only two because of overflow.
// Then when the rest of the program attempts to store values past the
// second element, these values will actually overwrite other items in
// the heap, probably allowing the attacker to execute arbitrary code.
//
//===----------------------------------------------------------------------===//
19
Kristof Umann76a21502018-12-15 16:23:51 +000020#include "clang/StaticAnalyzer/Checkers/BuiltinCheckerRegistration.h"
Ted Kremenek1c2fb272011-08-03 20:17:43 +000021#include "clang/AST/EvaluatedExprVisitor.h"
Ted Kremenek1c2fb272011-08-03 20:17:43 +000022#include "clang/StaticAnalyzer/Core/BugReporter/BugReporter.h"
Chandler Carruth3a022472012-12-04 09:13:33 +000023#include "clang/StaticAnalyzer/Core/Checker.h"
24#include "clang/StaticAnalyzer/Core/PathSensitive/AnalysisManager.h"
Devin Coughlin683dfd32015-09-23 23:27:55 +000025#include "llvm/ADT/APSInt.h"
Ted Kremenek1c2fb272011-08-03 20:17:43 +000026#include "llvm/ADT/SmallVector.h"
Benjamin Kramercfeacf52016-05-27 14:27:13 +000027#include <utility>
Ted Kremenek1c2fb272011-08-03 20:17:43 +000028
29using namespace clang;
30using namespace ento;
Devin Coughlin683dfd32015-09-23 23:27:55 +000031using llvm::APSInt;
Ted Kremenek1c2fb272011-08-03 20:17:43 +000032
33namespace {
34struct MallocOverflowCheck {
35 const BinaryOperator *mulop;
36 const Expr *variable;
Devin Coughlin683dfd32015-09-23 23:27:55 +000037 APSInt maxVal;
Ted Kremenek1c2fb272011-08-03 20:17:43 +000038
Devin Coughlin683dfd32015-09-23 23:27:55 +000039 MallocOverflowCheck(const BinaryOperator *m, const Expr *v, APSInt val)
Benjamin Kramercfeacf52016-05-27 14:27:13 +000040 : mulop(m), variable(v), maxVal(std::move(val)) {}
Ted Kremenek1c2fb272011-08-03 20:17:43 +000041};
42
43class MallocOverflowSecurityChecker : public Checker<check::ASTCodeBody> {
44public:
45 void checkASTCodeBody(const Decl *D, AnalysisManager &mgr,
46 BugReporter &BR) const;
47
48 void CheckMallocArgument(
Dmitri Gribenkof8579502013-01-12 19:30:44 +000049 SmallVectorImpl<MallocOverflowCheck> &PossibleMallocOverflows,
Ted Kremenek1c2fb272011-08-03 20:17:43 +000050 const Expr *TheArgument, ASTContext &Context) const;
51
52 void OutputPossibleOverflows(
Dmitri Gribenkof8579502013-01-12 19:30:44 +000053 SmallVectorImpl<MallocOverflowCheck> &PossibleMallocOverflows,
Ted Kremenek1c2fb272011-08-03 20:17:43 +000054 const Decl *D, BugReporter &BR, AnalysisManager &mgr) const;
55
56};
57} // end anonymous namespace
58
Devin Coughlin683dfd32015-09-23 23:27:55 +000059// Return true for computations which evaluate to zero: e.g., mult by 0.
60static inline bool EvaluatesToZero(APSInt &Val, BinaryOperatorKind op) {
61 return (op == BO_Mul) && (Val == 0);
62}
63
Ted Kremenek1c2fb272011-08-03 20:17:43 +000064void MallocOverflowSecurityChecker::CheckMallocArgument(
Dmitri Gribenkof8579502013-01-12 19:30:44 +000065 SmallVectorImpl<MallocOverflowCheck> &PossibleMallocOverflows,
Ted Kremenek1c2fb272011-08-03 20:17:43 +000066 const Expr *TheArgument,
67 ASTContext &Context) const {
68
69 /* Look for a linear combination with a single variable, and at least
70 one multiplication.
71 Reject anything that applies to the variable: an explicit cast,
72 conditional expression, an operation that could reduce the range
73 of the result, or anything too complicated :-). */
Devin Coughlin683dfd32015-09-23 23:27:55 +000074 const Expr *e = TheArgument;
Craig Topper0dbb7832014-05-27 02:45:47 +000075 const BinaryOperator * mulop = nullptr;
Devin Coughlin683dfd32015-09-23 23:27:55 +000076 APSInt maxVal;
Ted Kremenek1c2fb272011-08-03 20:17:43 +000077
78 for (;;) {
Devin Coughlin683dfd32015-09-23 23:27:55 +000079 maxVal = 0;
Ted Kremenek1c2fb272011-08-03 20:17:43 +000080 e = e->IgnoreParenImpCasts();
Devin Coughlin683dfd32015-09-23 23:27:55 +000081 if (const BinaryOperator *binop = dyn_cast<BinaryOperator>(e)) {
Ted Kremenek1c2fb272011-08-03 20:17:43 +000082 BinaryOperatorKind opc = binop->getOpcode();
83 // TODO: ignore multiplications by 1, reject if multiplied by 0.
Craig Topper0dbb7832014-05-27 02:45:47 +000084 if (mulop == nullptr && opc == BO_Mul)
Ted Kremenek1c2fb272011-08-03 20:17:43 +000085 mulop = binop;
86 if (opc != BO_Mul && opc != BO_Add && opc != BO_Sub && opc != BO_Shl)
87 return;
88
89 const Expr *lhs = binop->getLHS();
90 const Expr *rhs = binop->getRHS();
Devin Coughlin683dfd32015-09-23 23:27:55 +000091 if (rhs->isEvaluatable(Context)) {
Ted Kremenek1c2fb272011-08-03 20:17:43 +000092 e = lhs;
Devin Coughlin683dfd32015-09-23 23:27:55 +000093 maxVal = rhs->EvaluateKnownConstInt(Context);
94 if (EvaluatesToZero(maxVal, opc))
95 return;
96 } else if ((opc == BO_Add || opc == BO_Mul) &&
97 lhs->isEvaluatable(Context)) {
98 maxVal = lhs->EvaluateKnownConstInt(Context);
99 if (EvaluatesToZero(maxVal, opc))
100 return;
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000101 e = rhs;
Devin Coughlin683dfd32015-09-23 23:27:55 +0000102 } else
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000103 return;
104 }
105 else if (isa<DeclRefExpr>(e) || isa<MemberExpr>(e))
106 break;
107 else
108 return;
109 }
110
Craig Topper0dbb7832014-05-27 02:45:47 +0000111 if (mulop == nullptr)
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000112 return;
113
114 // We've found the right structure of malloc argument, now save
115 // the data so when the body of the function is completely available
116 // we can check for comparisons.
117
118 // TODO: Could push this into the innermost scope where 'e' is
119 // defined, rather than the whole function.
Devin Coughlin683dfd32015-09-23 23:27:55 +0000120 PossibleMallocOverflows.push_back(MallocOverflowCheck(mulop, e, maxVal));
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000121}
122
123namespace {
124// A worker class for OutputPossibleOverflows.
125class CheckOverflowOps :
126 public EvaluatedExprVisitor<CheckOverflowOps> {
127public:
Dmitri Gribenkof8579502013-01-12 19:30:44 +0000128 typedef SmallVectorImpl<MallocOverflowCheck> theVecType;
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000129
130private:
131 theVecType &toScanFor;
132 ASTContext &Context;
133
134 bool isIntZeroExpr(const Expr *E) const {
Richard Smithcaf33902011-10-10 18:28:20 +0000135 if (!E->getType()->isIntegralOrEnumerationType())
136 return false;
Fangrui Song407659a2018-11-30 23:41:18 +0000137 Expr::EvalResult Result;
Richard Smithcaf33902011-10-10 18:28:20 +0000138 if (E->EvaluateAsInt(Result, Context))
Fangrui Song407659a2018-11-30 23:41:18 +0000139 return Result.Val.getInt() == 0;
Richard Smithcaf33902011-10-10 18:28:20 +0000140 return false;
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000141 }
142
Benjamin Kramer6ec90ec2016-07-09 12:16:58 +0000143 static const Decl *getDecl(const DeclRefExpr *DR) { return DR->getDecl(); }
144 static const Decl *getDecl(const MemberExpr *ME) {
145 return ME->getMemberDecl();
146 }
Devin Coughlin683dfd32015-09-23 23:27:55 +0000147
148 template <typename T1>
Benjamin Kramer951a6282016-07-09 11:16:56 +0000149 void Erase(const T1 *DR,
Benjamin Kramer6ec90ec2016-07-09 12:16:58 +0000150 llvm::function_ref<bool(const MallocOverflowCheck &)> Pred) {
151 auto P = [DR, Pred](const MallocOverflowCheck &Check) {
Benjamin Kramer951a6282016-07-09 11:16:56 +0000152 if (const auto *CheckDR = dyn_cast<T1>(Check.variable))
153 return getDecl(CheckDR) == getDecl(DR) && Pred(Check);
154 return false;
155 };
156 toScanFor.erase(std::remove_if(toScanFor.begin(), toScanFor.end(), P),
157 toScanFor.end());
Devin Coughlin683dfd32015-09-23 23:27:55 +0000158 }
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000159
Devin Coughlin683dfd32015-09-23 23:27:55 +0000160 void CheckExpr(const Expr *E_p) {
Benjamin Kramer6ec90ec2016-07-09 12:16:58 +0000161 auto PredTrue = [](const MallocOverflowCheck &) { return true; };
Devin Coughlin683dfd32015-09-23 23:27:55 +0000162 const Expr *E = E_p->IgnoreParenImpCasts();
163 if (const DeclRefExpr *DR = dyn_cast<DeclRefExpr>(E))
Benjamin Kramer6ec90ec2016-07-09 12:16:58 +0000164 Erase<DeclRefExpr>(DR, PredTrue);
Benjamin Kramera008d3a2015-04-10 11:37:55 +0000165 else if (const auto *ME = dyn_cast<MemberExpr>(E)) {
Benjamin Kramer6ec90ec2016-07-09 12:16:58 +0000166 Erase<MemberExpr>(ME, PredTrue);
Devin Coughlin683dfd32015-09-23 23:27:55 +0000167 }
168 }
169
170 // Check if the argument to malloc is assigned a value
171 // which cannot cause an overflow.
172 // e.g., malloc (mul * x) and,
173 // case 1: mul = <constant value>
174 // case 2: mul = a/b, where b > x
175 void CheckAssignmentExpr(BinaryOperator *AssignEx) {
176 bool assignKnown = false;
177 bool numeratorKnown = false, denomKnown = false;
178 APSInt denomVal;
179 denomVal = 0;
180
181 // Erase if the multiplicand was assigned a constant value.
182 const Expr *rhs = AssignEx->getRHS();
183 if (rhs->isEvaluatable(Context))
184 assignKnown = true;
185
186 // Discard the report if the multiplicand was assigned a value,
187 // that can never overflow after multiplication. e.g., the assignment
188 // is a division operator and the denominator is > other multiplicand.
189 const Expr *rhse = rhs->IgnoreParenImpCasts();
190 if (const BinaryOperator *BOp = dyn_cast<BinaryOperator>(rhse)) {
191 if (BOp->getOpcode() == BO_Div) {
192 const Expr *denom = BOp->getRHS()->IgnoreParenImpCasts();
Fangrui Song407659a2018-11-30 23:41:18 +0000193 Expr::EvalResult Result;
194 if (denom->EvaluateAsInt(Result, Context)) {
195 denomVal = Result.Val.getInt();
Devin Coughlin683dfd32015-09-23 23:27:55 +0000196 denomKnown = true;
Fangrui Song407659a2018-11-30 23:41:18 +0000197 }
Devin Coughlin683dfd32015-09-23 23:27:55 +0000198 const Expr *numerator = BOp->getLHS()->IgnoreParenImpCasts();
199 if (numerator->isEvaluatable(Context))
200 numeratorKnown = true;
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000201 }
202 }
Devin Coughlin683dfd32015-09-23 23:27:55 +0000203 if (!assignKnown && !denomKnown)
204 return;
205 auto denomExtVal = denomVal.getExtValue();
206
207 // Ignore negative denominator.
208 if (denomExtVal < 0)
209 return;
210
211 const Expr *lhs = AssignEx->getLHS();
212 const Expr *E = lhs->IgnoreParenImpCasts();
213
214 auto pred = [assignKnown, numeratorKnown,
Benjamin Kramer951a6282016-07-09 11:16:56 +0000215 denomExtVal](const MallocOverflowCheck &Check) {
Devin Coughlin683dfd32015-09-23 23:27:55 +0000216 return assignKnown ||
Benjamin Kramer951a6282016-07-09 11:16:56 +0000217 (numeratorKnown && (denomExtVal >= Check.maxVal.getExtValue()));
Devin Coughlin683dfd32015-09-23 23:27:55 +0000218 };
219
220 if (const DeclRefExpr *DR = dyn_cast<DeclRefExpr>(E))
221 Erase<DeclRefExpr>(DR, pred);
222 else if (const auto *ME = dyn_cast<MemberExpr>(E))
223 Erase<MemberExpr>(ME, pred);
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000224 }
225
226 public:
227 void VisitBinaryOperator(BinaryOperator *E) {
228 if (E->isComparisonOp()) {
229 const Expr * lhs = E->getLHS();
230 const Expr * rhs = E->getRHS();
231 // Ignore comparisons against zero, since they generally don't
232 // protect against an overflow.
Devin Coughlin683dfd32015-09-23 23:27:55 +0000233 if (!isIntZeroExpr(lhs) && !isIntZeroExpr(rhs)) {
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000234 CheckExpr(lhs);
235 CheckExpr(rhs);
236 }
237 }
Devin Coughlin683dfd32015-09-23 23:27:55 +0000238 if (E->isAssignmentOp())
239 CheckAssignmentExpr(E);
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000240 EvaluatedExprVisitor<CheckOverflowOps>::VisitBinaryOperator(E);
241 }
242
243 /* We specifically ignore loop conditions, because they're typically
244 not error checks. */
245 void VisitWhileStmt(WhileStmt *S) {
246 return this->Visit(S->getBody());
247 }
248 void VisitForStmt(ForStmt *S) {
249 return this->Visit(S->getBody());
250 }
251 void VisitDoStmt(DoStmt *S) {
252 return this->Visit(S->getBody());
253 }
254
255 CheckOverflowOps(theVecType &v, ASTContext &ctx)
256 : EvaluatedExprVisitor<CheckOverflowOps>(ctx),
257 toScanFor(v), Context(ctx)
258 { }
259 };
Alexander Kornienkoab9db512015-06-22 23:07:51 +0000260}
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000261
262// OutputPossibleOverflows - We've found a possible overflow earlier,
263// now check whether Body might contain a comparison which might be
264// preventing the overflow.
265// This doesn't do flow analysis, range analysis, or points-to analysis; it's
266// just a dumb "is there a comparison" scan. The aim here is to
267// detect the most blatent cases of overflow and educate the
268// programmer.
269void MallocOverflowSecurityChecker::OutputPossibleOverflows(
Dmitri Gribenkof8579502013-01-12 19:30:44 +0000270 SmallVectorImpl<MallocOverflowCheck> &PossibleMallocOverflows,
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000271 const Decl *D, BugReporter &BR, AnalysisManager &mgr) const {
272 // By far the most common case: nothing to check.
273 if (PossibleMallocOverflows.empty())
274 return;
275
276 // Delete any possible overflows which have a comparison.
277 CheckOverflowOps c(PossibleMallocOverflows, BR.getContext());
Ted Kremenek81ce1c82011-10-24 01:32:45 +0000278 c.Visit(mgr.getAnalysisDeclContext(D)->getBody());
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000279
280 // Output warnings for all overflows that are left.
281 for (CheckOverflowOps::theVecType::iterator
282 i = PossibleMallocOverflows.begin(),
283 e = PossibleMallocOverflows.end();
284 i != e;
285 ++i) {
Alexander Kornienko4aca9b12014-02-11 21:49:21 +0000286 BR.EmitBasicReport(
287 D, this, "malloc() size overflow", categories::UnixAPI,
288 "the computation of the size of the memory allocation may overflow",
289 PathDiagnosticLocation::createOperatorLoc(i->mulop,
290 BR.getSourceManager()),
291 i->mulop->getSourceRange());
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000292 }
293}
294
295void MallocOverflowSecurityChecker::checkASTCodeBody(const Decl *D,
296 AnalysisManager &mgr,
297 BugReporter &BR) const {
298
299 CFG *cfg = mgr.getCFG(D);
300 if (!cfg)
301 return;
302
303 // A list of variables referenced in possibly overflowing malloc operands.
Dmitri Gribenkof8579502013-01-12 19:30:44 +0000304 SmallVector<MallocOverflowCheck, 2> PossibleMallocOverflows;
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000305
306 for (CFG::iterator it = cfg->begin(), ei = cfg->end(); it != ei; ++it) {
307 CFGBlock *block = *it;
308 for (CFGBlock::iterator bi = block->begin(), be = block->end();
309 bi != be; ++bi) {
David Blaikie00be69a2013-02-23 00:29:34 +0000310 if (Optional<CFGStmt> CS = bi->getAs<CFGStmt>()) {
311 if (const CallExpr *TheCall = dyn_cast<CallExpr>(CS->getStmt())) {
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000312 // Get the callee.
313 const FunctionDecl *FD = TheCall->getDirectCallee();
314
315 if (!FD)
Devin Coughlin683dfd32015-09-23 23:27:55 +0000316 continue;
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000317
318 // Get the name of the callee. If it's a builtin, strip off the prefix.
319 IdentifierInfo *FnInfo = FD->getIdentifier();
Anna Zaks0070c6d2011-09-27 22:25:01 +0000320 if (!FnInfo)
Devin Coughlin683dfd32015-09-23 23:27:55 +0000321 continue;
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000322
323 if (FnInfo->isStr ("malloc") || FnInfo->isStr ("_MALLOC")) {
324 if (TheCall->getNumArgs() == 1)
325 CheckMallocArgument(PossibleMallocOverflows, TheCall->getArg(0),
326 mgr.getASTContext());
327 }
328 }
329 }
330 }
331 }
332
333 OutputPossibleOverflows(PossibleMallocOverflows, D, BR, mgr);
334}
335
Kristof Umann058a7a42019-01-26 14:23:08 +0000336void ento::registerMallocOverflowSecurityChecker(CheckerManager &mgr) {
Ted Kremenek1c2fb272011-08-03 20:17:43 +0000337 mgr.registerChecker<MallocOverflowSecurityChecker>();
338}
Kristof Umann058a7a42019-01-26 14:23:08 +0000339
340bool ento::shouldRegisterMallocOverflowSecurityChecker(const LangOptions &LO) {
341 return true;
342}