clang 20.0.0git
UnsafeBufferUsage.cpp
Go to the documentation of this file.
1//===- UnsafeBufferUsage.cpp - Replace pointers with modern C++ -----------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
11#include "clang/AST/Decl.h"
13#include "clang/AST/Expr.h"
15#include "clang/AST/Stmt.h"
17#include "clang/AST/Type.h"
21#include "clang/Lex/Lexer.h"
23#include "llvm/ADT/APSInt.h"
24#include "llvm/ADT/SmallVector.h"
25#include "llvm/ADT/StringRef.h"
26#include "llvm/Support/Casting.h"
27#include <memory>
28#include <optional>
29#include <queue>
30#include <sstream>
31
32using namespace llvm;
33using namespace clang;
34using namespace ast_matchers;
35
36#ifndef NDEBUG
37namespace {
38class StmtDebugPrinter
39 : public ConstStmtVisitor<StmtDebugPrinter, std::string> {
40public:
41 std::string VisitStmt(const Stmt *S) { return S->getStmtClassName(); }
42
43 std::string VisitBinaryOperator(const BinaryOperator *BO) {
44 return "BinaryOperator(" + BO->getOpcodeStr().str() + ")";
45 }
46
47 std::string VisitUnaryOperator(const UnaryOperator *UO) {
48 return "UnaryOperator(" + UO->getOpcodeStr(UO->getOpcode()).str() + ")";
49 }
50
51 std::string VisitImplicitCastExpr(const ImplicitCastExpr *ICE) {
52 return "ImplicitCastExpr(" + std::string(ICE->getCastKindName()) + ")";
53 }
54};
55
56// Returns a string of ancestor `Stmt`s of the given `DRE` in such a form:
57// "DRE ==> parent-of-DRE ==> grandparent-of-DRE ==> ...".
58static std::string getDREAncestorString(const DeclRefExpr *DRE,
59 ASTContext &Ctx) {
60 std::stringstream SS;
61 const Stmt *St = DRE;
62 StmtDebugPrinter StmtPriner;
63
64 do {
65 SS << StmtPriner.Visit(St);
66
67 DynTypedNodeList StParents = Ctx.getParents(*St);
68
69 if (StParents.size() > 1)
70 return "unavailable due to multiple parents";
71 if (StParents.size() == 0)
72 break;
73 St = StParents.begin()->get<Stmt>();
74 if (St)
75 SS << " ==> ";
76 } while (St);
77 return SS.str();
78}
79} // namespace
80#endif /* NDEBUG */
81
82namespace clang::ast_matchers {
83// A `RecursiveASTVisitor` that traverses all descendants of a given node "n"
84// except for those belonging to a different callable of "n".
86public:
87 // Creates an AST visitor that matches `Matcher` on all
88 // descendants of a given node "n" except for the ones
89 // belonging to a different callable of "n".
90 MatchDescendantVisitor(const internal::DynTypedMatcher *Matcher,
91 internal::ASTMatchFinder *Finder,
92 internal::BoundNodesTreeBuilder *Builder,
93 internal::ASTMatchFinder::BindKind Bind,
94 const bool ignoreUnevaluatedContext)
95 : Matcher(Matcher), Finder(Finder), Builder(Builder), Bind(Bind),
96 Matches(false), ignoreUnevaluatedContext(ignoreUnevaluatedContext) {
98 ShouldVisitImplicitCode = false; // TODO: let's ignore implicit code for now
99 }
100
101 // Returns true if a match is found in a subtree of `DynNode`, which belongs
102 // to the same callable of `DynNode`.
103 bool findMatch(const DynTypedNode &DynNode) {
104 Matches = false;
105 if (const Stmt *StmtNode = DynNode.get<Stmt>()) {
106 TraverseStmt(const_cast<Stmt *>(StmtNode));
107 *Builder = ResultBindings;
108 return Matches;
109 }
110 return false;
111 }
112
113 // The following are overriding methods from the base visitor class.
114 // They are public only to allow CRTP to work. They are *not *part
115 // of the public API of this class.
116
117 // For the matchers so far used in safe buffers, we only need to match
118 // `Stmt`s. To override more as needed.
119
120 bool TraverseDecl(Decl *Node) override {
121 if (!Node)
122 return true;
123 if (!match(*Node))
124 return false;
125 // To skip callables:
126 if (isa<FunctionDecl, BlockDecl, ObjCMethodDecl>(Node))
127 return true;
128 // Traverse descendants
130 }
131
133 // These are unevaluated, except the result expression.
134 if (ignoreUnevaluatedContext)
135 return TraverseStmt(Node->getResultExpr());
136 return DynamicRecursiveASTVisitor::TraverseGenericSelectionExpr(Node);
137 }
138
139 bool
141 // Unevaluated context.
142 if (ignoreUnevaluatedContext)
143 return true;
144 return DynamicRecursiveASTVisitor::TraverseUnaryExprOrTypeTraitExpr(Node);
145 }
146
148 // Unevaluated context.
149 if (ignoreUnevaluatedContext)
150 return true;
151 return DynamicRecursiveASTVisitor::TraverseTypeOfExprTypeLoc(Node);
152 }
153
155 // Unevaluated context.
156 if (ignoreUnevaluatedContext)
157 return true;
158 return DynamicRecursiveASTVisitor::TraverseDecltypeTypeLoc(Node);
159 }
160
162 // Unevaluated context.
163 if (ignoreUnevaluatedContext)
164 return true;
165 return DynamicRecursiveASTVisitor::TraverseCXXNoexceptExpr(Node);
166 }
167
169 // Unevaluated context.
170 if (ignoreUnevaluatedContext)
171 return true;
172 return DynamicRecursiveASTVisitor::TraverseCXXTypeidExpr(Node);
173 }
174
176 if (!TraverseStmt(Node->getExpr()))
177 return false;
178 return DynamicRecursiveASTVisitor::TraverseCXXDefaultInitExpr(Node);
179 }
180
181 bool TraverseStmt(Stmt *Node) override {
182 if (!Node)
183 return true;
184 if (!match(*Node))
185 return false;
187 }
188
189private:
190 // Sets 'Matched' to true if 'Matcher' matches 'Node'
191 //
192 // Returns 'true' if traversal should continue after this function
193 // returns, i.e. if no match is found or 'Bind' is 'BK_All'.
194 template <typename T> bool match(const T &Node) {
195 internal::BoundNodesTreeBuilder RecursiveBuilder(*Builder);
196
197 if (Matcher->matches(DynTypedNode::create(Node), Finder,
198 &RecursiveBuilder)) {
199 ResultBindings.addMatch(RecursiveBuilder);
200 Matches = true;
201 if (Bind != internal::ASTMatchFinder::BK_All)
202 return false; // Abort as soon as a match is found.
203 }
204 return true;
205 }
206
207 const internal::DynTypedMatcher *const Matcher;
208 internal::ASTMatchFinder *const Finder;
209 internal::BoundNodesTreeBuilder *const Builder;
210 internal::BoundNodesTreeBuilder ResultBindings;
211 const internal::ASTMatchFinder::BindKind Bind;
212 bool Matches;
213 bool ignoreUnevaluatedContext;
214};
215
216// Because we're dealing with raw pointers, let's define what we mean by that.
217static auto hasPointerType() {
218 return hasType(hasCanonicalType(pointerType()));
219}
220
221static auto hasArrayType() { return hasType(hasCanonicalType(arrayType())); }
222
223AST_MATCHER_P(Stmt, forEachDescendantEvaluatedStmt, internal::Matcher<Stmt>,
224 innerMatcher) {
225 const DynTypedMatcher &DTM = static_cast<DynTypedMatcher>(innerMatcher);
226
227 MatchDescendantVisitor Visitor(&DTM, Finder, Builder, ASTMatchFinder::BK_All,
228 true);
229 return Visitor.findMatch(DynTypedNode::create(Node));
230}
231
232AST_MATCHER_P(Stmt, forEachDescendantStmt, internal::Matcher<Stmt>,
233 innerMatcher) {
234 const DynTypedMatcher &DTM = static_cast<DynTypedMatcher>(innerMatcher);
235
236 MatchDescendantVisitor Visitor(&DTM, Finder, Builder, ASTMatchFinder::BK_All,
237 false);
238 return Visitor.findMatch(DynTypedNode::create(Node));
239}
240
241// Matches a `Stmt` node iff the node is in a safe-buffer opt-out region
242AST_MATCHER_P(Stmt, notInSafeBufferOptOut, const UnsafeBufferUsageHandler *,
243 Handler) {
244 return !Handler->isSafeBufferOptOut(Node.getBeginLoc());
245}
246
247AST_MATCHER_P(Stmt, ignoreUnsafeBufferInContainer,
248 const UnsafeBufferUsageHandler *, Handler) {
249 return Handler->ignoreUnsafeBufferInContainer(Node.getBeginLoc());
250}
251
252AST_MATCHER_P(Stmt, ignoreUnsafeLibcCall, const UnsafeBufferUsageHandler *,
253 Handler) {
254 if (Finder->getASTContext().getLangOpts().CPlusPlus)
255 return Handler->ignoreUnsafeBufferInLibcCall(Node.getBeginLoc());
256 return true; /* Only warn about libc calls for C++ */
257}
258
259AST_MATCHER_P(CastExpr, castSubExpr, internal::Matcher<Expr>, innerMatcher) {
260 return innerMatcher.matches(*Node.getSubExpr(), Finder, Builder);
261}
262
263// Matches a `UnaryOperator` whose operator is pre-increment:
265 return Node.getOpcode() == UnaryOperator::Opcode::UO_PreInc;
266}
267
268// Returns a matcher that matches any expression 'e' such that `innerMatcher`
269// matches 'e' and 'e' is in an Unspecified Lvalue Context.
270static auto isInUnspecifiedLvalueContext(internal::Matcher<Expr> innerMatcher) {
271 // clang-format off
272 return
273 expr(anyOf(
275 hasCastKind(CastKind::CK_LValueToRValue),
276 castSubExpr(innerMatcher)),
279 hasLHS(innerMatcher)
280 )
281 ));
282 // clang-format on
283}
284
285// Returns a matcher that matches any expression `e` such that `InnerMatcher`
286// matches `e` and `e` is in an Unspecified Pointer Context (UPC).
287static internal::Matcher<Stmt>
288isInUnspecifiedPointerContext(internal::Matcher<Stmt> InnerMatcher) {
289 // A UPC can be
290 // 1. an argument of a function call (except the callee has [[unsafe_...]]
291 // attribute), or
292 // 2. the operand of a pointer-to-(integer or bool) cast operation; or
293 // 3. the operand of a comparator operation; or
294 // 4. the operand of a pointer subtraction operation
295 // (i.e., computing the distance between two pointers); or ...
296
297 // clang-format off
298 auto CallArgMatcher = callExpr(
299 forEachArgumentWithParamType(
300 InnerMatcher,
301 isAnyPointer() /* array also decays to pointer type*/),
302 unless(callee(
303 functionDecl(hasAttr(attr::UnsafeBufferUsage)))));
304
305 auto CastOperandMatcher =
306 castExpr(anyOf(hasCastKind(CastKind::CK_PointerToIntegral),
307 hasCastKind(CastKind::CK_PointerToBoolean)),
308 castSubExpr(allOf(hasPointerType(), InnerMatcher)));
309
310 auto CompOperandMatcher =
311 binaryOperator(hasAnyOperatorName("!=", "==", "<", "<=", ">", ">="),
312 eachOf(hasLHS(allOf(hasPointerType(), InnerMatcher)),
313 hasRHS(allOf(hasPointerType(), InnerMatcher))));
314
315 // A matcher that matches pointer subtractions:
316 auto PtrSubtractionMatcher =
317 binaryOperator(hasOperatorName("-"),
318 // Note that here we need both LHS and RHS to be
319 // pointer. Then the inner matcher can match any of
320 // them:
321 allOf(hasLHS(hasPointerType()),
322 hasRHS(hasPointerType())),
323 eachOf(hasLHS(InnerMatcher),
324 hasRHS(InnerMatcher)));
325 // clang-format on
326
327 return stmt(anyOf(CallArgMatcher, CastOperandMatcher, CompOperandMatcher,
328 PtrSubtractionMatcher));
329 // FIXME: any more cases? (UPC excludes the RHS of an assignment. For now we
330 // don't have to check that.)
331}
332
333// Returns a matcher that matches any expression 'e' such that `innerMatcher`
334// matches 'e' and 'e' is in an unspecified untyped context (i.e the expression
335// 'e' isn't evaluated to an RValue). For example, consider the following code:
336// int *p = new int[4];
337// int *q = new int[4];
338// if ((p = q)) {}
339// p = q;
340// The expression `p = q` in the conditional of the `if` statement
341// `if ((p = q))` is evaluated as an RValue, whereas the expression `p = q;`
342// in the assignment statement is in an untyped context.
343static internal::Matcher<Stmt>
344isInUnspecifiedUntypedContext(internal::Matcher<Stmt> InnerMatcher) {
345 // An unspecified context can be
346 // 1. A compound statement,
347 // 2. The body of an if statement
348 // 3. Body of a loop
349 auto CompStmt = compoundStmt(forEach(InnerMatcher));
350 auto IfStmtThen = ifStmt(hasThen(InnerMatcher));
351 auto IfStmtElse = ifStmt(hasElse(InnerMatcher));
352 // FIXME: Handle loop bodies.
353 return stmt(anyOf(CompStmt, IfStmtThen, IfStmtElse));
354}
355
356// Given a two-param std::span construct call, matches iff the call has the
357// following forms:
358// 1. `std::span<T>{new T[n], n}`, where `n` is a literal or a DRE
359// 2. `std::span<T>{new T, 1}`
360// 3. `std::span<T>{&var, 1}`
361// 4. `std::span<T>{a, n}`, where `a` is of an array-of-T with constant size
362// `n`
363// 5. `std::span<T>{any, 0}`
364// 6. `std::span<T>{std::addressof(...), 1}`
365AST_MATCHER(CXXConstructExpr, isSafeSpanTwoParamConstruct) {
366 assert(Node.getNumArgs() == 2 &&
367 "expecting a two-parameter std::span constructor");
368 const Expr *Arg0 = Node.getArg(0)->IgnoreImplicit();
369 const Expr *Arg1 = Node.getArg(1)->IgnoreImplicit();
370 auto HaveEqualConstantValues = [&Finder](const Expr *E0, const Expr *E1) {
371 if (auto E0CV = E0->getIntegerConstantExpr(Finder->getASTContext()))
372 if (auto E1CV = E1->getIntegerConstantExpr(Finder->getASTContext())) {
373 return APSInt::compareValues(*E0CV, *E1CV) == 0;
374 }
375 return false;
376 };
377 auto AreSameDRE = [](const Expr *E0, const Expr *E1) {
378 if (auto *DRE0 = dyn_cast<DeclRefExpr>(E0))
379 if (auto *DRE1 = dyn_cast<DeclRefExpr>(E1)) {
380 return DRE0->getDecl() == DRE1->getDecl();
381 }
382 return false;
383 };
384 std::optional<APSInt> Arg1CV =
385 Arg1->getIntegerConstantExpr(Finder->getASTContext());
386
387 if (Arg1CV && Arg1CV->isZero())
388 // Check form 5:
389 return true;
390 switch (Arg0->IgnoreImplicit()->getStmtClass()) {
391 case Stmt::CXXNewExprClass:
392 if (auto Size = cast<CXXNewExpr>(Arg0)->getArraySize()) {
393 // Check form 1:
394 return AreSameDRE((*Size)->IgnoreImplicit(), Arg1) ||
395 HaveEqualConstantValues(*Size, Arg1);
396 }
397 // TODO: what's placeholder type? avoid it for now.
398 if (!cast<CXXNewExpr>(Arg0)->hasPlaceholderType()) {
399 // Check form 2:
400 return Arg1CV && Arg1CV->isOne();
401 }
402 break;
403 case Stmt::UnaryOperatorClass:
404 if (cast<UnaryOperator>(Arg0)->getOpcode() ==
405 UnaryOperator::Opcode::UO_AddrOf)
406 // Check form 3:
407 return Arg1CV && Arg1CV->isOne();
408 break;
409 case Stmt::CallExprClass:
410 if (const auto *CE = dyn_cast<CallExpr>(Arg0)) {
411 const auto FnDecl = CE->getDirectCallee();
412 if (FnDecl && FnDecl->getNameAsString() == "addressof" &&
413 FnDecl->isInStdNamespace()) {
414 return Arg1CV && Arg1CV->isOne();
415 }
416 }
417 break;
418 default:
419 break;
420 }
421
422 QualType Arg0Ty = Arg0->IgnoreImplicit()->getType();
423
424 if (auto *ConstArrTy =
425 Finder->getASTContext().getAsConstantArrayType(Arg0Ty)) {
426 const APSInt ConstArrSize = APSInt(ConstArrTy->getSize());
427
428 // Check form 4:
429 return Arg1CV && APSInt::compareValues(ConstArrSize, *Arg1CV) == 0;
430 }
431 return false;
432}
433
434AST_MATCHER(ArraySubscriptExpr, isSafeArraySubscript) {
435 // FIXME: Proper solution:
436 // - refactor Sema::CheckArrayAccess
437 // - split safe/OOB/unknown decision logic from diagnostics emitting code
438 // - e. g. "Try harder to find a NamedDecl to point at in the note."
439 // already duplicated
440 // - call both from Sema and from here
441
442 uint64_t limit;
443 if (const auto *CATy =
444 dyn_cast<ConstantArrayType>(Node.getBase()
445 ->IgnoreParenImpCasts()
446 ->getType()
447 ->getUnqualifiedDesugaredType())) {
448 limit = CATy->getLimitedSize();
449 } else if (const auto *SLiteral = dyn_cast<StringLiteral>(
450 Node.getBase()->IgnoreParenImpCasts())) {
451 limit = SLiteral->getLength() + 1;
452 } else {
453 return false;
454 }
455
456 Expr::EvalResult EVResult;
457 if (Node.getIdx()->EvaluateAsInt(EVResult, Finder->getASTContext())) {
458 llvm::APSInt ArrIdx = EVResult.Val.getInt();
459 // FIXME: ArrIdx.isNegative() we could immediately emit an error as that's a
460 // bug
461 if (ArrIdx.isNonNegative() && ArrIdx.getLimitedValue() < limit)
462 return true;
463 }
464 return false;
465}
466
467AST_MATCHER_P(CallExpr, hasNumArgs, unsigned, Num) {
468 return Node.getNumArgs() == Num;
469}
470
471namespace libc_func_matchers {
472// Under `libc_func_matchers`, define a set of matchers that match unsafe
473// functions in libc and unsafe calls to them.
474
475// A tiny parser to strip off common prefix and suffix of libc function names
476// in real code.
477//
478// Given a function name, `matchName` returns `CoreName` according to the
479// following grammar:
480//
481// LibcName := CoreName | CoreName + "_s"
482// MatchingName := "__builtin_" + LibcName |
483// "__builtin___" + LibcName + "_chk" |
484// "__asan_" + LibcName
485//
487 StringRef matchName(StringRef FunName, bool isBuiltin) {
488 // Try to match __builtin_:
489 if (isBuiltin && FunName.starts_with("__builtin_"))
490 // Then either it is __builtin_LibcName or __builtin___LibcName_chk or
491 // no match:
493 FunName.drop_front(10 /* truncate "__builtin_" */));
494 // Try to match __asan_:
495 if (FunName.starts_with("__asan_"))
496 return matchLibcName(FunName.drop_front(7 /* truncate of "__asan_" */));
497 return matchLibcName(FunName);
498 }
499
500 // Parameter `Name` is the substring after stripping off the prefix
501 // "__builtin_".
502 StringRef matchLibcNameOrBuiltinChk(StringRef Name) {
503 if (Name.starts_with("__") && Name.ends_with("_chk"))
504 return matchLibcName(
505 Name.drop_front(2).drop_back(4) /* truncate "__" and "_chk" */);
506 return matchLibcName(Name);
507 }
508
509 StringRef matchLibcName(StringRef Name) {
510 if (Name.ends_with("_s"))
511 return Name.drop_back(2 /* truncate "_s" */);
512 return Name;
513 }
514};
515
516// A pointer type expression is known to be null-terminated, if it has the
517// form: E.c_str(), for any expression E of `std::string` type.
518static bool isNullTermPointer(const Expr *Ptr) {
519 if (isa<StringLiteral>(Ptr->IgnoreParenImpCasts()))
520 return true;
521 if (isa<PredefinedExpr>(Ptr->IgnoreParenImpCasts()))
522 return true;
523 if (auto *MCE = dyn_cast<CXXMemberCallExpr>(Ptr->IgnoreParenImpCasts())) {
524 const CXXMethodDecl *MD = MCE->getMethodDecl();
525 const CXXRecordDecl *RD = MCE->getRecordDecl()->getCanonicalDecl();
526
527 if (MD && RD && RD->isInStdNamespace())
528 if (MD->getName() == "c_str" && RD->getName() == "basic_string")
529 return true;
530 }
531 return false;
532}
533
534// Return true iff at least one of following cases holds:
535// 1. Format string is a literal and there is an unsafe pointer argument
536// corresponding to an `s` specifier;
537// 2. Format string is not a literal and there is least an unsafe pointer
538// argument (including the formatter argument).
539//
540// `UnsafeArg` is the output argument that will be set only if this function
541// returns true.
542static bool hasUnsafeFormatOrSArg(const CallExpr *Call, const Expr *&UnsafeArg,
543 const unsigned FmtArgIdx, ASTContext &Ctx,
544 bool isKprintf = false) {
545 class StringFormatStringHandler
547 const CallExpr *Call;
548 unsigned FmtArgIdx;
549 const Expr *&UnsafeArg;
550
551 public:
552 StringFormatStringHandler(const CallExpr *Call, unsigned FmtArgIdx,
553 const Expr *&UnsafeArg)
554 : Call(Call), FmtArgIdx(FmtArgIdx), UnsafeArg(UnsafeArg) {}
555
556 bool HandlePrintfSpecifier(const analyze_printf::PrintfSpecifier &FS,
557 const char *startSpecifier,
558 unsigned specifierLen,
559 const TargetInfo &Target) override {
560 if (FS.getConversionSpecifier().getKind() ==
561 analyze_printf::PrintfConversionSpecifier::sArg) {
562 unsigned ArgIdx = FS.getPositionalArgIndex() + FmtArgIdx;
563
564 if (0 < ArgIdx && ArgIdx < Call->getNumArgs())
565 if (!isNullTermPointer(Call->getArg(ArgIdx))) {
566 UnsafeArg = Call->getArg(ArgIdx); // output
567 // returning false stops parsing immediately
568 return false;
569 }
570 }
571 return true; // continue parsing
572 }
573 };
574
575 const Expr *Fmt = Call->getArg(FmtArgIdx);
576
577 if (auto *SL = dyn_cast<StringLiteral>(Fmt->IgnoreParenImpCasts())) {
578 StringRef FmtStr;
579
580 if (SL->getCharByteWidth() == 1)
581 FmtStr = SL->getString();
582 else if (auto EvaledFmtStr = SL->tryEvaluateString(Ctx))
583 FmtStr = *EvaledFmtStr;
584 else
585 goto CHECK_UNSAFE_PTR;
586
587 StringFormatStringHandler Handler(Call, FmtArgIdx, UnsafeArg);
588
590 Handler, FmtStr.begin(), FmtStr.end(), Ctx.getLangOpts(),
591 Ctx.getTargetInfo(), isKprintf);
592 }
593CHECK_UNSAFE_PTR:
594 // If format is not a string literal, we cannot analyze the format string.
595 // In this case, this call is considered unsafe if at least one argument
596 // (including the format argument) is unsafe pointer.
597 return llvm::any_of(
598 llvm::make_range(Call->arg_begin() + FmtArgIdx, Call->arg_end()),
599 [&UnsafeArg](const Expr *Arg) -> bool {
600 if (Arg->getType()->isPointerType() && !isNullTermPointer(Arg)) {
601 UnsafeArg = Arg;
602 return true;
603 }
604 return false;
605 });
606}
607
608// Matches a FunctionDecl node such that
609// 1. It's name, after stripping off predefined prefix and suffix, is
610// `CoreName`; and
611// 2. `CoreName` or `CoreName[str/wcs]` is one of the `PredefinedNames`, which
612// is a set of libc function names.
613//
614// Note: For predefined prefix and suffix, see `LibcFunNamePrefixSuffixParser`.
615// The notation `CoreName[str/wcs]` means a new name obtained from replace
616// string "wcs" with "str" in `CoreName`.
617AST_MATCHER(FunctionDecl, isPredefinedUnsafeLibcFunc) {
618 static std::unique_ptr<std::set<StringRef>> PredefinedNames = nullptr;
619 if (!PredefinedNames)
620 PredefinedNames =
621 std::make_unique<std::set<StringRef>, std::set<StringRef>>({
622 // numeric conversion:
623 "atof",
624 "atoi",
625 "atol",
626 "atoll",
627 "strtol",
628 "strtoll",
629 "strtoul",
630 "strtoull",
631 "strtof",
632 "strtod",
633 "strtold",
634 "strtoimax",
635 "strtoumax",
636 // "strfromf", "strfromd", "strfroml", // C23?
637 // string manipulation:
638 "strcpy",
639 "strncpy",
640 "strlcpy",
641 "strcat",
642 "strncat",
643 "strlcat",
644 "strxfrm",
645 "strdup",
646 "strndup",
647 // string examination:
648 "strlen",
649 "strnlen",
650 "strcmp",
651 "strncmp",
652 "stricmp",
653 "strcasecmp",
654 "strcoll",
655 "strchr",
656 "strrchr",
657 "strspn",
658 "strcspn",
659 "strpbrk",
660 "strstr",
661 "strtok",
662 // "mem-" functions
663 "memchr",
664 "wmemchr",
665 "memcmp",
666 "wmemcmp",
667 "memcpy",
668 "memccpy",
669 "mempcpy",
670 "wmemcpy",
671 "memmove",
672 "wmemmove",
673 "memset",
674 "wmemset",
675 // IO:
676 "fread",
677 "fwrite",
678 "fgets",
679 "fgetws",
680 "gets",
681 "fputs",
682 "fputws",
683 "puts",
684 // others
685 "strerror_s",
686 "strerror_r",
687 "bcopy",
688 "bzero",
689 "bsearch",
690 "qsort",
691 });
692
693 auto *II = Node.getIdentifier();
694
695 if (!II)
696 return false;
697
698 StringRef Name = LibcFunNamePrefixSuffixParser().matchName(
699 II->getName(), Node.getBuiltinID());
700
701 // Match predefined names:
702 if (PredefinedNames->find(Name) != PredefinedNames->end())
703 return true;
704
705 std::string NameWCS = Name.str();
706 size_t WcsPos = NameWCS.find("wcs");
707
708 while (WcsPos != std::string::npos) {
709 NameWCS[WcsPos++] = 's';
710 NameWCS[WcsPos++] = 't';
711 NameWCS[WcsPos++] = 'r';
712 WcsPos = NameWCS.find("wcs", WcsPos);
713 }
714 if (PredefinedNames->find(NameWCS) != PredefinedNames->end())
715 return true;
716 // All `scanf` functions are unsafe (including `sscanf`, `vsscanf`, etc.. They
717 // all should end with "scanf"):
718 return Name.ends_with("scanf");
719}
720
721// Match a call to one of the `v*printf` functions taking `va_list`. We cannot
722// check safety for these functions so they should be changed to their
723// non-va_list versions.
724AST_MATCHER(FunctionDecl, isUnsafeVaListPrintfFunc) {
725 auto *II = Node.getIdentifier();
726
727 if (!II)
728 return false;
729
730 StringRef Name = LibcFunNamePrefixSuffixParser().matchName(
731 II->getName(), Node.getBuiltinID());
732
733 if (!Name.ends_with("printf"))
734 return false; // neither printf nor scanf
735 return Name.starts_with("v");
736}
737
738// Matches a call to one of the `sprintf` functions as they are always unsafe
739// and should be changed to `snprintf`.
740AST_MATCHER(FunctionDecl, isUnsafeSprintfFunc) {
741 auto *II = Node.getIdentifier();
742
743 if (!II)
744 return false;
745
746 StringRef Name = LibcFunNamePrefixSuffixParser().matchName(
747 II->getName(), Node.getBuiltinID());
748
749 if (!Name.ends_with("printf") ||
750 // Let `isUnsafeVaListPrintfFunc` check for cases with va-list:
751 Name.starts_with("v"))
752 return false;
753
754 StringRef Prefix = Name.drop_back(6);
755
756 if (Prefix.ends_with("w"))
757 Prefix = Prefix.drop_back(1);
758 return Prefix == "s";
759}
760
761// Match function declarations of `printf`, `fprintf`, `snprintf` and their wide
762// character versions. Calls to these functions can be safe if their arguments
763// are carefully made safe.
764AST_MATCHER(FunctionDecl, isNormalPrintfFunc) {
765 auto *II = Node.getIdentifier();
766
767 if (!II)
768 return false;
769
770 StringRef Name = LibcFunNamePrefixSuffixParser().matchName(
771 II->getName(), Node.getBuiltinID());
772
773 if (!Name.ends_with("printf") || Name.starts_with("v"))
774 return false;
775
776 StringRef Prefix = Name.drop_back(6);
777
778 if (Prefix.ends_with("w"))
779 Prefix = Prefix.drop_back(1);
780
781 return Prefix.empty() || Prefix == "k" || Prefix == "f" || Prefix == "sn";
782}
783
784// This matcher requires that it is known that the callee `isNormalPrintf`.
785// Then if the format string is a string literal, this matcher matches when at
786// least one string argument is unsafe. If the format is not a string literal,
787// this matcher matches when at least one pointer type argument is unsafe.
788AST_MATCHER_P(CallExpr, hasUnsafePrintfStringArg,
789 clang::ast_matchers::internal::Matcher<Expr>,
790 UnsafeStringArgMatcher) {
791 // Determine what printf it is by examining formal parameters:
792 const FunctionDecl *FD = Node.getDirectCallee();
793
794 assert(FD && "It should have been checked that FD is non-null.");
795
796 unsigned NumParms = FD->getNumParams();
797
798 if (NumParms < 1)
799 return false; // possibly some user-defined printf function
800
801 ASTContext &Ctx = Finder->getASTContext();
802 QualType FirstParmTy = FD->getParamDecl(0)->getType();
803
804 if (!FirstParmTy->isPointerType())
805 return false; // possibly some user-defined printf function
806
807 QualType FirstPteTy = FirstParmTy->castAs<PointerType>()->getPointeeType();
808
809 if (!Ctx.getFILEType()
810 .isNull() && //`FILE *` must be in the context if it is fprintf
811 FirstPteTy.getCanonicalType() == Ctx.getFILEType().getCanonicalType()) {
812 // It is a fprintf:
813 const Expr *UnsafeArg;
814
815 if (hasUnsafeFormatOrSArg(&Node, UnsafeArg, 1, Ctx, false))
816 return UnsafeStringArgMatcher.matches(*UnsafeArg, Finder, Builder);
817 return false;
818 }
819
820 if (FirstPteTy.isConstQualified()) {
821 // If the first parameter is a `const char *`, it is a printf/kprintf:
822 bool isKprintf = false;
823 const Expr *UnsafeArg;
824
825 if (auto *II = FD->getIdentifier())
826 isKprintf = II->getName() == "kprintf";
827 if (hasUnsafeFormatOrSArg(&Node, UnsafeArg, 0, Ctx, isKprintf))
828 return UnsafeStringArgMatcher.matches(*UnsafeArg, Finder, Builder);
829 return false;
830 }
831
832 if (NumParms > 2) {
833 QualType SecondParmTy = FD->getParamDecl(1)->getType();
834
835 if (!FirstPteTy.isConstQualified() && SecondParmTy->isIntegerType()) {
836 // If the first parameter type is non-const qualified `char *` and the
837 // second is an integer, it is a snprintf:
838 const Expr *UnsafeArg;
839
840 if (hasUnsafeFormatOrSArg(&Node, UnsafeArg, 2, Ctx, false))
841 return UnsafeStringArgMatcher.matches(*UnsafeArg, Finder, Builder);
842 return false;
843 }
844 }
845 // We don't really recognize this "normal" printf, the only thing we
846 // can do is to require all pointers to be null-terminated:
847 for (auto Arg : Node.arguments())
848 if (Arg->getType()->isPointerType() && !isNullTermPointer(Arg))
849 if (UnsafeStringArgMatcher.matches(*Arg, Finder, Builder))
850 return true;
851 return false;
852}
853
854// This matcher requires that it is known that the callee `isNormalPrintf`.
855// Then it matches if the first two arguments of the call is a pointer and an
856// integer and they are not in a safe pattern.
857//
858// For the first two arguments: `ptr` and `size`, they are safe if in the
859// following patterns:
860//
861// Pattern 1:
862// ptr := DRE.data();
863// size:= DRE.size()/DRE.size_bytes()
864// And DRE is a hardened container or view.
865//
866// Pattern 2:
867// ptr := Constant-Array-DRE;
868// size:= any expression that has compile-time constant value equivalent to
869// sizeof (Constant-Array-DRE)
870AST_MATCHER(CallExpr, hasUnsafeSnprintfBuffer) {
871 const FunctionDecl *FD = Node.getDirectCallee();
872
873 assert(FD && "It should have been checked that FD is non-null.");
874
875 if (FD->getNumParams() < 3)
876 return false; // Not an snprint
877
878 QualType FirstParmTy = FD->getParamDecl(0)->getType();
879
880 if (!FirstParmTy->isPointerType())
881 return false; // Not an snprint
882
883 QualType FirstPteTy = FirstParmTy->castAs<PointerType>()->getPointeeType();
884 const Expr *Buf = Node.getArg(0), *Size = Node.getArg(1);
885
886 if (FirstPteTy.isConstQualified() || !Buf->getType()->isPointerType() ||
887 !Size->getType()->isIntegerType())
888 return false; // not an snprintf call
889
890 // Pattern 1:
891 static StringRef SizedObjs[] = {"span", "array", "vector",
892 "basic_string_view", "basic_string"};
893 Buf = Buf->IgnoreParenImpCasts();
894 Size = Size->IgnoreParenImpCasts();
895 if (auto *MCEPtr = dyn_cast<CXXMemberCallExpr>(Buf))
896 if (auto *MCESize = dyn_cast<CXXMemberCallExpr>(Size)) {
897 auto *DREOfPtr = dyn_cast<DeclRefExpr>(
898 MCEPtr->getImplicitObjectArgument()->IgnoreParenImpCasts());
899 auto *DREOfSize = dyn_cast<DeclRefExpr>(
900 MCESize->getImplicitObjectArgument()->IgnoreParenImpCasts());
901
902 if (!DREOfPtr || !DREOfSize)
903 return true; // not in safe pattern
904 if (DREOfPtr->getDecl() != DREOfSize->getDecl())
905 return true; // not in safe pattern
906 if (MCEPtr->getMethodDecl()->getName() != "data")
907 return true; // not in safe pattern
908
909 if (MCESize->getMethodDecl()->getName() == "size_bytes" ||
910 // Note here the pointer must be a pointer-to-char type unless there
911 // is explicit casting. If there is explicit casting, this branch
912 // is unreachable. Thus, at this branch "size" and "size_bytes" are
913 // equivalent as the pointer is a char pointer:
914 MCESize->getMethodDecl()->getName() == "size")
915 for (StringRef SizedObj : SizedObjs)
916 if (MCEPtr->getRecordDecl()->isInStdNamespace() &&
917 MCEPtr->getRecordDecl()->getCanonicalDecl()->getName() ==
918 SizedObj)
919 return false; // It is in fact safe
920 }
921
922 // Pattern 2:
923 if (auto *DRE = dyn_cast<DeclRefExpr>(Buf->IgnoreParenImpCasts())) {
924 ASTContext &Ctx = Finder->getASTContext();
925
926 if (auto *CAT = Ctx.getAsConstantArrayType(DRE->getType())) {
928 // The array element type must be compatible with `char` otherwise an
929 // explicit cast will be needed, which will make this check unreachable.
930 // Therefore, the array extent is same as its' bytewise size.
931 if (Size->EvaluateAsConstantExpr(ER, Ctx)) {
932 APSInt EVal = ER.Val.getInt(); // Size must have integer type
933
934 return APSInt::compareValues(EVal, APSInt(CAT->getSize(), true)) != 0;
935 }
936 }
937 }
938 return true; // ptr and size are not in safe pattern
939}
940} // namespace libc_func_matchers
941} // namespace clang::ast_matchers
942
943namespace {
944// Because the analysis revolves around variables and their types, we'll need to
945// track uses of variables (aka DeclRefExprs).
946using DeclUseList = SmallVector<const DeclRefExpr *, 1>;
947
948// Convenience typedef.
949using FixItList = SmallVector<FixItHint, 4>;
950} // namespace
951
952namespace {
953/// Gadget is an individual operation in the code that may be of interest to
954/// this analysis. Each (non-abstract) subclass corresponds to a specific
955/// rigid AST structure that constitutes an operation on a pointer-type object.
956/// Discovery of a gadget in the code corresponds to claiming that we understand
957/// what this part of code is doing well enough to potentially improve it.
958/// Gadgets can be warning (immediately deserving a warning) or fixable (not
959/// always deserving a warning per se, but requires our attention to identify
960/// it warrants a fixit).
961class Gadget {
962public:
963 enum class Kind {
964#define GADGET(x) x,
965#include "clang/Analysis/Analyses/UnsafeBufferUsageGadgets.def"
966 };
967
968 /// Common type of ASTMatchers used for discovering gadgets.
969 /// Useful for implementing the static matcher() methods
970 /// that are expected from all non-abstract subclasses.
971 using Matcher = decltype(stmt());
972
973 Gadget(Kind K) : K(K) {}
974
975 Kind getKind() const { return K; }
976
977#ifndef NDEBUG
978 StringRef getDebugName() const {
979 switch (K) {
980#define GADGET(x) \
981 case Kind::x: \
982 return #x;
983#include "clang/Analysis/Analyses/UnsafeBufferUsageGadgets.def"
984 }
985 llvm_unreachable("Unhandled Gadget::Kind enum");
986 }
987#endif
988
989 virtual bool isWarningGadget() const = 0;
990 // TODO remove this method from WarningGadget interface. It's only used for
991 // debug prints in FixableGadget.
992 virtual SourceLocation getSourceLoc() const = 0;
993
994 /// Returns the list of pointer-type variables on which this gadget performs
995 /// its operation. Typically, there's only one variable. This isn't a list
996 /// of all DeclRefExprs in the gadget's AST!
997 virtual DeclUseList getClaimedVarUseSites() const = 0;
998
999 virtual ~Gadget() = default;
1000
1001private:
1002 Kind K;
1003};
1004
1005/// Warning gadgets correspond to unsafe code patterns that warrants
1006/// an immediate warning.
1007class WarningGadget : public Gadget {
1008public:
1009 WarningGadget(Kind K) : Gadget(K) {}
1010
1011 static bool classof(const Gadget *G) { return G->isWarningGadget(); }
1012 bool isWarningGadget() const final { return true; }
1013
1014 virtual void handleUnsafeOperation(UnsafeBufferUsageHandler &Handler,
1015 bool IsRelatedToDecl,
1016 ASTContext &Ctx) const = 0;
1017};
1018
1019/// Fixable gadgets correspond to code patterns that aren't always unsafe but
1020/// need to be properly recognized in order to emit fixes. For example, if a raw
1021/// pointer-type variable is replaced by a safe C++ container, every use of such
1022/// variable must be carefully considered and possibly updated.
1023class FixableGadget : public Gadget {
1024public:
1025 FixableGadget(Kind K) : Gadget(K) {}
1026
1027 static bool classof(const Gadget *G) { return !G->isWarningGadget(); }
1028 bool isWarningGadget() const final { return false; }
1029
1030 /// Returns a fixit that would fix the current gadget according to
1031 /// the current strategy. Returns std::nullopt if the fix cannot be produced;
1032 /// returns an empty list if no fixes are necessary.
1033 virtual std::optional<FixItList> getFixits(const FixitStrategy &) const {
1034 return std::nullopt;
1035 }
1036
1037 /// Returns a list of two elements where the first element is the LHS of a
1038 /// pointer assignment statement and the second element is the RHS. This
1039 /// two-element list represents the fact that the LHS buffer gets its bounds
1040 /// information from the RHS buffer. This information will be used later to
1041 /// group all those variables whose types must be modified together to prevent
1042 /// type mismatches.
1043 virtual std::optional<std::pair<const VarDecl *, const VarDecl *>>
1044 getStrategyImplications() const {
1045 return std::nullopt;
1046 }
1047};
1048
1049static auto toSupportedVariable() { return to(varDecl()); }
1050
1051using FixableGadgetList = std::vector<std::unique_ptr<FixableGadget>>;
1052using WarningGadgetList = std::vector<std::unique_ptr<WarningGadget>>;
1053
1054/// An increment of a pointer-type value is unsafe as it may run the pointer
1055/// out of bounds.
1056class IncrementGadget : public WarningGadget {
1057 static constexpr const char *const OpTag = "op";
1058 const UnaryOperator *Op;
1059
1060public:
1061 IncrementGadget(const MatchFinder::MatchResult &Result)
1062 : WarningGadget(Kind::Increment),
1063 Op(Result.Nodes.getNodeAs<UnaryOperator>(OpTag)) {}
1064
1065 static bool classof(const Gadget *G) {
1066 return G->getKind() == Kind::Increment;
1067 }
1068
1069 static Matcher matcher() {
1070 return stmt(
1071 unaryOperator(hasOperatorName("++"),
1072 hasUnaryOperand(ignoringParenImpCasts(hasPointerType())))
1073 .bind(OpTag));
1074 }
1075
1076 void handleUnsafeOperation(UnsafeBufferUsageHandler &Handler,
1077 bool IsRelatedToDecl,
1078 ASTContext &Ctx) const override {
1079 Handler.handleUnsafeOperation(Op, IsRelatedToDecl, Ctx);
1080 }
1081 SourceLocation getSourceLoc() const override { return Op->getBeginLoc(); }
1082
1083 DeclUseList getClaimedVarUseSites() const override {
1085 if (const auto *DRE =
1086 dyn_cast<DeclRefExpr>(Op->getSubExpr()->IgnoreParenImpCasts())) {
1087 Uses.push_back(DRE);
1088 }
1089
1090 return std::move(Uses);
1091 }
1092};
1093
1094/// A decrement of a pointer-type value is unsafe as it may run the pointer
1095/// out of bounds.
1096class DecrementGadget : public WarningGadget {
1097 static constexpr const char *const OpTag = "op";
1098 const UnaryOperator *Op;
1099
1100public:
1101 DecrementGadget(const MatchFinder::MatchResult &Result)
1102 : WarningGadget(Kind::Decrement),
1103 Op(Result.Nodes.getNodeAs<UnaryOperator>(OpTag)) {}
1104
1105 static bool classof(const Gadget *G) {
1106 return G->getKind() == Kind::Decrement;
1107 }
1108
1109 static Matcher matcher() {
1110 return stmt(
1111 unaryOperator(hasOperatorName("--"),
1112 hasUnaryOperand(ignoringParenImpCasts(hasPointerType())))
1113 .bind(OpTag));
1114 }
1115
1116 void handleUnsafeOperation(UnsafeBufferUsageHandler &Handler,
1117 bool IsRelatedToDecl,
1118 ASTContext &Ctx) const override {
1119 Handler.handleUnsafeOperation(Op, IsRelatedToDecl, Ctx);
1120 }
1121 SourceLocation getSourceLoc() const override { return Op->getBeginLoc(); }
1122
1123 DeclUseList getClaimedVarUseSites() const override {
1124 if (const auto *DRE =
1125 dyn_cast<DeclRefExpr>(Op->getSubExpr()->IgnoreParenImpCasts())) {
1126 return {DRE};
1127 }
1128
1129 return {};
1130 }
1131};
1132
1133/// Array subscript expressions on raw pointers as if they're arrays. Unsafe as
1134/// it doesn't have any bounds checks for the array.
1135class ArraySubscriptGadget : public WarningGadget {
1136 static constexpr const char *const ArraySubscrTag = "ArraySubscript";
1137 const ArraySubscriptExpr *ASE;
1138
1139public:
1140 ArraySubscriptGadget(const MatchFinder::MatchResult &Result)
1141 : WarningGadget(Kind::ArraySubscript),
1142 ASE(Result.Nodes.getNodeAs<ArraySubscriptExpr>(ArraySubscrTag)) {}
1143
1144 static bool classof(const Gadget *G) {
1145 return G->getKind() == Kind::ArraySubscript;
1146 }
1147
1148 static Matcher matcher() {
1149 // clang-format off
1150 return stmt(arraySubscriptExpr(
1151 hasBase(ignoringParenImpCasts(
1153 unless(anyOf(
1154 isSafeArraySubscript(),
1155 hasIndex(
1157 )
1158 ))).bind(ArraySubscrTag));
1159 // clang-format on
1160 }
1161
1162 void handleUnsafeOperation(UnsafeBufferUsageHandler &Handler,
1163 bool IsRelatedToDecl,
1164 ASTContext &Ctx) const override {
1165 Handler.handleUnsafeOperation(ASE, IsRelatedToDecl, Ctx);
1166 }
1167 SourceLocation getSourceLoc() const override { return ASE->getBeginLoc(); }
1168
1169 DeclUseList getClaimedVarUseSites() const override {
1170 if (const auto *DRE =
1171 dyn_cast<DeclRefExpr>(ASE->getBase()->IgnoreParenImpCasts())) {
1172 return {DRE};
1173 }
1174
1175 return {};
1176 }
1177};
1178
1179/// A pointer arithmetic expression of one of the forms:
1180/// \code
1181/// ptr + n | n + ptr | ptr - n | ptr += n | ptr -= n
1182/// \endcode
1183class PointerArithmeticGadget : public WarningGadget {
1184 static constexpr const char *const PointerArithmeticTag = "ptrAdd";
1185 static constexpr const char *const PointerArithmeticPointerTag = "ptrAddPtr";
1186 const BinaryOperator *PA; // pointer arithmetic expression
1187 const Expr *Ptr; // the pointer expression in `PA`
1188
1189public:
1190 PointerArithmeticGadget(const MatchFinder::MatchResult &Result)
1191 : WarningGadget(Kind::PointerArithmetic),
1192 PA(Result.Nodes.getNodeAs<BinaryOperator>(PointerArithmeticTag)),
1193 Ptr(Result.Nodes.getNodeAs<Expr>(PointerArithmeticPointerTag)) {}
1194
1195 static bool classof(const Gadget *G) {
1196 return G->getKind() == Kind::PointerArithmetic;
1197 }
1198
1199 static Matcher matcher() {
1200 auto HasIntegerType = anyOf(hasType(isInteger()), hasType(enumType()));
1201 auto PtrAtRight =
1202 allOf(hasOperatorName("+"),
1203 hasRHS(expr(hasPointerType()).bind(PointerArithmeticPointerTag)),
1204 hasLHS(HasIntegerType));
1205 auto PtrAtLeft =
1206 allOf(anyOf(hasOperatorName("+"), hasOperatorName("-"),
1207 hasOperatorName("+="), hasOperatorName("-=")),
1208 hasLHS(expr(hasPointerType()).bind(PointerArithmeticPointerTag)),
1209 hasRHS(HasIntegerType));
1210
1211 return stmt(binaryOperator(anyOf(PtrAtLeft, PtrAtRight))
1212 .bind(PointerArithmeticTag));
1213 }
1214
1215 void handleUnsafeOperation(UnsafeBufferUsageHandler &Handler,
1216 bool IsRelatedToDecl,
1217 ASTContext &Ctx) const override {
1218 Handler.handleUnsafeOperation(PA, IsRelatedToDecl, Ctx);
1219 }
1220 SourceLocation getSourceLoc() const override { return PA->getBeginLoc(); }
1221
1222 DeclUseList getClaimedVarUseSites() const override {
1223 if (const auto *DRE = dyn_cast<DeclRefExpr>(Ptr->IgnoreParenImpCasts())) {
1224 return {DRE};
1225 }
1226
1227 return {};
1228 }
1229 // FIXME: pointer adding zero should be fine
1230 // FIXME: this gadge will need a fix-it
1231};
1232
1233class SpanTwoParamConstructorGadget : public WarningGadget {
1234 static constexpr const char *const SpanTwoParamConstructorTag =
1235 "spanTwoParamConstructor";
1236 const CXXConstructExpr *Ctor; // the span constructor expression
1237
1238public:
1239 SpanTwoParamConstructorGadget(const MatchFinder::MatchResult &Result)
1240 : WarningGadget(Kind::SpanTwoParamConstructor),
1241 Ctor(Result.Nodes.getNodeAs<CXXConstructExpr>(
1242 SpanTwoParamConstructorTag)) {}
1243
1244 static bool classof(const Gadget *G) {
1245 return G->getKind() == Kind::SpanTwoParamConstructor;
1246 }
1247
1248 static Matcher matcher() {
1249 auto HasTwoParamSpanCtorDecl = hasDeclaration(
1250 cxxConstructorDecl(hasDeclContext(isInStdNamespace()), hasName("span"),
1251 parameterCountIs(2)));
1252
1253 return stmt(cxxConstructExpr(HasTwoParamSpanCtorDecl,
1254 unless(isSafeSpanTwoParamConstruct()))
1255 .bind(SpanTwoParamConstructorTag));
1256 }
1257
1258 static Matcher matcher(const UnsafeBufferUsageHandler *Handler) {
1259 return stmt(unless(ignoreUnsafeBufferInContainer(Handler)), matcher());
1260 }
1261
1262 void handleUnsafeOperation(UnsafeBufferUsageHandler &Handler,
1263 bool IsRelatedToDecl,
1264 ASTContext &Ctx) const override {
1265 Handler.handleUnsafeOperationInContainer(Ctor, IsRelatedToDecl, Ctx);
1266 }
1267 SourceLocation getSourceLoc() const override { return Ctor->getBeginLoc(); }
1268
1269 DeclUseList getClaimedVarUseSites() const override {
1270 // If the constructor call is of the form `std::span{var, n}`, `var` is
1271 // considered an unsafe variable.
1272 if (auto *DRE = dyn_cast<DeclRefExpr>(Ctor->getArg(0))) {
1273 if (isa<VarDecl>(DRE->getDecl()))
1274 return {DRE};
1275 }
1276 return {};
1277 }
1278};
1279
1280/// A pointer initialization expression of the form:
1281/// \code
1282/// int *p = q;
1283/// \endcode
1284class PointerInitGadget : public FixableGadget {
1285private:
1286 static constexpr const char *const PointerInitLHSTag = "ptrInitLHS";
1287 static constexpr const char *const PointerInitRHSTag = "ptrInitRHS";
1288 const VarDecl *PtrInitLHS; // the LHS pointer expression in `PI`
1289 const DeclRefExpr *PtrInitRHS; // the RHS pointer expression in `PI`
1290
1291public:
1292 PointerInitGadget(const MatchFinder::MatchResult &Result)
1293 : FixableGadget(Kind::PointerInit),
1294 PtrInitLHS(Result.Nodes.getNodeAs<VarDecl>(PointerInitLHSTag)),
1295 PtrInitRHS(Result.Nodes.getNodeAs<DeclRefExpr>(PointerInitRHSTag)) {}
1296
1297 static bool classof(const Gadget *G) {
1298 return G->getKind() == Kind::PointerInit;
1299 }
1300
1301 static Matcher matcher() {
1302 auto PtrInitStmt = declStmt(hasSingleDecl(
1303 varDecl(hasInitializer(ignoringImpCasts(
1304 declRefExpr(hasPointerType(), toSupportedVariable())
1305 .bind(PointerInitRHSTag))))
1306 .bind(PointerInitLHSTag)));
1307
1308 return stmt(PtrInitStmt);
1309 }
1310
1311 virtual std::optional<FixItList>
1312 getFixits(const FixitStrategy &S) const override;
1313 SourceLocation getSourceLoc() const override {
1314 return PtrInitRHS->getBeginLoc();
1315 }
1316
1317 virtual DeclUseList getClaimedVarUseSites() const override {
1318 return DeclUseList{PtrInitRHS};
1319 }
1320
1321 virtual std::optional<std::pair<const VarDecl *, const VarDecl *>>
1322 getStrategyImplications() const override {
1323 return std::make_pair(PtrInitLHS, cast<VarDecl>(PtrInitRHS->getDecl()));
1324 }
1325};
1326
1327/// A pointer assignment expression of the form:
1328/// \code
1329/// p = q;
1330/// \endcode
1331/// where both `p` and `q` are pointers.
1332class PtrToPtrAssignmentGadget : public FixableGadget {
1333private:
1334 static constexpr const char *const PointerAssignLHSTag = "ptrLHS";
1335 static constexpr const char *const PointerAssignRHSTag = "ptrRHS";
1336 const DeclRefExpr *PtrLHS; // the LHS pointer expression in `PA`
1337 const DeclRefExpr *PtrRHS; // the RHS pointer expression in `PA`
1338
1339public:
1340 PtrToPtrAssignmentGadget(const MatchFinder::MatchResult &Result)
1341 : FixableGadget(Kind::PtrToPtrAssignment),
1342 PtrLHS(Result.Nodes.getNodeAs<DeclRefExpr>(PointerAssignLHSTag)),
1343 PtrRHS(Result.Nodes.getNodeAs<DeclRefExpr>(PointerAssignRHSTag)) {}
1344
1345 static bool classof(const Gadget *G) {
1346 return G->getKind() == Kind::PtrToPtrAssignment;
1347 }
1348
1349 static Matcher matcher() {
1350 auto PtrAssignExpr = binaryOperator(
1351 allOf(hasOperatorName("="),
1352 hasRHS(ignoringParenImpCasts(
1353 declRefExpr(hasPointerType(), toSupportedVariable())
1354 .bind(PointerAssignRHSTag))),
1355 hasLHS(declRefExpr(hasPointerType(), toSupportedVariable())
1356 .bind(PointerAssignLHSTag))));
1357
1358 return stmt(isInUnspecifiedUntypedContext(PtrAssignExpr));
1359 }
1360
1361 virtual std::optional<FixItList>
1362 getFixits(const FixitStrategy &S) const override;
1363 SourceLocation getSourceLoc() const override { return PtrLHS->getBeginLoc(); }
1364
1365 virtual DeclUseList getClaimedVarUseSites() const override {
1366 return DeclUseList{PtrLHS, PtrRHS};
1367 }
1368
1369 virtual std::optional<std::pair<const VarDecl *, const VarDecl *>>
1370 getStrategyImplications() const override {
1371 return std::make_pair(cast<VarDecl>(PtrLHS->getDecl()),
1372 cast<VarDecl>(PtrRHS->getDecl()));
1373 }
1374};
1375
1376/// An assignment expression of the form:
1377/// \code
1378/// ptr = array;
1379/// \endcode
1380/// where `p` is a pointer and `array` is a constant size array.
1381class CArrayToPtrAssignmentGadget : public FixableGadget {
1382private:
1383 static constexpr const char *const PointerAssignLHSTag = "ptrLHS";
1384 static constexpr const char *const PointerAssignRHSTag = "ptrRHS";
1385 const DeclRefExpr *PtrLHS; // the LHS pointer expression in `PA`
1386 const DeclRefExpr *PtrRHS; // the RHS pointer expression in `PA`
1387
1388public:
1389 CArrayToPtrAssignmentGadget(const MatchFinder::MatchResult &Result)
1390 : FixableGadget(Kind::CArrayToPtrAssignment),
1391 PtrLHS(Result.Nodes.getNodeAs<DeclRefExpr>(PointerAssignLHSTag)),
1392 PtrRHS(Result.Nodes.getNodeAs<DeclRefExpr>(PointerAssignRHSTag)) {}
1393
1394 static bool classof(const Gadget *G) {
1395 return G->getKind() == Kind::CArrayToPtrAssignment;
1396 }
1397
1398 static Matcher matcher() {
1399 auto PtrAssignExpr = binaryOperator(
1400 allOf(hasOperatorName("="),
1401 hasRHS(ignoringParenImpCasts(
1402 declRefExpr(hasType(hasCanonicalType(constantArrayType())),
1403 toSupportedVariable())
1404 .bind(PointerAssignRHSTag))),
1405 hasLHS(declRefExpr(hasPointerType(), toSupportedVariable())
1406 .bind(PointerAssignLHSTag))));
1407
1408 return stmt(isInUnspecifiedUntypedContext(PtrAssignExpr));
1409 }
1410
1411 virtual std::optional<FixItList>
1412 getFixits(const FixitStrategy &S) const override;
1413 SourceLocation getSourceLoc() const override { return PtrLHS->getBeginLoc(); }
1414
1415 virtual DeclUseList getClaimedVarUseSites() const override {
1416 return DeclUseList{PtrLHS, PtrRHS};
1417 }
1418
1419 virtual std::optional<std::pair<const VarDecl *, const VarDecl *>>
1420 getStrategyImplications() const override {
1421 return {};
1422 }
1423};
1424
1425/// A call of a function or method that performs unchecked buffer operations
1426/// over one of its pointer parameters.
1427class UnsafeBufferUsageAttrGadget : public WarningGadget {
1428 constexpr static const char *const OpTag = "attr_expr";
1429 const Expr *Op;
1430
1431public:
1432 UnsafeBufferUsageAttrGadget(const MatchFinder::MatchResult &Result)
1433 : WarningGadget(Kind::UnsafeBufferUsageAttr),
1434 Op(Result.Nodes.getNodeAs<Expr>(OpTag)) {}
1435
1436 static bool classof(const Gadget *G) {
1437 return G->getKind() == Kind::UnsafeBufferUsageAttr;
1438 }
1439
1440 static Matcher matcher() {
1441 auto HasUnsafeFieldDecl =
1442 member(fieldDecl(hasAttr(attr::UnsafeBufferUsage)));
1443
1444 auto HasUnsafeFnDecl =
1445 callee(functionDecl(hasAttr(attr::UnsafeBufferUsage)));
1446
1447 return stmt(anyOf(callExpr(HasUnsafeFnDecl).bind(OpTag),
1448 memberExpr(HasUnsafeFieldDecl).bind(OpTag)));
1449 }
1450
1451 void handleUnsafeOperation(UnsafeBufferUsageHandler &Handler,
1452 bool IsRelatedToDecl,
1453 ASTContext &Ctx) const override {
1454 Handler.handleUnsafeOperation(Op, IsRelatedToDecl, Ctx);
1455 }
1456 SourceLocation getSourceLoc() const override { return Op->getBeginLoc(); }
1457
1458 DeclUseList getClaimedVarUseSites() const override { return {}; }
1459};
1460
1461/// A call of a constructor that performs unchecked buffer operations
1462/// over one of its pointer parameters, or constructs a class object that will
1463/// perform buffer operations that depend on the correctness of the parameters.
1464class UnsafeBufferUsageCtorAttrGadget : public WarningGadget {
1465 constexpr static const char *const OpTag = "cxx_construct_expr";
1466 const CXXConstructExpr *Op;
1467
1468public:
1469 UnsafeBufferUsageCtorAttrGadget(const MatchFinder::MatchResult &Result)
1470 : WarningGadget(Kind::UnsafeBufferUsageCtorAttr),
1471 Op(Result.Nodes.getNodeAs<CXXConstructExpr>(OpTag)) {}
1472
1473 static bool classof(const Gadget *G) {
1474 return G->getKind() == Kind::UnsafeBufferUsageCtorAttr;
1475 }
1476
1477 static Matcher matcher() {
1478 auto HasUnsafeCtorDecl =
1479 hasDeclaration(cxxConstructorDecl(hasAttr(attr::UnsafeBufferUsage)));
1480 // std::span(ptr, size) ctor is handled by SpanTwoParamConstructorGadget.
1481 auto HasTwoParamSpanCtorDecl = SpanTwoParamConstructorGadget::matcher();
1482 return stmt(
1483 cxxConstructExpr(HasUnsafeCtorDecl, unless(HasTwoParamSpanCtorDecl))
1484 .bind(OpTag));
1485 }
1486
1487 void handleUnsafeOperation(UnsafeBufferUsageHandler &Handler,
1488 bool IsRelatedToDecl,
1489 ASTContext &Ctx) const override {
1490 Handler.handleUnsafeOperation(Op, IsRelatedToDecl, Ctx);
1491 }
1492 SourceLocation getSourceLoc() const override { return Op->getBeginLoc(); }
1493
1494 DeclUseList getClaimedVarUseSites() const override { return {}; }
1495};
1496
1497// Warning gadget for unsafe invocation of span::data method.
1498// Triggers when the pointer returned by the invocation is immediately
1499// cast to a larger type.
1500
1501class DataInvocationGadget : public WarningGadget {
1502 constexpr static const char *const OpTag = "data_invocation_expr";
1503 const ExplicitCastExpr *Op;
1504
1505public:
1506 DataInvocationGadget(const MatchFinder::MatchResult &Result)
1507 : WarningGadget(Kind::DataInvocation),
1508 Op(Result.Nodes.getNodeAs<ExplicitCastExpr>(OpTag)) {}
1509
1510 static bool classof(const Gadget *G) {
1511 return G->getKind() == Kind::DataInvocation;
1512 }
1513
1514 static Matcher matcher() {
1515
1516 Matcher callExpr = cxxMemberCallExpr(callee(
1517 cxxMethodDecl(hasName("data"),
1518 ofClass(anyOf(hasName("std::span"), hasName("std::array"),
1519 hasName("std::vector"))))));
1520 return stmt(
1522 .bind(OpTag));
1523 }
1524
1525 void handleUnsafeOperation(UnsafeBufferUsageHandler &Handler,
1526 bool IsRelatedToDecl,
1527 ASTContext &Ctx) const override {
1528 Handler.handleUnsafeOperation(Op, IsRelatedToDecl, Ctx);
1529 }
1530 SourceLocation getSourceLoc() const override { return Op->getBeginLoc(); }
1531
1532 DeclUseList getClaimedVarUseSites() const override { return {}; }
1533};
1534
1535class UnsafeLibcFunctionCallGadget : public WarningGadget {
1536 const CallExpr *const Call;
1537 const Expr *UnsafeArg = nullptr;
1538 constexpr static const char *const Tag = "UnsafeLibcFunctionCall";
1539 // Extra tags for additional information:
1540 constexpr static const char *const UnsafeSprintfTag =
1541 "UnsafeLibcFunctionCall_sprintf";
1542 constexpr static const char *const UnsafeSizedByTag =
1543 "UnsafeLibcFunctionCall_sized_by";
1544 constexpr static const char *const UnsafeStringTag =
1545 "UnsafeLibcFunctionCall_string";
1546 constexpr static const char *const UnsafeVaListTag =
1547 "UnsafeLibcFunctionCall_va_list";
1548
1549 enum UnsafeKind {
1550 OTHERS = 0, // no specific information, the callee function is unsafe
1551 SPRINTF = 1, // never call `-sprintf`s, call `-snprintf`s instead.
1552 SIZED_BY =
1553 2, // the first two arguments of `snprintf` function have
1554 // "__sized_by" relation but they do not conform to safe patterns
1555 STRING = 3, // an argument is a pointer-to-char-as-string but does not
1556 // guarantee null-termination
1557 VA_LIST = 4, // one of the `-printf`s function that take va_list, which is
1558 // considered unsafe as it is not compile-time check
1559 } WarnedFunKind = OTHERS;
1560
1561public:
1562 UnsafeLibcFunctionCallGadget(const MatchFinder::MatchResult &Result)
1563 : WarningGadget(Kind::UnsafeLibcFunctionCall),
1564 Call(Result.Nodes.getNodeAs<CallExpr>(Tag)) {
1565 if (Result.Nodes.getNodeAs<Decl>(UnsafeSprintfTag))
1566 WarnedFunKind = SPRINTF;
1567 else if (auto *E = Result.Nodes.getNodeAs<Expr>(UnsafeStringTag)) {
1568 WarnedFunKind = STRING;
1569 UnsafeArg = E;
1570 } else if (Result.Nodes.getNodeAs<CallExpr>(UnsafeSizedByTag)) {
1571 WarnedFunKind = SIZED_BY;
1572 UnsafeArg = Call->getArg(0);
1573 } else if (Result.Nodes.getNodeAs<Decl>(UnsafeVaListTag))
1574 WarnedFunKind = VA_LIST;
1575 }
1576
1577 static Matcher matcher(const UnsafeBufferUsageHandler *Handler) {
1578 return stmt(unless(ignoreUnsafeLibcCall(Handler)),
1579 anyOf(
1580 callExpr(
1581 callee(functionDecl(anyOf(
1582 // Match a predefined unsafe libc
1583 // function:
1584 functionDecl(libc_func_matchers::isPredefinedUnsafeLibcFunc()),
1585 // Match a call to one of the `v*printf` functions
1586 // taking va-list, which cannot be checked at
1587 // compile-time:
1588 functionDecl(libc_func_matchers::isUnsafeVaListPrintfFunc())
1589 .bind(UnsafeVaListTag),
1590 // Match a call to a `sprintf` function, which is never
1591 // safe:
1592 functionDecl(libc_func_matchers::isUnsafeSprintfFunc())
1593 .bind(UnsafeSprintfTag)))),
1594 // (unless the call has a sole string literal argument):
1595 unless(
1596 allOf(hasArgument(0, expr(stringLiteral())), hasNumArgs(1)))),
1597
1598 // The following two cases require checking against actual
1599 // arguments of the call:
1600
1601 // Match a call to an `snprintf` function. And first two
1602 // arguments of the call (that describe a buffer) are not in
1603 // safe patterns:
1604 callExpr(callee(functionDecl(libc_func_matchers::isNormalPrintfFunc())),
1605 libc_func_matchers::hasUnsafeSnprintfBuffer())
1606 .bind(UnsafeSizedByTag),
1607 // Match a call to a `printf` function, which can be safe if
1608 // all arguments are null-terminated:
1609 callExpr(callee(functionDecl(libc_func_matchers::isNormalPrintfFunc())),
1610 libc_func_matchers::hasUnsafePrintfStringArg(
1611 expr().bind(UnsafeStringTag)))));
1612 }
1613
1614 const Stmt *getBaseStmt() const { return Call; }
1615
1616 SourceLocation getSourceLoc() const override { return Call->getBeginLoc(); }
1617
1618 void handleUnsafeOperation(UnsafeBufferUsageHandler &Handler,
1619 bool IsRelatedToDecl,
1620 ASTContext &Ctx) const override {
1621 Handler.handleUnsafeLibcCall(Call, WarnedFunKind, Ctx, UnsafeArg);
1622 }
1623
1624 DeclUseList getClaimedVarUseSites() const override { return {}; }
1625};
1626
1627// Represents expressions of the form `DRE[*]` in the Unspecified Lvalue
1628// Context (see `isInUnspecifiedLvalueContext`).
1629// Note here `[]` is the built-in subscript operator.
1630class ULCArraySubscriptGadget : public FixableGadget {
1631private:
1632 static constexpr const char *const ULCArraySubscriptTag =
1633 "ArraySubscriptUnderULC";
1634 const ArraySubscriptExpr *Node;
1635
1636public:
1637 ULCArraySubscriptGadget(const MatchFinder::MatchResult &Result)
1638 : FixableGadget(Kind::ULCArraySubscript),
1639 Node(Result.Nodes.getNodeAs<ArraySubscriptExpr>(ULCArraySubscriptTag)) {
1640 assert(Node != nullptr && "Expecting a non-null matching result");
1641 }
1642
1643 static bool classof(const Gadget *G) {
1644 return G->getKind() == Kind::ULCArraySubscript;
1645 }
1646
1647 static Matcher matcher() {
1648 auto ArrayOrPtr = anyOf(hasPointerType(), hasArrayType());
1649 auto BaseIsArrayOrPtrDRE = hasBase(
1650 ignoringParenImpCasts(declRefExpr(ArrayOrPtr, toSupportedVariable())));
1651 auto Target =
1652 arraySubscriptExpr(BaseIsArrayOrPtrDRE).bind(ULCArraySubscriptTag);
1653
1655 }
1656
1657 virtual std::optional<FixItList>
1658 getFixits(const FixitStrategy &S) const override;
1659 SourceLocation getSourceLoc() const override { return Node->getBeginLoc(); }
1660
1661 virtual DeclUseList getClaimedVarUseSites() const override {
1662 if (const auto *DRE =
1663 dyn_cast<DeclRefExpr>(Node->getBase()->IgnoreImpCasts())) {
1664 return {DRE};
1665 }
1666 return {};
1667 }
1668};
1669
1670// Fixable gadget to handle stand alone pointers of the form `UPC(DRE)` in the
1671// unspecified pointer context (isInUnspecifiedPointerContext). The gadget emits
1672// fixit of the form `UPC(DRE.data())`.
1673class UPCStandalonePointerGadget : public FixableGadget {
1674private:
1675 static constexpr const char *const DeclRefExprTag = "StandalonePointer";
1676 const DeclRefExpr *Node;
1677
1678public:
1679 UPCStandalonePointerGadget(const MatchFinder::MatchResult &Result)
1680 : FixableGadget(Kind::UPCStandalonePointer),
1681 Node(Result.Nodes.getNodeAs<DeclRefExpr>(DeclRefExprTag)) {
1682 assert(Node != nullptr && "Expecting a non-null matching result");
1683 }
1684
1685 static bool classof(const Gadget *G) {
1686 return G->getKind() == Kind::UPCStandalonePointer;
1687 }
1688
1689 static Matcher matcher() {
1690 auto ArrayOrPtr = anyOf(hasPointerType(), hasArrayType());
1691 auto target = expr(ignoringParenImpCasts(
1692 declRefExpr(allOf(ArrayOrPtr, toSupportedVariable()))
1693 .bind(DeclRefExprTag)));
1694 return stmt(isInUnspecifiedPointerContext(target));
1695 }
1696
1697 virtual std::optional<FixItList>
1698 getFixits(const FixitStrategy &S) const override;
1699 SourceLocation getSourceLoc() const override { return Node->getBeginLoc(); }
1700
1701 virtual DeclUseList getClaimedVarUseSites() const override { return {Node}; }
1702};
1703
1704class PointerDereferenceGadget : public FixableGadget {
1705 static constexpr const char *const BaseDeclRefExprTag = "BaseDRE";
1706 static constexpr const char *const OperatorTag = "op";
1707
1708 const DeclRefExpr *BaseDeclRefExpr = nullptr;
1709 const UnaryOperator *Op = nullptr;
1710
1711public:
1712 PointerDereferenceGadget(const MatchFinder::MatchResult &Result)
1713 : FixableGadget(Kind::PointerDereference),
1714 BaseDeclRefExpr(
1715 Result.Nodes.getNodeAs<DeclRefExpr>(BaseDeclRefExprTag)),
1716 Op(Result.Nodes.getNodeAs<UnaryOperator>(OperatorTag)) {}
1717
1718 static bool classof(const Gadget *G) {
1719 return G->getKind() == Kind::PointerDereference;
1720 }
1721
1722 static Matcher matcher() {
1723 auto Target =
1725 hasOperatorName("*"),
1726 has(expr(ignoringParenImpCasts(
1727 declRefExpr(toSupportedVariable()).bind(BaseDeclRefExprTag)))))
1728 .bind(OperatorTag);
1729
1731 }
1732
1733 DeclUseList getClaimedVarUseSites() const override {
1734 return {BaseDeclRefExpr};
1735 }
1736
1737 virtual std::optional<FixItList>
1738 getFixits(const FixitStrategy &S) const override;
1739 SourceLocation getSourceLoc() const override { return Op->getBeginLoc(); }
1740};
1741
1742// Represents expressions of the form `&DRE[any]` in the Unspecified Pointer
1743// Context (see `isInUnspecifiedPointerContext`).
1744// Note here `[]` is the built-in subscript operator.
1745class UPCAddressofArraySubscriptGadget : public FixableGadget {
1746private:
1747 static constexpr const char *const UPCAddressofArraySubscriptTag =
1748 "AddressofArraySubscriptUnderUPC";
1749 const UnaryOperator *Node; // the `&DRE[any]` node
1750
1751public:
1752 UPCAddressofArraySubscriptGadget(const MatchFinder::MatchResult &Result)
1753 : FixableGadget(Kind::ULCArraySubscript),
1754 Node(Result.Nodes.getNodeAs<UnaryOperator>(
1755 UPCAddressofArraySubscriptTag)) {
1756 assert(Node != nullptr && "Expecting a non-null matching result");
1757 }
1758
1759 static bool classof(const Gadget *G) {
1760 return G->getKind() == Kind::UPCAddressofArraySubscript;
1761 }
1762
1763 static Matcher matcher() {
1764 return expr(isInUnspecifiedPointerContext(expr(ignoringImpCasts(
1766 hasOperatorName("&"),
1767 hasUnaryOperand(arraySubscriptExpr(hasBase(
1768 ignoringParenImpCasts(declRefExpr(toSupportedVariable()))))))
1769 .bind(UPCAddressofArraySubscriptTag)))));
1770 }
1771
1772 virtual std::optional<FixItList>
1773 getFixits(const FixitStrategy &) const override;
1774 SourceLocation getSourceLoc() const override { return Node->getBeginLoc(); }
1775
1776 virtual DeclUseList getClaimedVarUseSites() const override {
1777 const auto *ArraySubst = cast<ArraySubscriptExpr>(Node->getSubExpr());
1778 const auto *DRE =
1779 cast<DeclRefExpr>(ArraySubst->getBase()->IgnoreParenImpCasts());
1780 return {DRE};
1781 }
1782};
1783} // namespace
1784
1785namespace {
1786// An auxiliary tracking facility for the fixit analysis. It helps connect
1787// declarations to its uses and make sure we've covered all uses with our
1788// analysis before we try to fix the declaration.
1789class DeclUseTracker {
1790 using UseSetTy = SmallSet<const DeclRefExpr *, 16>;
1791 using DefMapTy = DenseMap<const VarDecl *, const DeclStmt *>;
1792
1793 // Allocate on the heap for easier move.
1794 std::unique_ptr<UseSetTy> Uses{std::make_unique<UseSetTy>()};
1795 DefMapTy Defs{};
1796
1797public:
1798 DeclUseTracker() = default;
1799 DeclUseTracker(const DeclUseTracker &) = delete; // Let's avoid copies.
1800 DeclUseTracker &operator=(const DeclUseTracker &) = delete;
1801 DeclUseTracker(DeclUseTracker &&) = default;
1802 DeclUseTracker &operator=(DeclUseTracker &&) = default;
1803
1804 // Start tracking a freshly discovered DRE.
1805 void discoverUse(const DeclRefExpr *DRE) { Uses->insert(DRE); }
1806
1807 // Stop tracking the DRE as it's been fully figured out.
1808 void claimUse(const DeclRefExpr *DRE) {
1809 assert(Uses->count(DRE) &&
1810 "DRE not found or claimed by multiple matchers!");
1811 Uses->erase(DRE);
1812 }
1813
1814 // A variable is unclaimed if at least one use is unclaimed.
1815 bool hasUnclaimedUses(const VarDecl *VD) const {
1816 // FIXME: Can this be less linear? Maybe maintain a map from VDs to DREs?
1817 return any_of(*Uses, [VD](const DeclRefExpr *DRE) {
1818 return DRE->getDecl()->getCanonicalDecl() == VD->getCanonicalDecl();
1819 });
1820 }
1821
1822 UseSetTy getUnclaimedUses(const VarDecl *VD) const {
1823 UseSetTy ReturnSet;
1824 for (auto use : *Uses) {
1825 if (use->getDecl()->getCanonicalDecl() == VD->getCanonicalDecl()) {
1826 ReturnSet.insert(use);
1827 }
1828 }
1829 return ReturnSet;
1830 }
1831
1832 void discoverDecl(const DeclStmt *DS) {
1833 for (const Decl *D : DS->decls()) {
1834 if (const auto *VD = dyn_cast<VarDecl>(D)) {
1835 // FIXME: Assertion temporarily disabled due to a bug in
1836 // ASTMatcher internal behavior in presence of GNU
1837 // statement-expressions. We need to properly investigate this
1838 // because it can screw up our algorithm in other ways.
1839 // assert(Defs.count(VD) == 0 && "Definition already discovered!");
1840 Defs[VD] = DS;
1841 }
1842 }
1843 }
1844
1845 const DeclStmt *lookupDecl(const VarDecl *VD) const {
1846 return Defs.lookup(VD);
1847 }
1848};
1849} // namespace
1850
1851// Representing a pointer type expression of the form `++Ptr` in an Unspecified
1852// Pointer Context (UPC):
1853class UPCPreIncrementGadget : public FixableGadget {
1854private:
1855 static constexpr const char *const UPCPreIncrementTag =
1856 "PointerPreIncrementUnderUPC";
1857 const UnaryOperator *Node; // the `++Ptr` node
1858
1859public:
1861 : FixableGadget(Kind::UPCPreIncrement),
1862 Node(Result.Nodes.getNodeAs<UnaryOperator>(UPCPreIncrementTag)) {
1863 assert(Node != nullptr && "Expecting a non-null matching result");
1864 }
1865
1866 static bool classof(const Gadget *G) {
1867 return G->getKind() == Kind::UPCPreIncrement;
1868 }
1869
1870 static Matcher matcher() {
1871 // Note here we match `++Ptr` for any expression `Ptr` of pointer type.
1872 // Although currently we can only provide fix-its when `Ptr` is a DRE, we
1873 // can have the matcher be general, so long as `getClaimedVarUseSites` does
1874 // things right.
1875 return stmt(isInUnspecifiedPointerContext(expr(ignoringImpCasts(
1876 unaryOperator(isPreInc(),
1877 hasUnaryOperand(declRefExpr(toSupportedVariable())))
1878 .bind(UPCPreIncrementTag)))));
1879 }
1880
1881 virtual std::optional<FixItList>
1882 getFixits(const FixitStrategy &S) const override;
1883 SourceLocation getSourceLoc() const override { return Node->getBeginLoc(); }
1884
1885 virtual DeclUseList getClaimedVarUseSites() const override {
1886 return {dyn_cast<DeclRefExpr>(Node->getSubExpr())};
1887 }
1888};
1889
1890// Representing a pointer type expression of the form `Ptr += n` in an
1891// Unspecified Untyped Context (UUC):
1892class UUCAddAssignGadget : public FixableGadget {
1893private:
1894 static constexpr const char *const UUCAddAssignTag =
1895 "PointerAddAssignUnderUUC";
1896 static constexpr const char *const OffsetTag = "Offset";
1897
1898 const BinaryOperator *Node; // the `Ptr += n` node
1899 const Expr *Offset = nullptr;
1900
1901public:
1903 : FixableGadget(Kind::UUCAddAssign),
1904 Node(Result.Nodes.getNodeAs<BinaryOperator>(UUCAddAssignTag)),
1905 Offset(Result.Nodes.getNodeAs<Expr>(OffsetTag)) {
1906 assert(Node != nullptr && "Expecting a non-null matching result");
1907 }
1908
1909 static bool classof(const Gadget *G) {
1910 return G->getKind() == Kind::UUCAddAssign;
1911 }
1912
1913 static Matcher matcher() {
1914 // clang-format off
1915 return stmt(isInUnspecifiedUntypedContext(expr(ignoringImpCasts(
1916 binaryOperator(hasOperatorName("+="),
1917 hasLHS(
1920 toSupportedVariable())),
1921 hasRHS(expr().bind(OffsetTag)))
1922 .bind(UUCAddAssignTag)))));
1923 // clang-format on
1924 }
1925
1926 virtual std::optional<FixItList>
1927 getFixits(const FixitStrategy &S) const override;
1928 SourceLocation getSourceLoc() const override { return Node->getBeginLoc(); }
1929
1930 virtual DeclUseList getClaimedVarUseSites() const override {
1931 return {dyn_cast<DeclRefExpr>(Node->getLHS())};
1932 }
1933};
1934
1935// Representing a fixable expression of the form `*(ptr + 123)` or `*(123 +
1936// ptr)`:
1937class DerefSimplePtrArithFixableGadget : public FixableGadget {
1938 static constexpr const char *const BaseDeclRefExprTag = "BaseDRE";
1939 static constexpr const char *const DerefOpTag = "DerefOp";
1940 static constexpr const char *const AddOpTag = "AddOp";
1941 static constexpr const char *const OffsetTag = "Offset";
1942
1943 const DeclRefExpr *BaseDeclRefExpr = nullptr;
1944 const UnaryOperator *DerefOp = nullptr;
1945 const BinaryOperator *AddOp = nullptr;
1946 const IntegerLiteral *Offset = nullptr;
1947
1948public:
1950 : FixableGadget(Kind::DerefSimplePtrArithFixable),
1951 BaseDeclRefExpr(
1952 Result.Nodes.getNodeAs<DeclRefExpr>(BaseDeclRefExprTag)),
1953 DerefOp(Result.Nodes.getNodeAs<UnaryOperator>(DerefOpTag)),
1954 AddOp(Result.Nodes.getNodeAs<BinaryOperator>(AddOpTag)),
1955 Offset(Result.Nodes.getNodeAs<IntegerLiteral>(OffsetTag)) {}
1956
1957 static Matcher matcher() {
1958 // clang-format off
1959 auto ThePtr = expr(hasPointerType(),
1960 ignoringImpCasts(declRefExpr(toSupportedVariable()).
1961 bind(BaseDeclRefExprTag)));
1962 auto PlusOverPtrAndInteger = expr(anyOf(
1963 binaryOperator(hasOperatorName("+"), hasLHS(ThePtr),
1964 hasRHS(integerLiteral().bind(OffsetTag)))
1965 .bind(AddOpTag),
1966 binaryOperator(hasOperatorName("+"), hasRHS(ThePtr),
1967 hasLHS(integerLiteral().bind(OffsetTag)))
1968 .bind(AddOpTag)));
1970 hasOperatorName("*"),
1971 hasUnaryOperand(ignoringParens(PlusOverPtrAndInteger)))
1972 .bind(DerefOpTag));
1973 // clang-format on
1974 }
1975
1976 virtual std::optional<FixItList>
1977 getFixits(const FixitStrategy &s) const final;
1978 SourceLocation getSourceLoc() const override {
1979 return DerefOp->getBeginLoc();
1980 }
1981
1982 virtual DeclUseList getClaimedVarUseSites() const final {
1983 return {BaseDeclRefExpr};
1984 }
1985};
1986
1987/// Scan the function and return a list of gadgets found with provided kits.
1988static void findGadgets(const Stmt *S, ASTContext &Ctx,
1989 const UnsafeBufferUsageHandler &Handler,
1990 bool EmitSuggestions, FixableGadgetList &FixableGadgets,
1991 WarningGadgetList &WarningGadgets,
1992 DeclUseTracker &Tracker) {
1993
1994 struct GadgetFinderCallback : MatchFinder::MatchCallback {
1995 GadgetFinderCallback(FixableGadgetList &FixableGadgets,
1996 WarningGadgetList &WarningGadgets,
1997 DeclUseTracker &Tracker)
1998 : FixableGadgets(FixableGadgets), WarningGadgets(WarningGadgets),
1999 Tracker(Tracker) {}
2000
2001 void run(const MatchFinder::MatchResult &Result) override {
2002 // In debug mode, assert that we've found exactly one gadget.
2003 // This helps us avoid conflicts in .bind() tags.
2004#if NDEBUG
2005#define NEXT return
2006#else
2007 [[maybe_unused]] int numFound = 0;
2008#define NEXT ++numFound
2009#endif
2010
2011 if (const auto *DRE = Result.Nodes.getNodeAs<DeclRefExpr>("any_dre")) {
2012 Tracker.discoverUse(DRE);
2013 NEXT;
2014 }
2015
2016 if (const auto *DS = Result.Nodes.getNodeAs<DeclStmt>("any_ds")) {
2017 Tracker.discoverDecl(DS);
2018 NEXT;
2019 }
2020
2021 // Figure out which matcher we've found, and call the appropriate
2022 // subclass constructor.
2023 // FIXME: Can we do this more logarithmically?
2024#define FIXABLE_GADGET(name) \
2025 if (Result.Nodes.getNodeAs<Stmt>(#name)) { \
2026 FixableGadgets.push_back(std::make_unique<name##Gadget>(Result)); \
2027 NEXT; \
2028 }
2029#include "clang/Analysis/Analyses/UnsafeBufferUsageGadgets.def"
2030#define WARNING_GADGET(name) \
2031 if (Result.Nodes.getNodeAs<Stmt>(#name)) { \
2032 WarningGadgets.push_back(std::make_unique<name##Gadget>(Result)); \
2033 NEXT; \
2034 }
2035#include "clang/Analysis/Analyses/UnsafeBufferUsageGadgets.def"
2036
2037 assert(numFound >= 1 && "Gadgets not found in match result!");
2038 assert(numFound <= 1 && "Conflicting bind tags in gadgets!");
2039 }
2040
2041 FixableGadgetList &FixableGadgets;
2042 WarningGadgetList &WarningGadgets;
2043 DeclUseTracker &Tracker;
2044 };
2045
2046 MatchFinder M;
2047 GadgetFinderCallback CB{FixableGadgets, WarningGadgets, Tracker};
2048
2049 // clang-format off
2050 M.addMatcher(
2051 stmt(
2052 forEachDescendantEvaluatedStmt(stmt(anyOf(
2053 // Add Gadget::matcher() for every gadget in the registry.
2054#define WARNING_GADGET(x) \
2055 allOf(x ## Gadget::matcher().bind(#x), \
2056 notInSafeBufferOptOut(&Handler)),
2057#define WARNING_OPTIONAL_GADGET(x) \
2058 allOf(x ## Gadget::matcher(&Handler).bind(#x), \
2059 notInSafeBufferOptOut(&Handler)),
2060#include "clang/Analysis/Analyses/UnsafeBufferUsageGadgets.def"
2061 // Avoid a hanging comma.
2062 unless(stmt())
2063 )))
2064 ),
2065 &CB
2066 );
2067 // clang-format on
2068
2069 if (EmitSuggestions) {
2070 // clang-format off
2071 M.addMatcher(
2072 stmt(
2073 forEachDescendantStmt(stmt(eachOf(
2074#define FIXABLE_GADGET(x) \
2075 x ## Gadget::matcher().bind(#x),
2076#include "clang/Analysis/Analyses/UnsafeBufferUsageGadgets.def"
2077 // In parallel, match all DeclRefExprs so that to find out
2078 // whether there are any uncovered by gadgets.
2080 to(anyOf(varDecl(), bindingDecl()))).bind("any_dre"),
2081 // Also match DeclStmts because we'll need them when fixing
2082 // their underlying VarDecls that otherwise don't have
2083 // any backreferences to DeclStmts.
2084 declStmt().bind("any_ds")
2085 )))
2086 ),
2087 &CB
2088 );
2089 // clang-format on
2090 }
2091
2092 M.match(*S, Ctx);
2093}
2094
2095// Compares AST nodes by source locations.
2096template <typename NodeTy> struct CompareNode {
2097 bool operator()(const NodeTy *N1, const NodeTy *N2) const {
2098 return N1->getBeginLoc().getRawEncoding() <
2099 N2->getBeginLoc().getRawEncoding();
2100 }
2101};
2102
2104 std::map<const VarDecl *, std::set<const WarningGadget *>,
2105 // To keep keys sorted by their locations in the map so that the
2106 // order is deterministic:
2109 // These Gadgets are not related to pointer variables (e. g. temporaries).
2111};
2112
2113static WarningGadgetSets
2114groupWarningGadgetsByVar(const WarningGadgetList &AllUnsafeOperations) {
2115 WarningGadgetSets result;
2116 // If some gadgets cover more than one
2117 // variable, they'll appear more than once in the map.
2118 for (auto &G : AllUnsafeOperations) {
2119 DeclUseList ClaimedVarUseSites = G->getClaimedVarUseSites();
2120
2121 bool AssociatedWithVarDecl = false;
2122 for (const DeclRefExpr *DRE : ClaimedVarUseSites) {
2123 if (const auto *VD = dyn_cast<VarDecl>(DRE->getDecl())) {
2124 result.byVar[VD].insert(G.get());
2125 AssociatedWithVarDecl = true;
2126 }
2127 }
2128
2129 if (!AssociatedWithVarDecl) {
2130 result.noVar.push_back(G.get());
2131 continue;
2132 }
2133 }
2134 return result;
2135}
2136
2138 std::map<const VarDecl *, std::set<const FixableGadget *>,
2139 // To keep keys sorted by their locations in the map so that the
2140 // order is deterministic:
2143};
2144
2145static FixableGadgetSets
2146groupFixablesByVar(FixableGadgetList &&AllFixableOperations) {
2147 FixableGadgetSets FixablesForUnsafeVars;
2148 for (auto &F : AllFixableOperations) {
2149 DeclUseList DREs = F->getClaimedVarUseSites();
2150
2151 for (const DeclRefExpr *DRE : DREs) {
2152 if (const auto *VD = dyn_cast<VarDecl>(DRE->getDecl())) {
2153 FixablesForUnsafeVars.byVar[VD].insert(F.get());
2154 }
2155 }
2156 }
2157 return FixablesForUnsafeVars;
2158}
2159
2161 const SourceManager &SM) {
2162 // A simple interval overlap detection algorithm. Sorts all ranges by their
2163 // begin location then finds the first overlap in one pass.
2164 std::vector<const FixItHint *> All; // a copy of `FixIts`
2165
2166 for (const FixItHint &H : FixIts)
2167 All.push_back(&H);
2168 std::sort(All.begin(), All.end(),
2169 [&SM](const FixItHint *H1, const FixItHint *H2) {
2170 return SM.isBeforeInTranslationUnit(H1->RemoveRange.getBegin(),
2171 H2->RemoveRange.getBegin());
2172 });
2173
2174 const FixItHint *CurrHint = nullptr;
2175
2176 for (const FixItHint *Hint : All) {
2177 if (!CurrHint ||
2178 SM.isBeforeInTranslationUnit(CurrHint->RemoveRange.getEnd(),
2179 Hint->RemoveRange.getBegin())) {
2180 // Either to initialize `CurrHint` or `CurrHint` does not
2181 // overlap with `Hint`:
2182 CurrHint = Hint;
2183 } else
2184 // In case `Hint` overlaps the `CurrHint`, we found at least one
2185 // conflict:
2186 return true;
2187 }
2188 return false;
2189}
2190
2191std::optional<FixItList>
2192PtrToPtrAssignmentGadget::getFixits(const FixitStrategy &S) const {
2193 const auto *LeftVD = cast<VarDecl>(PtrLHS->getDecl());
2194 const auto *RightVD = cast<VarDecl>(PtrRHS->getDecl());
2195 switch (S.lookup(LeftVD)) {
2196 case FixitStrategy::Kind::Span:
2197 if (S.lookup(RightVD) == FixitStrategy::Kind::Span)
2198 return FixItList{};
2199 return std::nullopt;
2200 case FixitStrategy::Kind::Wontfix:
2201 return std::nullopt;
2202 case FixitStrategy::Kind::Iterator:
2203 case FixitStrategy::Kind::Array:
2204 return std::nullopt;
2205 case FixitStrategy::Kind::Vector:
2206 llvm_unreachable("unsupported strategies for FixableGadgets");
2207 }
2208 return std::nullopt;
2209}
2210
2211/// \returns fixit that adds .data() call after \DRE.
2212static inline std::optional<FixItList> createDataFixit(const ASTContext &Ctx,
2213 const DeclRefExpr *DRE);
2214
2215std::optional<FixItList>
2216CArrayToPtrAssignmentGadget::getFixits(const FixitStrategy &S) const {
2217 const auto *LeftVD = cast<VarDecl>(PtrLHS->getDecl());
2218 const auto *RightVD = cast<VarDecl>(PtrRHS->getDecl());
2219 // TLDR: Implementing fixits for non-Wontfix strategy on both LHS and RHS is
2220 // non-trivial.
2221 //
2222 // CArrayToPtrAssignmentGadget doesn't have strategy implications because
2223 // constant size array propagates its bounds. Because of that LHS and RHS are
2224 // addressed by two different fixits.
2225 //
2226 // At the same time FixitStrategy S doesn't reflect what group a fixit belongs
2227 // to and can't be generally relied on in multi-variable Fixables!
2228 //
2229 // E. g. If an instance of this gadget is fixing variable on LHS then the
2230 // variable on RHS is fixed by a different fixit and its strategy for LHS
2231 // fixit is as if Wontfix.
2232 //
2233 // The only exception is Wontfix strategy for a given variable as that is
2234 // valid for any fixit produced for the given input source code.
2235 if (S.lookup(LeftVD) == FixitStrategy::Kind::Span) {
2236 if (S.lookup(RightVD) == FixitStrategy::Kind::Wontfix) {
2237 return FixItList{};
2238 }
2239 } else if (S.lookup(LeftVD) == FixitStrategy::Kind::Wontfix) {
2240 if (S.lookup(RightVD) == FixitStrategy::Kind::Array) {
2241 return createDataFixit(RightVD->getASTContext(), PtrRHS);
2242 }
2243 }
2244 return std::nullopt;
2245}
2246
2247std::optional<FixItList>
2248PointerInitGadget::getFixits(const FixitStrategy &S) const {
2249 const auto *LeftVD = PtrInitLHS;
2250 const auto *RightVD = cast<VarDecl>(PtrInitRHS->getDecl());
2251 switch (S.lookup(LeftVD)) {
2252 case FixitStrategy::Kind::Span:
2253 if (S.lookup(RightVD) == FixitStrategy::Kind::Span)
2254 return FixItList{};
2255 return std::nullopt;
2256 case FixitStrategy::Kind::Wontfix:
2257 return std::nullopt;
2258 case FixitStrategy::Kind::Iterator:
2259 case FixitStrategy::Kind::Array:
2260 return std::nullopt;
2261 case FixitStrategy::Kind::Vector:
2262 llvm_unreachable("unsupported strategies for FixableGadgets");
2263 }
2264 return std::nullopt;
2265}
2266
2267static bool isNonNegativeIntegerExpr(const Expr *Expr, const VarDecl *VD,
2268 const ASTContext &Ctx) {
2269 if (auto ConstVal = Expr->getIntegerConstantExpr(Ctx)) {
2270 if (ConstVal->isNegative())
2271 return false;
2272 } else if (!Expr->getType()->isUnsignedIntegerType())
2273 return false;
2274 return true;
2275}
2276
2277std::optional<FixItList>
2278ULCArraySubscriptGadget::getFixits(const FixitStrategy &S) const {
2279 if (const auto *DRE =
2280 dyn_cast<DeclRefExpr>(Node->getBase()->IgnoreImpCasts()))
2281 if (const auto *VD = dyn_cast<VarDecl>(DRE->getDecl())) {
2282 switch (S.lookup(VD)) {
2283 case FixitStrategy::Kind::Span: {
2284
2285 // If the index has a negative constant value, we give up as no valid
2286 // fix-it can be generated:
2287 const ASTContext &Ctx = // FIXME: we need ASTContext to be passed in!
2288 VD->getASTContext();
2289 if (!isNonNegativeIntegerExpr(Node->getIdx(), VD, Ctx))
2290 return std::nullopt;
2291 // no-op is a good fix-it, otherwise
2292 return FixItList{};
2293 }
2294 case FixitStrategy::Kind::Array:
2295 return FixItList{};
2296 case FixitStrategy::Kind::Wontfix:
2297 case FixitStrategy::Kind::Iterator:
2298 case FixitStrategy::Kind::Vector:
2299 llvm_unreachable("unsupported strategies for FixableGadgets");
2300 }
2301 }
2302 return std::nullopt;
2303}
2304
2305static std::optional<FixItList> // forward declaration
2307
2308std::optional<FixItList>
2309UPCAddressofArraySubscriptGadget::getFixits(const FixitStrategy &S) const {
2310 auto DREs = getClaimedVarUseSites();
2311 const auto *VD = cast<VarDecl>(DREs.front()->getDecl());
2312
2313 switch (S.lookup(VD)) {
2314 case FixitStrategy::Kind::Span:
2316 case FixitStrategy::Kind::Wontfix:
2317 case FixitStrategy::Kind::Iterator:
2318 case FixitStrategy::Kind::Array:
2319 return std::nullopt;
2320 case FixitStrategy::Kind::Vector:
2321 llvm_unreachable("unsupported strategies for FixableGadgets");
2322 }
2323 return std::nullopt; // something went wrong, no fix-it
2324}
2325
2326// FIXME: this function should be customizable through format
2327static StringRef getEndOfLine() {
2328 static const char *const EOL = "\n";
2329 return EOL;
2330}
2331
2332// Returns the text indicating that the user needs to provide input there:
2333static std::string
2334getUserFillPlaceHolder(StringRef HintTextToUser = "placeholder") {
2335 std::string s = std::string("<# ");
2336 s += HintTextToUser;
2337 s += " #>";
2338 return s;
2339}
2340
2341// Return the source location of the last character of the AST `Node`.
2342template <typename NodeTy>
2343static std::optional<SourceLocation>
2344getEndCharLoc(const NodeTy *Node, const SourceManager &SM,
2345 const LangOptions &LangOpts) {
2346 unsigned TkLen = Lexer::MeasureTokenLength(Node->getEndLoc(), SM, LangOpts);
2347 SourceLocation Loc = Node->getEndLoc().getLocWithOffset(TkLen - 1);
2348
2349 if (Loc.isValid())
2350 return Loc;
2351
2352 return std::nullopt;
2353}
2354
2355// Return the source location just past the last character of the AST `Node`.
2356template <typename NodeTy>
2357static std::optional<SourceLocation> getPastLoc(const NodeTy *Node,
2358 const SourceManager &SM,
2359 const LangOptions &LangOpts) {
2361 Lexer::getLocForEndOfToken(Node->getEndLoc(), 0, SM, LangOpts);
2362 if (Loc.isValid())
2363 return Loc;
2364 return std::nullopt;
2365}
2366
2367// Return text representation of an `Expr`.
2368static std::optional<StringRef> getExprText(const Expr *E,
2369 const SourceManager &SM,
2370 const LangOptions &LangOpts) {
2371 std::optional<SourceLocation> LastCharLoc = getPastLoc(E, SM, LangOpts);
2372
2373 if (LastCharLoc)
2374 return Lexer::getSourceText(
2375 CharSourceRange::getCharRange(E->getBeginLoc(), *LastCharLoc), SM,
2376 LangOpts);
2377
2378 return std::nullopt;
2379}
2380
2381// Returns the literal text in `SourceRange SR`, if `SR` is a valid range.
2382static std::optional<StringRef> getRangeText(SourceRange SR,
2383 const SourceManager &SM,
2384 const LangOptions &LangOpts) {
2385 bool Invalid = false;
2387 StringRef Text = Lexer::getSourceText(CSR, SM, LangOpts, &Invalid);
2388
2389 if (!Invalid)
2390 return Text;
2391 return std::nullopt;
2392}
2393
2394// Returns the begin location of the identifier of the given variable
2395// declaration.
2397 // According to the implementation of `VarDecl`, `VD->getLocation()` actually
2398 // returns the begin location of the identifier of the declaration:
2399 return VD->getLocation();
2400}
2401
2402// Returns the literal text of the identifier of the given variable declaration.
2403static std::optional<StringRef>
2405 const LangOptions &LangOpts) {
2406 SourceLocation ParmIdentBeginLoc = getVarDeclIdentifierLoc(VD);
2407 SourceLocation ParmIdentEndLoc =
2408 Lexer::getLocForEndOfToken(ParmIdentBeginLoc, 0, SM, LangOpts);
2409
2410 if (ParmIdentEndLoc.isMacroID() &&
2411 !Lexer::isAtEndOfMacroExpansion(ParmIdentEndLoc, SM, LangOpts))
2412 return std::nullopt;
2413 return getRangeText({ParmIdentBeginLoc, ParmIdentEndLoc}, SM, LangOpts);
2414}
2415
2416// We cannot fix a variable declaration if it has some other specifiers than the
2417// type specifier. Because the source ranges of those specifiers could overlap
2418// with the source range that is being replaced using fix-its. Especially when
2419// we often cannot obtain accurate source ranges of cv-qualified type
2420// specifiers.
2421// FIXME: also deal with type attributes
2422static bool hasUnsupportedSpecifiers(const VarDecl *VD,
2423 const SourceManager &SM) {
2424 // AttrRangeOverlapping: true if at least one attribute of `VD` overlaps the
2425 // source range of `VD`:
2426 bool AttrRangeOverlapping = llvm::any_of(VD->attrs(), [&](Attr *At) -> bool {
2427 return !(SM.isBeforeInTranslationUnit(At->getRange().getEnd(),
2428 VD->getBeginLoc())) &&
2429 !(SM.isBeforeInTranslationUnit(VD->getEndLoc(),
2430 At->getRange().getBegin()));
2431 });
2432 return VD->isInlineSpecified() || VD->isConstexpr() ||
2434 AttrRangeOverlapping;
2435}
2436
2437// Returns the `SourceRange` of `D`. The reason why this function exists is
2438// that `D->getSourceRange()` may return a range where the end location is the
2439// starting location of the last token. The end location of the source range
2440// returned by this function is the last location of the last token.
2442 const SourceManager &SM,
2443 const LangOptions &LangOpts) {
2446 End = // `D->getEndLoc` should always return the starting location of the
2447 // last token, so we should get the end of the token
2448 Lexer::getLocForEndOfToken(D->getEndLoc(), 0, SM, LangOpts);
2449
2450 return SourceRange(Begin, End);
2451}
2452
2453// Returns the text of the pointee type of `T` from a `VarDecl` of a pointer
2454// type. The text is obtained through from `TypeLoc`s. Since `TypeLoc` does not
2455// have source ranges of qualifiers ( The `QualifiedTypeLoc` looks hacky too me
2456// :( ), `Qualifiers` of the pointee type is returned separately through the
2457// output parameter `QualifiersToAppend`.
2458static std::optional<std::string>
2460 const LangOptions &LangOpts,
2461 std::optional<Qualifiers> *QualifiersToAppend) {
2462 QualType Ty = VD->getType();
2463 QualType PteTy;
2464
2465 assert(Ty->isPointerType() && !Ty->isFunctionPointerType() &&
2466 "Expecting a VarDecl of type of pointer to object type");
2467 PteTy = Ty->getPointeeType();
2468
2470 TypeLoc PteTyLoc;
2471
2472 // We only deal with the cases that we know `TypeLoc::getNextTypeLoc` returns
2473 // the `TypeLoc` of the pointee type:
2474 switch (TyLoc.getTypeLocClass()) {
2475 case TypeLoc::ConstantArray:
2476 case TypeLoc::IncompleteArray:
2477 case TypeLoc::VariableArray:
2478 case TypeLoc::DependentSizedArray:
2479 case TypeLoc::Decayed:
2480 assert(isa<ParmVarDecl>(VD) && "An array type shall not be treated as a "
2481 "pointer type unless it decays.");
2482 PteTyLoc = TyLoc.getNextTypeLoc();
2483 break;
2484 case TypeLoc::Pointer:
2485 PteTyLoc = TyLoc.castAs<PointerTypeLoc>().getPointeeLoc();
2486 break;
2487 default:
2488 return std::nullopt;
2489 }
2490 if (PteTyLoc.isNull())
2491 // Sometimes we cannot get a useful `TypeLoc` for the pointee type, e.g.,
2492 // when the pointer type is `auto`.
2493 return std::nullopt;
2494
2496
2497 if (!(IdentLoc.isValid() && PteTyLoc.getSourceRange().isValid())) {
2498 // We are expecting these locations to be valid. But in some cases, they are
2499 // not all valid. It is a Clang bug to me and we are not responsible for
2500 // fixing it. So we will just give up for now when it happens.
2501 return std::nullopt;
2502 }
2503
2504 // Note that TypeLoc.getEndLoc() returns the begin location of the last token:
2505 SourceLocation PteEndOfTokenLoc =
2506 Lexer::getLocForEndOfToken(PteTyLoc.getEndLoc(), 0, SM, LangOpts);
2507
2508 if (!PteEndOfTokenLoc.isValid())
2509 // Sometimes we cannot get the end location of the pointee type, e.g., when
2510 // there are macros involved.
2511 return std::nullopt;
2512 if (!SM.isBeforeInTranslationUnit(PteEndOfTokenLoc, IdentLoc)) {
2513 // We only deal with the cases where the source text of the pointee type
2514 // appears on the left-hand side of the variable identifier completely,
2515 // including the following forms:
2516 // `T ident`,
2517 // `T ident[]`, where `T` is any type.
2518 // Examples of excluded cases are `T (*ident)[]` or `T ident[][n]`.
2519 return std::nullopt;
2520 }
2521 if (PteTy.hasQualifiers()) {
2522 // TypeLoc does not provide source ranges for qualifiers (it says it's
2523 // intentional but seems fishy to me), so we cannot get the full text
2524 // `PteTy` via source ranges.
2525 *QualifiersToAppend = PteTy.getQualifiers();
2526 }
2527 return getRangeText({PteTyLoc.getBeginLoc(), PteEndOfTokenLoc}, SM, LangOpts)
2528 ->str();
2529}
2530
2531// Returns the text of the name (with qualifiers) of a `FunctionDecl`.
2532static std::optional<StringRef> getFunNameText(const FunctionDecl *FD,
2533 const SourceManager &SM,
2534 const LangOptions &LangOpts) {
2535 SourceLocation BeginLoc = FD->getQualifier()
2537 : FD->getNameInfo().getBeginLoc();
2538 // Note that `FD->getNameInfo().getEndLoc()` returns the begin location of the
2539 // last token:
2541 FD->getNameInfo().getEndLoc(), 0, SM, LangOpts);
2542 SourceRange NameRange{BeginLoc, EndLoc};
2543
2544 return getRangeText(NameRange, SM, LangOpts);
2545}
2546
2547// Returns the text representing a `std::span` type where the element type is
2548// represented by `EltTyText`.
2549//
2550// Note the optional parameter `Qualifiers`: one needs to pass qualifiers
2551// explicitly if the element type needs to be qualified.
2552static std::string
2553getSpanTypeText(StringRef EltTyText,
2554 std::optional<Qualifiers> Quals = std::nullopt) {
2555 const char *const SpanOpen = "std::span<";
2556
2557 if (Quals)
2558 return SpanOpen + EltTyText.str() + ' ' + Quals->getAsString() + '>';
2559 return SpanOpen + EltTyText.str() + '>';
2560}
2561
2562std::optional<FixItList>
2564 const VarDecl *VD = dyn_cast<VarDecl>(BaseDeclRefExpr->getDecl());
2565
2566 if (VD && s.lookup(VD) == FixitStrategy::Kind::Span) {
2567 ASTContext &Ctx = VD->getASTContext();
2568 // std::span can't represent elements before its begin()
2569 if (auto ConstVal = Offset->getIntegerConstantExpr(Ctx))
2570 if (ConstVal->isNegative())
2571 return std::nullopt;
2572
2573 // note that the expr may (oddly) has multiple layers of parens
2574 // example:
2575 // *((..(pointer + 123)..))
2576 // goal:
2577 // pointer[123]
2578 // Fix-It:
2579 // remove '*('
2580 // replace ' + ' with '['
2581 // replace ')' with ']'
2582
2583 // example:
2584 // *((..(123 + pointer)..))
2585 // goal:
2586 // 123[pointer]
2587 // Fix-It:
2588 // remove '*('
2589 // replace ' + ' with '['
2590 // replace ')' with ']'
2591
2592 const Expr *LHS = AddOp->getLHS(), *RHS = AddOp->getRHS();
2593 const SourceManager &SM = Ctx.getSourceManager();
2594 const LangOptions &LangOpts = Ctx.getLangOpts();
2595 CharSourceRange StarWithTrailWhitespace =
2597 LHS->getBeginLoc());
2598
2599 std::optional<SourceLocation> LHSLocation = getPastLoc(LHS, SM, LangOpts);
2600 if (!LHSLocation)
2601 return std::nullopt;
2602
2603 CharSourceRange PlusWithSurroundingWhitespace =
2604 clang::CharSourceRange::getCharRange(*LHSLocation, RHS->getBeginLoc());
2605
2606 std::optional<SourceLocation> AddOpLocation =
2607 getPastLoc(AddOp, SM, LangOpts);
2608 std::optional<SourceLocation> DerefOpLocation =
2609 getPastLoc(DerefOp, SM, LangOpts);
2610
2611 if (!AddOpLocation || !DerefOpLocation)
2612 return std::nullopt;
2613
2614 CharSourceRange ClosingParenWithPrecWhitespace =
2615 clang::CharSourceRange::getCharRange(*AddOpLocation, *DerefOpLocation);
2616
2617 return FixItList{
2618 {FixItHint::CreateRemoval(StarWithTrailWhitespace),
2619 FixItHint::CreateReplacement(PlusWithSurroundingWhitespace, "["),
2620 FixItHint::CreateReplacement(ClosingParenWithPrecWhitespace, "]")}};
2621 }
2622 return std::nullopt; // something wrong or unsupported, give up
2623}
2624
2625std::optional<FixItList>
2626PointerDereferenceGadget::getFixits(const FixitStrategy &S) const {
2627 const VarDecl *VD = cast<VarDecl>(BaseDeclRefExpr->getDecl());
2628 switch (S.lookup(VD)) {
2629 case FixitStrategy::Kind::Span: {
2630 ASTContext &Ctx = VD->getASTContext();
2632 // Required changes: *(ptr); => (ptr[0]); and *ptr; => ptr[0]
2633 // Deletes the *operand
2635 Op->getBeginLoc(), Op->getBeginLoc().getLocWithOffset(1));
2636 // Inserts the [0]
2637 if (auto LocPastOperand =
2638 getPastLoc(BaseDeclRefExpr, SM, Ctx.getLangOpts())) {
2639 return FixItList{{FixItHint::CreateRemoval(derefRange),
2640 FixItHint::CreateInsertion(*LocPastOperand, "[0]")}};
2641 }
2642 break;
2643 }
2644 case FixitStrategy::Kind::Iterator:
2645 case FixitStrategy::Kind::Array:
2646 return std::nullopt;
2647 case FixitStrategy::Kind::Vector:
2648 llvm_unreachable("FixitStrategy not implemented yet!");
2649 case FixitStrategy::Kind::Wontfix:
2650 llvm_unreachable("Invalid strategy!");
2651 }
2652
2653 return std::nullopt;
2654}
2655
2656static inline std::optional<FixItList> createDataFixit(const ASTContext &Ctx,
2657 const DeclRefExpr *DRE) {
2658 const SourceManager &SM = Ctx.getSourceManager();
2659 // Inserts the .data() after the DRE
2660 std::optional<SourceLocation> EndOfOperand =
2661 getPastLoc(DRE, SM, Ctx.getLangOpts());
2662
2663 if (EndOfOperand)
2664 return FixItList{{FixItHint::CreateInsertion(*EndOfOperand, ".data()")}};
2665
2666 return std::nullopt;
2667}
2668
2669// Generates fix-its replacing an expression of the form UPC(DRE) with
2670// `DRE.data()`
2671std::optional<FixItList>
2672UPCStandalonePointerGadget::getFixits(const FixitStrategy &S) const {
2673 const auto VD = cast<VarDecl>(Node->getDecl());
2674 switch (S.lookup(VD)) {
2675 case FixitStrategy::Kind::Array:
2676 case FixitStrategy::Kind::Span: {
2677 return createDataFixit(VD->getASTContext(), Node);
2678 // FIXME: Points inside a macro expansion.
2679 break;
2680 }
2681 case FixitStrategy::Kind::Wontfix:
2682 case FixitStrategy::Kind::Iterator:
2683 return std::nullopt;
2684 case FixitStrategy::Kind::Vector:
2685 llvm_unreachable("unsupported strategies for FixableGadgets");
2686 }
2687
2688 return std::nullopt;
2689}
2690
2691// Generates fix-its replacing an expression of the form `&DRE[e]` with
2692// `&DRE.data()[e]`:
2693static std::optional<FixItList>
2695 const auto *ArraySub = cast<ArraySubscriptExpr>(Node->getSubExpr());
2696 const auto *DRE = cast<DeclRefExpr>(ArraySub->getBase()->IgnoreImpCasts());
2697 // FIXME: this `getASTContext` call is costly, we should pass the
2698 // ASTContext in:
2699 const ASTContext &Ctx = DRE->getDecl()->getASTContext();
2700 const Expr *Idx = ArraySub->getIdx();
2701 const SourceManager &SM = Ctx.getSourceManager();
2702 const LangOptions &LangOpts = Ctx.getLangOpts();
2703 std::stringstream SS;
2704 bool IdxIsLitZero = false;
2705
2706 if (auto ICE = Idx->getIntegerConstantExpr(Ctx))
2707 if ((*ICE).isZero())
2708 IdxIsLitZero = true;
2709 std::optional<StringRef> DreString = getExprText(DRE, SM, LangOpts);
2710 if (!DreString)
2711 return std::nullopt;
2712
2713 if (IdxIsLitZero) {
2714 // If the index is literal zero, we produce the most concise fix-it:
2715 SS << (*DreString).str() << ".data()";
2716 } else {
2717 std::optional<StringRef> IndexString = getExprText(Idx, SM, LangOpts);
2718 if (!IndexString)
2719 return std::nullopt;
2720
2721 SS << "&" << (*DreString).str() << ".data()"
2722 << "[" << (*IndexString).str() << "]";
2723 }
2724 return FixItList{
2726}
2727
2728std::optional<FixItList>
2730 DeclUseList DREs = getClaimedVarUseSites();
2731
2732 if (DREs.size() != 1)
2733 return std::nullopt; // In cases of `Ptr += n` where `Ptr` is not a DRE, we
2734 // give up
2735 if (const VarDecl *VD = dyn_cast<VarDecl>(DREs.front()->getDecl())) {
2736 if (S.lookup(VD) == FixitStrategy::Kind::Span) {
2737 FixItList Fixes;
2738
2739 const Stmt *AddAssignNode = Node;
2740 StringRef varName = VD->getName();
2741 const ASTContext &Ctx = VD->getASTContext();
2742
2743 if (!isNonNegativeIntegerExpr(Offset, VD, Ctx))
2744 return std::nullopt;
2745
2746 // To transform UUC(p += n) to UUC(p = p.subspan(..)):
2747 bool NotParenExpr =
2748 (Offset->IgnoreParens()->getBeginLoc() == Offset->getBeginLoc());
2749 std::string SS = varName.str() + " = " + varName.str() + ".subspan";
2750 if (NotParenExpr)
2751 SS += "(";
2752
2753 std::optional<SourceLocation> AddAssignLocation = getEndCharLoc(
2754 AddAssignNode, Ctx.getSourceManager(), Ctx.getLangOpts());
2755 if (!AddAssignLocation)
2756 return std::nullopt;
2757
2758 Fixes.push_back(FixItHint::CreateReplacement(
2759 SourceRange(AddAssignNode->getBeginLoc(), Node->getOperatorLoc()),
2760 SS));
2761 if (NotParenExpr)
2762 Fixes.push_back(FixItHint::CreateInsertion(
2763 Offset->getEndLoc().getLocWithOffset(1), ")"));
2764 return Fixes;
2765 }
2766 }
2767 return std::nullopt; // Not in the cases that we can handle for now, give up.
2768}
2769
2770std::optional<FixItList>
2772 DeclUseList DREs = getClaimedVarUseSites();
2773
2774 if (DREs.size() != 1)
2775 return std::nullopt; // In cases of `++Ptr` where `Ptr` is not a DRE, we
2776 // give up
2777 if (const VarDecl *VD = dyn_cast<VarDecl>(DREs.front()->getDecl())) {
2778 if (S.lookup(VD) == FixitStrategy::Kind::Span) {
2779 FixItList Fixes;
2780 std::stringstream SS;
2781 StringRef varName = VD->getName();
2782 const ASTContext &Ctx = VD->getASTContext();
2783
2784 // To transform UPC(++p) to UPC((p = p.subspan(1)).data()):
2785 SS << "(" << varName.data() << " = " << varName.data()
2786 << ".subspan(1)).data()";
2787 std::optional<SourceLocation> PreIncLocation =
2789 if (!PreIncLocation)
2790 return std::nullopt;
2791
2792 Fixes.push_back(FixItHint::CreateReplacement(
2793 SourceRange(Node->getBeginLoc(), *PreIncLocation), SS.str()));
2794 return Fixes;
2795 }
2796 }
2797 return std::nullopt; // Not in the cases that we can handle for now, give up.
2798}
2799
2800// For a non-null initializer `Init` of `T *` type, this function returns
2801// `FixItHint`s producing a list initializer `{Init, S}` as a part of a fix-it
2802// to output stream.
2803// In many cases, this function cannot figure out the actual extent `S`. It
2804// then will use a place holder to replace `S` to ask users to fill `S` in. The
2805// initializer shall be used to initialize a variable of type `std::span<T>`.
2806// In some cases (e. g. constant size array) the initializer should remain
2807// unchanged and the function returns empty list. In case the function can't
2808// provide the right fixit it will return nullopt.
2809//
2810// FIXME: Support multi-level pointers
2811//
2812// Parameters:
2813// `Init` a pointer to the initializer expression
2814// `Ctx` a reference to the ASTContext
2815static std::optional<FixItList>
2817 const StringRef UserFillPlaceHolder) {
2818 const SourceManager &SM = Ctx.getSourceManager();
2819 const LangOptions &LangOpts = Ctx.getLangOpts();
2820
2821 // If `Init` has a constant value that is (or equivalent to) a
2822 // NULL pointer, we use the default constructor to initialize the span
2823 // object, i.e., a `std:span` variable declaration with no initializer.
2824 // So the fix-it is just to remove the initializer.
2825 if (Init->isNullPointerConstant(
2826 Ctx,
2827 // FIXME: Why does this function not ask for `const ASTContext
2828 // &`? It should. Maybe worth an NFC patch later.
2830 NPC_ValueDependentIsNotNull)) {
2831 std::optional<SourceLocation> InitLocation =
2832 getEndCharLoc(Init, SM, LangOpts);
2833 if (!InitLocation)
2834 return std::nullopt;
2835
2836 SourceRange SR(Init->getBeginLoc(), *InitLocation);
2837
2838 return FixItList{FixItHint::CreateRemoval(SR)};
2839 }
2840
2841 FixItList FixIts{};
2842 std::string ExtentText = UserFillPlaceHolder.data();
2843 StringRef One = "1";
2844
2845 // Insert `{` before `Init`:
2846 FixIts.push_back(FixItHint::CreateInsertion(Init->getBeginLoc(), "{"));
2847 // Try to get the data extent. Break into different cases:
2848 if (auto CxxNew = dyn_cast<CXXNewExpr>(Init->IgnoreImpCasts())) {
2849 // In cases `Init` is `new T[n]` and there is no explicit cast over
2850 // `Init`, we know that `Init` must evaluates to a pointer to `n` objects
2851 // of `T`. So the extent is `n` unless `n` has side effects. Similar but
2852 // simpler for the case where `Init` is `new T`.
2853 if (const Expr *Ext = CxxNew->getArraySize().value_or(nullptr)) {
2854 if (!Ext->HasSideEffects(Ctx)) {
2855 std::optional<StringRef> ExtentString = getExprText(Ext, SM, LangOpts);
2856 if (!ExtentString)
2857 return std::nullopt;
2858 ExtentText = *ExtentString;
2859 }
2860 } else if (!CxxNew->isArray())
2861 // Although the initializer is not allocating a buffer, the pointer
2862 // variable could still be used in buffer access operations.
2863 ExtentText = One;
2864 } else if (Ctx.getAsConstantArrayType(Init->IgnoreImpCasts()->getType())) {
2865 // std::span has a single parameter constructor for initialization with
2866 // constant size array. The size is auto-deduced as the constructor is a
2867 // function template. The correct fixit is empty - no changes should happen.
2868 return FixItList{};
2869 } else {
2870 // In cases `Init` is of the form `&Var` after stripping of implicit
2871 // casts, where `&` is the built-in operator, the extent is 1.
2872 if (auto AddrOfExpr = dyn_cast<UnaryOperator>(Init->IgnoreImpCasts()))
2873 if (AddrOfExpr->getOpcode() == UnaryOperatorKind::UO_AddrOf &&
2874 isa_and_present<DeclRefExpr>(AddrOfExpr->getSubExpr()))
2875 ExtentText = One;
2876 // TODO: we can handle more cases, e.g., `&a[0]`, `&a`, `std::addressof`,
2877 // and explicit casting, etc. etc.
2878 }
2879
2880 SmallString<32> StrBuffer{};
2881 std::optional<SourceLocation> LocPassInit = getPastLoc(Init, SM, LangOpts);
2882
2883 if (!LocPassInit)
2884 return std::nullopt;
2885
2886 StrBuffer.append(", ");
2887 StrBuffer.append(ExtentText);
2888 StrBuffer.append("}");
2889 FixIts.push_back(FixItHint::CreateInsertion(*LocPassInit, StrBuffer.str()));
2890 return FixIts;
2891}
2892
2893#ifndef NDEBUG
2894#define DEBUG_NOTE_DECL_FAIL(D, Msg) \
2895 Handler.addDebugNoteForVar((D), (D)->getBeginLoc(), \
2896 "failed to produce fixit for declaration '" + \
2897 (D)->getNameAsString() + "'" + (Msg))
2898#else
2899#define DEBUG_NOTE_DECL_FAIL(D, Msg)
2900#endif
2901
2902// For the given variable declaration with a pointer-to-T type, returns the text
2903// `std::span<T>`. If it is unable to generate the text, returns
2904// `std::nullopt`.
2905static std::optional<std::string>
2907 assert(VD->getType()->isPointerType());
2908
2909 std::optional<Qualifiers> PteTyQualifiers = std::nullopt;
2910 std::optional<std::string> PteTyText = getPointeeTypeText(
2911 VD, Ctx.getSourceManager(), Ctx.getLangOpts(), &PteTyQualifiers);
2912
2913 if (!PteTyText)
2914 return std::nullopt;
2915
2916 std::string SpanTyText = "std::span<";
2917
2918 SpanTyText.append(*PteTyText);
2919 // Append qualifiers to span element type if any:
2920 if (PteTyQualifiers) {
2921 SpanTyText.append(" ");
2922 SpanTyText.append(PteTyQualifiers->getAsString());
2923 }
2924 SpanTyText.append(">");
2925 return SpanTyText;
2926}
2927
2928// For a `VarDecl` of the form `T * var (= Init)?`, this
2929// function generates fix-its that
2930// 1) replace `T * var` with `std::span<T> var`; and
2931// 2) change `Init` accordingly to a span constructor, if it exists.
2932//
2933// FIXME: support Multi-level pointers
2934//
2935// Parameters:
2936// `D` a pointer the variable declaration node
2937// `Ctx` a reference to the ASTContext
2938// `UserFillPlaceHolder` the user-input placeholder text
2939// Returns:
2940// the non-empty fix-it list, if fix-its are successfuly generated; empty
2941// list otherwise.
2942static FixItList fixLocalVarDeclWithSpan(const VarDecl *D, ASTContext &Ctx,
2943 const StringRef UserFillPlaceHolder,
2944 UnsafeBufferUsageHandler &Handler) {
2946 return {};
2947
2948 FixItList FixIts{};
2949 std::optional<std::string> SpanTyText = createSpanTypeForVarDecl(D, Ctx);
2950
2951 if (!SpanTyText) {
2952 DEBUG_NOTE_DECL_FAIL(D, " : failed to generate 'std::span' type");
2953 return {};
2954 }
2955
2956 // Will hold the text for `std::span<T> Ident`:
2957 std::stringstream SS;
2958
2959 SS << *SpanTyText;
2960 // Fix the initializer if it exists:
2961 if (const Expr *Init = D->getInit()) {
2962 std::optional<FixItList> InitFixIts =
2963 FixVarInitializerWithSpan(Init, Ctx, UserFillPlaceHolder);
2964 if (!InitFixIts)
2965 return {};
2966 FixIts.insert(FixIts.end(), std::make_move_iterator(InitFixIts->begin()),
2967 std::make_move_iterator(InitFixIts->end()));
2968 }
2969 // For declaration of the form `T * ident = init;`, we want to replace
2970 // `T * ` with `std::span<T>`.
2971 // We ignore CV-qualifiers so for `T * const ident;` we also want to replace
2972 // just `T *` with `std::span<T>`.
2973 const SourceLocation EndLocForReplacement = D->getTypeSpecEndLoc();
2974 if (!EndLocForReplacement.isValid()) {
2975 DEBUG_NOTE_DECL_FAIL(D, " : failed to locate the end of the declaration");
2976 return {};
2977 }
2978 // The only exception is that for `T *ident` we'll add a single space between
2979 // "std::span<T>" and "ident".
2980 // FIXME: The condition is false for identifiers expended from macros.
2981 if (EndLocForReplacement.getLocWithOffset(1) == getVarDeclIdentifierLoc(D))
2982 SS << " ";
2983
2984 FixIts.push_back(FixItHint::CreateReplacement(
2985 SourceRange(D->getBeginLoc(), EndLocForReplacement), SS.str()));
2986 return FixIts;
2987}
2988
2989static bool hasConflictingOverload(const FunctionDecl *FD) {
2990 return !FD->getDeclContext()->lookup(FD->getDeclName()).isSingleResult();
2991}
2992
2993// For a `FunctionDecl`, whose `ParmVarDecl`s are being changed to have new
2994// types, this function produces fix-its to make the change self-contained. Let
2995// 'F' be the entity defined by the original `FunctionDecl` and "NewF" be the
2996// entity defined by the `FunctionDecl` after the change to the parameters.
2997// Fix-its produced by this function are
2998// 1. Add the `[[clang::unsafe_buffer_usage]]` attribute to each declaration
2999// of 'F';
3000// 2. Create a declaration of "NewF" next to each declaration of `F`;
3001// 3. Create a definition of "F" (as its' original definition is now belongs
3002// to "NewF") next to its original definition. The body of the creating
3003// definition calls to "NewF".
3004//
3005// Example:
3006//
3007// void f(int *p); // original declaration
3008// void f(int *p) { // original definition
3009// p[5];
3010// }
3011//
3012// To change the parameter `p` to be of `std::span<int>` type, we
3013// also add overloads:
3014//
3015// [[clang::unsafe_buffer_usage]] void f(int *p); // original decl
3016// void f(std::span<int> p); // added overload decl
3017// void f(std::span<int> p) { // original def where param is changed
3018// p[5];
3019// }
3020// [[clang::unsafe_buffer_usage]] void f(int *p) { // added def
3021// return f(std::span(p, <# size #>));
3022// }
3023//
3024static std::optional<FixItList>
3026 const ASTContext &Ctx,
3027 UnsafeBufferUsageHandler &Handler) {
3028 // FIXME: need to make this conflict checking better:
3029 if (hasConflictingOverload(FD))
3030 return std::nullopt;
3031
3032 const SourceManager &SM = Ctx.getSourceManager();
3033 const LangOptions &LangOpts = Ctx.getLangOpts();
3034 const unsigned NumParms = FD->getNumParams();
3035 std::vector<std::string> NewTysTexts(NumParms);
3036 std::vector<bool> ParmsMask(NumParms, false);
3037 bool AtLeastOneParmToFix = false;
3038
3039 for (unsigned i = 0; i < NumParms; i++) {
3040 const ParmVarDecl *PVD = FD->getParamDecl(i);
3041
3042 if (S.lookup(PVD) == FixitStrategy::Kind::Wontfix)
3043 continue;
3044 if (S.lookup(PVD) != FixitStrategy::Kind::Span)
3045 // Not supported, not suppose to happen:
3046 return std::nullopt;
3047
3048 std::optional<Qualifiers> PteTyQuals = std::nullopt;
3049 std::optional<std::string> PteTyText =
3050 getPointeeTypeText(PVD, SM, LangOpts, &PteTyQuals);
3051
3052 if (!PteTyText)
3053 // something wrong in obtaining the text of the pointee type, give up
3054 return std::nullopt;
3055 // FIXME: whether we should create std::span type depends on the
3056 // FixitStrategy.
3057 NewTysTexts[i] = getSpanTypeText(*PteTyText, PteTyQuals);
3058 ParmsMask[i] = true;
3059 AtLeastOneParmToFix = true;
3060 }
3061 if (!AtLeastOneParmToFix)
3062 // No need to create function overloads:
3063 return {};
3064 // FIXME Respect indentation of the original code.
3065
3066 // A lambda that creates the text representation of a function declaration
3067 // with the new type signatures:
3068 const auto NewOverloadSignatureCreator =
3069 [&SM, &LangOpts, &NewTysTexts,
3070 &ParmsMask](const FunctionDecl *FD) -> std::optional<std::string> {
3071 std::stringstream SS;
3072
3073 SS << ";";
3074 SS << getEndOfLine().str();
3075 // Append: ret-type func-name "("
3076 if (auto Prefix = getRangeText(
3077 SourceRange(FD->getBeginLoc(), (*FD->param_begin())->getBeginLoc()),
3078 SM, LangOpts))
3079 SS << Prefix->str();
3080 else
3081 return std::nullopt; // give up
3082 // Append: parameter-type-list
3083 const unsigned NumParms = FD->getNumParams();
3084
3085 for (unsigned i = 0; i < NumParms; i++) {
3086 const ParmVarDecl *Parm = FD->getParamDecl(i);
3087
3088 if (Parm->isImplicit())
3089 continue;
3090 if (ParmsMask[i]) {
3091 // This `i`-th parameter will be fixed with `NewTysTexts[i]` being its
3092 // new type:
3093 SS << NewTysTexts[i];
3094 // print parameter name if provided:
3095 if (IdentifierInfo *II = Parm->getIdentifier())
3096 SS << ' ' << II->getName().str();
3097 } else if (auto ParmTypeText =
3098 getRangeText(getSourceRangeToTokenEnd(Parm, SM, LangOpts),
3099 SM, LangOpts)) {
3100 // print the whole `Parm` without modification:
3101 SS << ParmTypeText->str();
3102 } else
3103 return std::nullopt; // something wrong, give up
3104 if (i != NumParms - 1)
3105 SS << ", ";
3106 }
3107 SS << ")";
3108 return SS.str();
3109 };
3110
3111 // A lambda that creates the text representation of a function definition with
3112 // the original signature:
3113 const auto OldOverloadDefCreator =
3114 [&Handler, &SM, &LangOpts, &NewTysTexts,
3115 &ParmsMask](const FunctionDecl *FD) -> std::optional<std::string> {
3116 std::stringstream SS;
3117
3118 SS << getEndOfLine().str();
3119 // Append: attr-name ret-type func-name "(" param-list ")" "{"
3120 if (auto FDPrefix = getRangeText(
3121 SourceRange(FD->getBeginLoc(), FD->getBody()->getBeginLoc()), SM,
3122 LangOpts))
3123 SS << Handler.getUnsafeBufferUsageAttributeTextAt(FD->getBeginLoc(), " ")
3124 << FDPrefix->str() << "{";
3125 else
3126 return std::nullopt;
3127 // Append: "return" func-name "("
3128 if (auto FunQualName = getFunNameText(FD, SM, LangOpts))
3129 SS << "return " << FunQualName->str() << "(";
3130 else
3131 return std::nullopt;
3132
3133 // Append: arg-list
3134 const unsigned NumParms = FD->getNumParams();
3135 for (unsigned i = 0; i < NumParms; i++) {
3136 const ParmVarDecl *Parm = FD->getParamDecl(i);
3137
3138 if (Parm->isImplicit())
3139 continue;
3140 // FIXME: If a parameter has no name, it is unused in the
3141 // definition. So we could just leave it as it is.
3142 if (!Parm->getIdentifier())
3143 // If a parameter of a function definition has no name:
3144 return std::nullopt;
3145 if (ParmsMask[i])
3146 // This is our spanified paramter!
3147 SS << NewTysTexts[i] << "(" << Parm->getIdentifier()->getName().str()
3148 << ", " << getUserFillPlaceHolder("size") << ")";
3149 else
3150 SS << Parm->getIdentifier()->getName().str();
3151 if (i != NumParms - 1)
3152 SS << ", ";
3153 }
3154 // finish call and the body
3155 SS << ");}" << getEndOfLine().str();
3156 // FIXME: 80-char line formatting?
3157 return SS.str();
3158 };
3159
3160 FixItList FixIts{};
3161 for (FunctionDecl *FReDecl : FD->redecls()) {
3162 std::optional<SourceLocation> Loc = getPastLoc(FReDecl, SM, LangOpts);
3163
3164 if (!Loc)
3165 return {};
3166 if (FReDecl->isThisDeclarationADefinition()) {
3167 assert(FReDecl == FD && "inconsistent function definition");
3168 // Inserts a definition with the old signature to the end of
3169 // `FReDecl`:
3170 if (auto OldOverloadDef = OldOverloadDefCreator(FReDecl))
3171 FixIts.emplace_back(FixItHint::CreateInsertion(*Loc, *OldOverloadDef));
3172 else
3173 return {}; // give up
3174 } else {
3175 // Adds the unsafe-buffer attribute (if not already there) to `FReDecl`:
3176 if (!FReDecl->hasAttr<UnsafeBufferUsageAttr>()) {
3177 FixIts.emplace_back(FixItHint::CreateInsertion(
3178 FReDecl->getBeginLoc(), Handler.getUnsafeBufferUsageAttributeTextAt(
3179 FReDecl->getBeginLoc(), " ")));
3180 }
3181 // Inserts a declaration with the new signature to the end of `FReDecl`:
3182 if (auto NewOverloadDecl = NewOverloadSignatureCreator(FReDecl))
3183 FixIts.emplace_back(FixItHint::CreateInsertion(*Loc, *NewOverloadDecl));
3184 else
3185 return {};
3186 }
3187 }
3188 return FixIts;
3189}
3190
3191// To fix a `ParmVarDecl` to be of `std::span` type.
3192static FixItList fixParamWithSpan(const ParmVarDecl *PVD, const ASTContext &Ctx,
3193 UnsafeBufferUsageHandler &Handler) {
3195 DEBUG_NOTE_DECL_FAIL(PVD, " : has unsupport specifier(s)");
3196 return {};
3197 }
3198 if (PVD->hasDefaultArg()) {
3199 // FIXME: generate fix-its for default values:
3200 DEBUG_NOTE_DECL_FAIL(PVD, " : has default arg");
3201 return {};
3202 }
3203
3204 std::optional<Qualifiers> PteTyQualifiers = std::nullopt;
3205 std::optional<std::string> PteTyText = getPointeeTypeText(
3206 PVD, Ctx.getSourceManager(), Ctx.getLangOpts(), &PteTyQualifiers);
3207
3208 if (!PteTyText) {
3209 DEBUG_NOTE_DECL_FAIL(PVD, " : invalid pointee type");
3210 return {};
3211 }
3212
3213 std::optional<StringRef> PVDNameText = PVD->getIdentifier()->getName();
3214
3215 if (!PVDNameText) {
3216 DEBUG_NOTE_DECL_FAIL(PVD, " : invalid identifier name");
3217 return {};
3218 }
3219
3220 std::stringstream SS;
3221 std::optional<std::string> SpanTyText = createSpanTypeForVarDecl(PVD, Ctx);
3222
3223 if (PteTyQualifiers)
3224 // Append qualifiers if they exist:
3225 SS << getSpanTypeText(*PteTyText, PteTyQualifiers);
3226 else
3227 SS << getSpanTypeText(*PteTyText);
3228 // Append qualifiers to the type of the parameter:
3229 if (PVD->getType().hasQualifiers())
3230 SS << ' ' << PVD->getType().getQualifiers().getAsString();
3231 // Append parameter's name:
3232 SS << ' ' << PVDNameText->str();
3233 // Add replacement fix-it:
3234 return {FixItHint::CreateReplacement(PVD->getSourceRange(), SS.str())};
3235}
3236
3237static FixItList fixVariableWithSpan(const VarDecl *VD,
3238 const DeclUseTracker &Tracker,
3239 ASTContext &Ctx,
3240 UnsafeBufferUsageHandler &Handler) {
3241 const DeclStmt *DS = Tracker.lookupDecl(VD);
3242 if (!DS) {
3244 " : variables declared this way not implemented yet");
3245 return {};
3246 }
3247 if (!DS->isSingleDecl()) {
3248 // FIXME: to support handling multiple `VarDecl`s in a single `DeclStmt`
3249 DEBUG_NOTE_DECL_FAIL(VD, " : multiple VarDecls");
3250 return {};
3251 }
3252 // Currently DS is an unused variable but we'll need it when
3253 // non-single decls are implemented, where the pointee type name
3254 // and the '*' are spread around the place.
3255 (void)DS;
3256
3257 // FIXME: handle cases where DS has multiple declarations
3258 return fixLocalVarDeclWithSpan(VD, Ctx, getUserFillPlaceHolder(), Handler);
3259}
3260
3261static FixItList fixVarDeclWithArray(const VarDecl *D, const ASTContext &Ctx,
3262 UnsafeBufferUsageHandler &Handler) {
3263 FixItList FixIts{};
3264
3265 // Note: the code below expects the declaration to not use any type sugar like
3266 // typedef.
3267 if (auto CAT = Ctx.getAsConstantArrayType(D->getType())) {
3268 const QualType &ArrayEltT = CAT->getElementType();
3269 assert(!ArrayEltT.isNull() && "Trying to fix a non-array type variable!");
3270 // FIXME: support multi-dimensional arrays
3271 if (isa<clang::ArrayType>(ArrayEltT.getCanonicalType()))
3272 return {};
3273
3275
3276 // Get the spelling of the element type as written in the source file
3277 // (including macros, etc.).
3278 auto MaybeElemTypeTxt =
3280 Ctx.getLangOpts());
3281 if (!MaybeElemTypeTxt)
3282 return {};
3283 const llvm::StringRef ElemTypeTxt = MaybeElemTypeTxt->trim();
3284
3285 // Find the '[' token.
3286 std::optional<Token> NextTok = Lexer::findNextToken(
3288 while (NextTok && !NextTok->is(tok::l_square) &&
3289 NextTok->getLocation() <= D->getSourceRange().getEnd())
3290 NextTok = Lexer::findNextToken(NextTok->getLocation(),
3291 Ctx.getSourceManager(), Ctx.getLangOpts());
3292 if (!NextTok)
3293 return {};
3294 const SourceLocation LSqBracketLoc = NextTok->getLocation();
3295
3296 // Get the spelling of the array size as written in the source file
3297 // (including macros, etc.).
3298 auto MaybeArraySizeTxt = getRangeText(
3299 {LSqBracketLoc.getLocWithOffset(1), D->getTypeSpecEndLoc()},
3300 Ctx.getSourceManager(), Ctx.getLangOpts());
3301 if (!MaybeArraySizeTxt)
3302 return {};
3303 const llvm::StringRef ArraySizeTxt = MaybeArraySizeTxt->trim();
3304 if (ArraySizeTxt.empty()) {
3305 // FIXME: Support array size getting determined from the initializer.
3306 // Examples:
3307 // int arr1[] = {0, 1, 2};
3308 // int arr2{3, 4, 5};
3309 // We might be able to preserve the non-specified size with `auto` and
3310 // `std::to_array`:
3311 // auto arr1 = std::to_array<int>({0, 1, 2});
3312 return {};
3313 }
3314
3315 std::optional<StringRef> IdentText =
3317
3318 if (!IdentText) {
3319 DEBUG_NOTE_DECL_FAIL(D, " : failed to locate the identifier");
3320 return {};
3321 }
3322
3323 SmallString<32> Replacement;
3324 raw_svector_ostream OS(Replacement);
3325 OS << "std::array<" << ElemTypeTxt << ", " << ArraySizeTxt << "> "
3326 << IdentText->str();
3327
3328 FixIts.push_back(FixItHint::CreateReplacement(
3329 SourceRange{D->getBeginLoc(), D->getTypeSpecEndLoc()}, OS.str()));
3330 }
3331
3332 return FixIts;
3333}
3334
3335static FixItList fixVariableWithArray(const VarDecl *VD,
3336 const DeclUseTracker &Tracker,
3337 const ASTContext &Ctx,
3338 UnsafeBufferUsageHandler &Handler) {
3339 const DeclStmt *DS = Tracker.lookupDecl(VD);
3340 assert(DS && "Fixing non-local variables not implemented yet!");
3341 if (!DS->isSingleDecl()) {
3342 // FIXME: to support handling multiple `VarDecl`s in a single `DeclStmt`
3343 return {};
3344 }
3345 // Currently DS is an unused variable but we'll need it when
3346 // non-single decls are implemented, where the pointee type name
3347 // and the '*' are spread around the place.
3348 (void)DS;
3349
3350 // FIXME: handle cases where DS has multiple declarations
3351 return fixVarDeclWithArray(VD, Ctx, Handler);
3352}
3353
3354// TODO: we should be consistent to use `std::nullopt` to represent no-fix due
3355// to any unexpected problem.
3356static FixItList
3358 /* The function decl under analysis */ const Decl *D,
3359 const DeclUseTracker &Tracker, ASTContext &Ctx,
3360 UnsafeBufferUsageHandler &Handler) {
3361 if (const auto *PVD = dyn_cast<ParmVarDecl>(VD)) {
3362 auto *FD = dyn_cast<clang::FunctionDecl>(PVD->getDeclContext());
3363 if (!FD || FD != D) {
3364 // `FD != D` means that `PVD` belongs to a function that is not being
3365 // analyzed currently. Thus `FD` may not be complete.
3366 DEBUG_NOTE_DECL_FAIL(VD, " : function not currently analyzed");
3367 return {};
3368 }
3369
3370 // TODO If function has a try block we can't change params unless we check
3371 // also its catch block for their use.
3372 // FIXME We might support static class methods, some select methods,
3373 // operators and possibly lamdas.
3374 if (FD->isMain() || FD->isConstexpr() ||
3375 FD->getTemplatedKind() != FunctionDecl::TemplatedKind::TK_NonTemplate ||
3376 FD->isVariadic() ||
3377 // also covers call-operator of lamdas
3378 isa<CXXMethodDecl>(FD) ||
3379 // skip when the function body is a try-block
3380 (FD->hasBody() && isa<CXXTryStmt>(FD->getBody())) ||
3381 FD->isOverloadedOperator()) {
3382 DEBUG_NOTE_DECL_FAIL(VD, " : unsupported function decl");
3383 return {}; // TODO test all these cases
3384 }
3385 }
3386
3387 switch (K) {
3388 case FixitStrategy::Kind::Span: {
3389 if (VD->getType()->isPointerType()) {
3390 if (const auto *PVD = dyn_cast<ParmVarDecl>(VD))
3391 return fixParamWithSpan(PVD, Ctx, Handler);
3392
3393 if (VD->isLocalVarDecl())
3394 return fixVariableWithSpan(VD, Tracker, Ctx, Handler);
3395 }
3396 DEBUG_NOTE_DECL_FAIL(VD, " : not a pointer");
3397 return {};
3398 }
3399 case FixitStrategy::Kind::Array: {
3400 if (VD->isLocalVarDecl() && Ctx.getAsConstantArrayType(VD->getType()))
3401 return fixVariableWithArray(VD, Tracker, Ctx, Handler);
3402
3403 DEBUG_NOTE_DECL_FAIL(VD, " : not a local const-size array");
3404 return {};
3405 }
3406 case FixitStrategy::Kind::Iterator:
3407 case FixitStrategy::Kind::Vector:
3408 llvm_unreachable("FixitStrategy not implemented yet!");
3409 case FixitStrategy::Kind::Wontfix:
3410 llvm_unreachable("Invalid strategy!");
3411 }
3412 llvm_unreachable("Unknown strategy!");
3413}
3414
3415// Returns true iff there exists a `FixItHint` 'h' in `FixIts` such that the
3416// `RemoveRange` of 'h' overlaps with a macro use.
3417static bool overlapWithMacro(const FixItList &FixIts) {
3418 // FIXME: For now we only check if the range (or the first token) is (part of)
3419 // a macro expansion. Ideally, we want to check for all tokens in the range.
3420 return llvm::any_of(FixIts, [](const FixItHint &Hint) {
3421 auto Range = Hint.RemoveRange;
3423 // If the range (or the first token) is (part of) a macro expansion:
3424 return true;
3425 return false;
3426 });
3427}
3428
3429// Returns true iff `VD` is a parameter of the declaration `D`:
3430static bool isParameterOf(const VarDecl *VD, const Decl *D) {
3431 return isa<ParmVarDecl>(VD) &&
3432 VD->getDeclContext() == dyn_cast<DeclContext>(D);
3433}
3434
3435// Erases variables in `FixItsForVariable`, if such a variable has an unfixable
3436// group mate. A variable `v` is unfixable iff `FixItsForVariable` does not
3437// contain `v`.
3439 std::map<const VarDecl *, FixItList> &FixItsForVariable,
3440 const VariableGroupsManager &VarGrpMgr) {
3441 // Variables will be removed from `FixItsForVariable`:
3443
3444 for (const auto &[VD, Ignore] : FixItsForVariable) {
3445 VarGrpRef Grp = VarGrpMgr.getGroupOfVar(VD);
3446 if (llvm::any_of(Grp,
3447 [&FixItsForVariable](const VarDecl *GrpMember) -> bool {
3448 return !FixItsForVariable.count(GrpMember);
3449 })) {
3450 // At least one group member cannot be fixed, so we have to erase the
3451 // whole group:
3452 for (const VarDecl *Member : Grp)
3453 ToErase.push_back(Member);
3454 }
3455 }
3456 for (auto *VarToErase : ToErase)
3457 FixItsForVariable.erase(VarToErase);
3458}
3459
3460// Returns the fix-its that create bounds-safe function overloads for the
3461// function `D`, if `D`'s parameters will be changed to safe-types through
3462// fix-its in `FixItsForVariable`.
3463//
3464// NOTE: In case `D`'s parameters will be changed but bounds-safe function
3465// overloads cannot created, the whole group that contains the parameters will
3466// be erased from `FixItsForVariable`.
3468 std::map<const VarDecl *, FixItList> &FixItsForVariable /* mutable */,
3469 const VariableGroupsManager &VarGrpMgr, const FunctionDecl *FD,
3470 const FixitStrategy &S, ASTContext &Ctx,
3471 UnsafeBufferUsageHandler &Handler) {
3472 FixItList FixItsSharedByParms{};
3473
3474 std::optional<FixItList> OverloadFixes =
3475 createOverloadsForFixedParams(S, FD, Ctx, Handler);
3476
3477 if (OverloadFixes) {
3478 FixItsSharedByParms.append(*OverloadFixes);
3479 } else {
3480 // Something wrong in generating `OverloadFixes`, need to remove the
3481 // whole group, where parameters are in, from `FixItsForVariable` (Note
3482 // that all parameters should be in the same group):
3483 for (auto *Member : VarGrpMgr.getGroupOfParms())
3484 FixItsForVariable.erase(Member);
3485 }
3486 return FixItsSharedByParms;
3487}
3488
3489// Constructs self-contained fix-its for each variable in `FixablesForAllVars`.
3490static std::map<const VarDecl *, FixItList>
3491getFixIts(FixableGadgetSets &FixablesForAllVars, const FixitStrategy &S,
3492 ASTContext &Ctx,
3493 /* The function decl under analysis */ const Decl *D,
3494 const DeclUseTracker &Tracker, UnsafeBufferUsageHandler &Handler,
3495 const VariableGroupsManager &VarGrpMgr) {
3496 // `FixItsForVariable` will map each variable to a set of fix-its directly
3497 // associated to the variable itself. Fix-its of distinct variables in
3498 // `FixItsForVariable` are disjoint.
3499 std::map<const VarDecl *, FixItList> FixItsForVariable;
3500
3501 // Populate `FixItsForVariable` with fix-its directly associated with each
3502 // variable. Fix-its directly associated to a variable 'v' are the ones
3503 // produced by the `FixableGadget`s whose claimed variable is 'v'.
3504 for (const auto &[VD, Fixables] : FixablesForAllVars.byVar) {
3505 FixItsForVariable[VD] =
3506 fixVariable(VD, S.lookup(VD), D, Tracker, Ctx, Handler);
3507 // If we fail to produce Fix-It for the declaration we have to skip the
3508 // variable entirely.
3509 if (FixItsForVariable[VD].empty()) {
3510 FixItsForVariable.erase(VD);
3511 continue;
3512 }
3513 for (const auto &F : Fixables) {
3514 std::optional<FixItList> Fixits = F->getFixits(S);
3515
3516 if (Fixits) {
3517 FixItsForVariable[VD].insert(FixItsForVariable[VD].end(),
3518 Fixits->begin(), Fixits->end());
3519 continue;
3520 }
3521#ifndef NDEBUG
3522 Handler.addDebugNoteForVar(
3523 VD, F->getSourceLoc(),
3524 ("gadget '" + F->getDebugName() + "' refused to produce a fix")
3525 .str());
3526#endif
3527 FixItsForVariable.erase(VD);
3528 break;
3529 }
3530 }
3531
3532 // `FixItsForVariable` now contains only variables that can be
3533 // fixed. A variable can be fixed if its' declaration and all Fixables
3534 // associated to it can all be fixed.
3535
3536 // To further remove from `FixItsForVariable` variables whose group mates
3537 // cannot be fixed...
3538 eraseVarsForUnfixableGroupMates(FixItsForVariable, VarGrpMgr);
3539 // Now `FixItsForVariable` gets further reduced: a variable is in
3540 // `FixItsForVariable` iff it can be fixed and all its group mates can be
3541 // fixed.
3542
3543 // Fix-its of bounds-safe overloads of `D` are shared by parameters of `D`.
3544 // That is, when fixing multiple parameters in one step, these fix-its will
3545 // be applied only once (instead of being applied per parameter).
3546 FixItList FixItsSharedByParms{};
3547
3548 if (auto *FD = dyn_cast<FunctionDecl>(D))
3549 FixItsSharedByParms = createFunctionOverloadsForParms(
3550 FixItsForVariable, VarGrpMgr, FD, S, Ctx, Handler);
3551
3552 // The map that maps each variable `v` to fix-its for the whole group where
3553 // `v` is in:
3554 std::map<const VarDecl *, FixItList> FinalFixItsForVariable{
3555 FixItsForVariable};
3556
3557 for (auto &[Var, Ignore] : FixItsForVariable) {
3558 bool AnyParm = false;
3559 const auto VarGroupForVD = VarGrpMgr.getGroupOfVar(Var, &AnyParm);
3560
3561 for (const VarDecl *GrpMate : VarGroupForVD) {
3562 if (Var == GrpMate)
3563 continue;
3564 if (FixItsForVariable.count(GrpMate))
3565 FinalFixItsForVariable[Var].append(FixItsForVariable[GrpMate]);
3566 }
3567 if (AnyParm) {
3568 // This assertion should never fail. Otherwise we have a bug.
3569 assert(!FixItsSharedByParms.empty() &&
3570 "Should not try to fix a parameter that does not belong to a "
3571 "FunctionDecl");
3572 FinalFixItsForVariable[Var].append(FixItsSharedByParms);
3573 }
3574 }
3575 // Fix-its that will be applied in one step shall NOT:
3576 // 1. overlap with macros or/and templates; or
3577 // 2. conflict with each other.
3578 // Otherwise, the fix-its will be dropped.
3579 for (auto Iter = FinalFixItsForVariable.begin();
3580 Iter != FinalFixItsForVariable.end();)
3581 if (overlapWithMacro(Iter->second) ||
3583 Iter = FinalFixItsForVariable.erase(Iter);
3584 } else
3585 Iter++;
3586 return FinalFixItsForVariable;
3587}
3588
3589template <typename VarDeclIterTy>
3590static FixitStrategy
3591getNaiveStrategy(llvm::iterator_range<VarDeclIterTy> UnsafeVars) {
3592 FixitStrategy S;
3593 for (const VarDecl *VD : UnsafeVars) {
3594 if (isa<ConstantArrayType>(VD->getType().getCanonicalType()))
3595 S.set(VD, FixitStrategy::Kind::Array);
3596 else
3597 S.set(VD, FixitStrategy::Kind::Span);
3598 }
3599 return S;
3600}
3601
3602// Manages variable groups:
3604 const std::vector<VarGrpTy> Groups;
3605 const std::map<const VarDecl *, unsigned> &VarGrpMap;
3606 const llvm::SetVector<const VarDecl *> &GrpsUnionForParms;
3607
3608public:
3610 const std::vector<VarGrpTy> &Groups,
3611 const std::map<const VarDecl *, unsigned> &VarGrpMap,
3612 const llvm::SetVector<const VarDecl *> &GrpsUnionForParms)
3613 : Groups(Groups), VarGrpMap(VarGrpMap),
3614 GrpsUnionForParms(GrpsUnionForParms) {}
3615
3616 VarGrpRef getGroupOfVar(const VarDecl *Var, bool *HasParm) const override {
3617 if (GrpsUnionForParms.contains(Var)) {
3618 if (HasParm)
3619 *HasParm = true;
3620 return GrpsUnionForParms.getArrayRef();
3621 }
3622 if (HasParm)
3623 *HasParm = false;
3624
3625 auto It = VarGrpMap.find(Var);
3626
3627 if (It == VarGrpMap.end())
3628 return {};
3629 return Groups[It->second];
3630 }
3631
3632 VarGrpRef getGroupOfParms() const override {
3633 return GrpsUnionForParms.getArrayRef();
3634 }
3635};
3636
3637void applyGadgets(const Decl *D, FixableGadgetList FixableGadgets,
3638 WarningGadgetList WarningGadgets, DeclUseTracker Tracker,
3639 UnsafeBufferUsageHandler &Handler, bool EmitSuggestions) {
3640 if (!EmitSuggestions) {
3641 // Our job is very easy without suggestions. Just warn about
3642 // every problematic operation and consider it done. No need to deal
3643 // with fixable gadgets, no need to group operations by variable.
3644 for (const auto &G : WarningGadgets) {
3645 G->handleUnsafeOperation(Handler, /*IsRelatedToDecl=*/false,
3646 D->getASTContext());
3647 }
3648
3649 // This return guarantees that most of the machine doesn't run when
3650 // suggestions aren't requested.
3651 assert(FixableGadgets.size() == 0 &&
3652 "Fixable gadgets found but suggestions not requested!");
3653 return;
3654 }
3655
3656 // If no `WarningGadget`s ever matched, there is no unsafe operations in the
3657 // function under the analysis. No need to fix any Fixables.
3658 if (!WarningGadgets.empty()) {
3659 // Gadgets "claim" variables they're responsible for. Once this loop
3660 // finishes, the tracker will only track DREs that weren't claimed by any
3661 // gadgets, i.e. not understood by the analysis.
3662 for (const auto &G : FixableGadgets) {
3663 for (const auto *DRE : G->getClaimedVarUseSites()) {
3664 Tracker.claimUse(DRE);
3665 }
3666 }
3667 }
3668
3669 // If no `WarningGadget`s ever matched, there is no unsafe operations in the
3670 // function under the analysis. Thus, it early returns here as there is
3671 // nothing needs to be fixed.
3672 //
3673 // Note this claim is based on the assumption that there is no unsafe
3674 // variable whose declaration is invisible from the analyzing function.
3675 // Otherwise, we need to consider if the uses of those unsafe varuables needs
3676 // fix.
3677 // So far, we are not fixing any global variables or class members. And,
3678 // lambdas will be analyzed along with the enclosing function. So this early
3679 // return is correct for now.
3680 if (WarningGadgets.empty())
3681 return;
3682
3683 WarningGadgetSets UnsafeOps =
3684 groupWarningGadgetsByVar(std::move(WarningGadgets));
3685 FixableGadgetSets FixablesForAllVars =
3686 groupFixablesByVar(std::move(FixableGadgets));
3687
3688 std::map<const VarDecl *, FixItList> FixItsForVariableGroup;
3689
3690 // Filter out non-local vars and vars with unclaimed DeclRefExpr-s.
3691 for (auto it = FixablesForAllVars.byVar.cbegin();
3692 it != FixablesForAllVars.byVar.cend();) {
3693 // FIXME: need to deal with global variables later
3694 if ((!it->first->isLocalVarDecl() && !isa<ParmVarDecl>(it->first))) {
3695#ifndef NDEBUG
3696 Handler.addDebugNoteForVar(it->first, it->first->getBeginLoc(),
3697 ("failed to produce fixit for '" +
3698 it->first->getNameAsString() +
3699 "' : neither local nor a parameter"));
3700#endif
3701 it = FixablesForAllVars.byVar.erase(it);
3702 } else if (it->first->getType().getCanonicalType()->isReferenceType()) {
3703#ifndef NDEBUG
3704 Handler.addDebugNoteForVar(it->first, it->first->getBeginLoc(),
3705 ("failed to produce fixit for '" +
3706 it->first->getNameAsString() +
3707 "' : has a reference type"));
3708#endif
3709 it = FixablesForAllVars.byVar.erase(it);
3710 } else if (Tracker.hasUnclaimedUses(it->first)) {
3711 it = FixablesForAllVars.byVar.erase(it);
3712 } else if (it->first->isInitCapture()) {
3713#ifndef NDEBUG
3714 Handler.addDebugNoteForVar(it->first, it->first->getBeginLoc(),
3715 ("failed to produce fixit for '" +
3716 it->first->getNameAsString() +
3717 "' : init capture"));
3718#endif
3719 it = FixablesForAllVars.byVar.erase(it);
3720 } else {
3721 ++it;
3722 }
3723 }
3724
3725#ifndef NDEBUG
3726 for (const auto &it : UnsafeOps.byVar) {
3727 const VarDecl *const UnsafeVD = it.first;
3728 auto UnclaimedDREs = Tracker.getUnclaimedUses(UnsafeVD);
3729 if (UnclaimedDREs.empty())
3730 continue;
3731 const auto UnfixedVDName = UnsafeVD->getNameAsString();
3732 for (const clang::DeclRefExpr *UnclaimedDRE : UnclaimedDREs) {
3733 std::string UnclaimedUseTrace =
3734 getDREAncestorString(UnclaimedDRE, D->getASTContext());
3735
3736 Handler.addDebugNoteForVar(
3737 UnsafeVD, UnclaimedDRE->getBeginLoc(),
3738 ("failed to produce fixit for '" + UnfixedVDName +
3739 "' : has an unclaimed use\nThe unclaimed DRE trace: " +
3740 UnclaimedUseTrace));
3741 }
3742 }
3743#endif
3744
3745 // Fixpoint iteration for pointer assignments
3746 using DepMapTy = DenseMap<const VarDecl *, llvm::SetVector<const VarDecl *>>;
3747 DepMapTy DependenciesMap{};
3748 DepMapTy PtrAssignmentGraph{};
3749
3750 for (auto it : FixablesForAllVars.byVar) {
3751 for (const FixableGadget *fixable : it.second) {
3752 std::optional<std::pair<const VarDecl *, const VarDecl *>> ImplPair =
3753 fixable->getStrategyImplications();
3754 if (ImplPair) {
3755 std::pair<const VarDecl *, const VarDecl *> Impl = std::move(*ImplPair);
3756 PtrAssignmentGraph[Impl.first].insert(Impl.second);
3757 }
3758 }
3759 }
3760
3761 /*
3762 The following code does a BFS traversal of the `PtrAssignmentGraph`
3763 considering all unsafe vars as starting nodes and constructs an undirected
3764 graph `DependenciesMap`. Constructing the `DependenciesMap` in this manner
3765 elimiates all variables that are unreachable from any unsafe var. In other
3766 words, this removes all dependencies that don't include any unsafe variable
3767 and consequently don't need any fixit generation.
3768 Note: A careful reader would observe that the code traverses
3769 `PtrAssignmentGraph` using `CurrentVar` but adds edges between `Var` and
3770 `Adj` and not between `CurrentVar` and `Adj`. Both approaches would
3771 achieve the same result but the one used here dramatically cuts the
3772 amount of hoops the second part of the algorithm needs to jump, given that
3773 a lot of these connections become "direct". The reader is advised not to
3774 imagine how the graph is transformed because of using `Var` instead of
3775 `CurrentVar`. The reader can continue reading as if `CurrentVar` was used,
3776 and think about why it's equivalent later.
3777 */
3778 std::set<const VarDecl *> VisitedVarsDirected{};
3779 for (const auto &[Var, ignore] : UnsafeOps.byVar) {
3780 if (VisitedVarsDirected.find(Var) == VisitedVarsDirected.end()) {
3781
3782 std::queue<const VarDecl *> QueueDirected{};
3783 QueueDirected.push(Var);
3784 while (!QueueDirected.empty()) {
3785 const VarDecl *CurrentVar = QueueDirected.front();
3786 QueueDirected.pop();
3787 VisitedVarsDirected.insert(CurrentVar);
3788 auto AdjacentNodes = PtrAssignmentGraph[CurrentVar];
3789 for (const VarDecl *Adj : AdjacentNodes) {
3790 if (VisitedVarsDirected.find(Adj) == VisitedVarsDirected.end()) {
3791 QueueDirected.push(Adj);
3792 }
3793 DependenciesMap[Var].insert(Adj);
3794 DependenciesMap[Adj].insert(Var);
3795 }
3796 }
3797 }
3798 }
3799
3800 // `Groups` stores the set of Connected Components in the graph.
3801 std::vector<VarGrpTy> Groups;
3802 // `VarGrpMap` maps variables that need fix to the groups (indexes) that the
3803 // variables belong to. Group indexes refer to the elements in `Groups`.
3804 // `VarGrpMap` is complete in that every variable that needs fix is in it.
3805 std::map<const VarDecl *, unsigned> VarGrpMap;
3806 // The union group over the ones in "Groups" that contain parameters of `D`:
3807 llvm::SetVector<const VarDecl *>
3808 GrpsUnionForParms; // these variables need to be fixed in one step
3809
3810 // Group Connected Components for Unsafe Vars
3811 // (Dependencies based on pointer assignments)
3812 std::set<const VarDecl *> VisitedVars{};
3813 for (const auto &[Var, ignore] : UnsafeOps.byVar) {
3814 if (VisitedVars.find(Var) == VisitedVars.end()) {
3815 VarGrpTy &VarGroup = Groups.emplace_back();
3816 std::queue<const VarDecl *> Queue{};
3817
3818 Queue.push(Var);
3819 while (!Queue.empty()) {
3820 const VarDecl *CurrentVar = Queue.front();
3821 Queue.pop();
3822 VisitedVars.insert(CurrentVar);
3823 VarGroup.push_back(CurrentVar);
3824 auto AdjacentNodes = DependenciesMap[CurrentVar];
3825 for (const VarDecl *Adj : AdjacentNodes) {
3826 if (VisitedVars.find(Adj) == VisitedVars.end()) {
3827 Queue.push(Adj);
3828 }
3829 }
3830 }
3831
3832 bool HasParm = false;
3833 unsigned GrpIdx = Groups.size() - 1;
3834
3835 for (const VarDecl *V : VarGroup) {
3836 VarGrpMap[V] = GrpIdx;
3837 if (!HasParm && isParameterOf(V, D))
3838 HasParm = true;
3839 }
3840 if (HasParm)
3841 GrpsUnionForParms.insert(VarGroup.begin(), VarGroup.end());
3842 }
3843 }
3844
3845 // Remove a `FixableGadget` if the associated variable is not in the graph
3846 // computed above. We do not want to generate fix-its for such variables,
3847 // since they are neither warned nor reachable from a warned one.
3848 //
3849 // Note a variable is not warned if it is not directly used in any unsafe
3850 // operation. A variable `v` is NOT reachable from an unsafe variable, if it
3851 // does not exist another variable `u` such that `u` is warned and fixing `u`
3852 // (transitively) implicates fixing `v`.
3853 //
3854 // For example,
3855 // ```
3856 // void f(int * p) {
3857 // int * a = p; *p = 0;
3858 // }
3859 // ```
3860 // `*p = 0` is a fixable gadget associated with a variable `p` that is neither
3861 // warned nor reachable from a warned one. If we add `a[5] = 0` to the end of
3862 // the function above, `p` becomes reachable from a warned variable.
3863 for (auto I = FixablesForAllVars.byVar.begin();
3864 I != FixablesForAllVars.byVar.end();) {
3865 // Note `VisitedVars` contain all the variables in the graph:
3866 if (!VisitedVars.count((*I).first)) {
3867 // no such var in graph:
3868 I = FixablesForAllVars.byVar.erase(I);
3869 } else
3870 ++I;
3871 }
3872
3873 // We assign strategies to variables that are 1) in the graph and 2) can be
3874 // fixed. Other variables have the default "Won't fix" strategy.
3875 FixitStrategy NaiveStrategy = getNaiveStrategy(llvm::make_filter_range(
3876 VisitedVars, [&FixablesForAllVars](const VarDecl *V) {
3877 // If a warned variable has no "Fixable", it is considered unfixable:
3878 return FixablesForAllVars.byVar.count(V);
3879 }));
3880 VariableGroupsManagerImpl VarGrpMgr(Groups, VarGrpMap, GrpsUnionForParms);
3881
3882 if (isa<NamedDecl>(D))
3883 // The only case where `D` is not a `NamedDecl` is when `D` is a
3884 // `BlockDecl`. Let's not fix variables in blocks for now
3885 FixItsForVariableGroup =
3886 getFixIts(FixablesForAllVars, NaiveStrategy, D->getASTContext(), D,
3887 Tracker, Handler, VarGrpMgr);
3888
3889 for (const auto &G : UnsafeOps.noVar) {
3890 G->handleUnsafeOperation(Handler, /*IsRelatedToDecl=*/false,
3891 D->getASTContext());
3892 }
3893
3894 for (const auto &[VD, WarningGadgets] : UnsafeOps.byVar) {
3895 auto FixItsIt = FixItsForVariableGroup.find(VD);
3896 Handler.handleUnsafeVariableGroup(VD, VarGrpMgr,
3897 FixItsIt != FixItsForVariableGroup.end()
3898 ? std::move(FixItsIt->second)
3899 : FixItList{},
3900 D, NaiveStrategy);
3901 for (const auto &G : WarningGadgets) {
3902 G->handleUnsafeOperation(Handler, /*IsRelatedToDecl=*/true,
3903 D->getASTContext());
3904 }
3905 }
3906}
3907
3909 UnsafeBufferUsageHandler &Handler,
3910 bool EmitSuggestions) {
3911#ifndef NDEBUG
3912 Handler.clearDebugNotes();
3913#endif
3914
3915 assert(D);
3916
3917 SmallVector<Stmt *> Stmts;
3918
3919 if (const auto *FD = dyn_cast<FunctionDecl>(D)) {
3920 // We do not want to visit a Lambda expression defined inside a method
3921 // independently. Instead, it should be visited along with the outer method.
3922 // FIXME: do we want to do the same thing for `BlockDecl`s?
3923 if (const auto *MD = dyn_cast<CXXMethodDecl>(D)) {
3924 if (MD->getParent()->isLambda() && MD->getParent()->isLocalClass())
3925 return;
3926 }
3927
3928 for (FunctionDecl *FReDecl : FD->redecls()) {
3929 if (FReDecl->isExternC()) {
3930 // Do not emit fixit suggestions for functions declared in an
3931 // extern "C" block.
3932 EmitSuggestions = false;
3933 break;
3934 }
3935 }
3936
3937 Stmts.push_back(FD->getBody());
3938
3939 if (const auto *ID = dyn_cast<CXXConstructorDecl>(D)) {
3940 for (const CXXCtorInitializer *CI : ID->inits()) {
3941 Stmts.push_back(CI->getInit());
3942 }
3943 }
3944 } else if (isa<BlockDecl>(D) || isa<ObjCMethodDecl>(D)) {
3945 Stmts.push_back(D->getBody());
3946 }
3947
3948 assert(!Stmts.empty());
3949
3950 FixableGadgetList FixableGadgets;
3951 WarningGadgetList WarningGadgets;
3952 DeclUseTracker Tracker;
3953 for (Stmt *S : Stmts) {
3954 findGadgets(S, D->getASTContext(), Handler, EmitSuggestions, FixableGadgets,
3955 WarningGadgets, Tracker);
3956 }
3957 applyGadgets(D, std::move(FixableGadgets), std::move(WarningGadgets),
3958 std::move(Tracker), Handler, EmitSuggestions);
3959}
Defines the clang::ASTContext interface.
#define V(N, I)
Definition: ASTContext.h:3453
BoundNodesTreeBuilder Nodes
DynTypedNode Node
#define AST_MATCHER(Type, DefineMatcher)
AST_MATCHER(Type, DefineMatcher) { ... } defines a zero parameter function named DefineMatcher() that...
#define AST_MATCHER_P(Type, DefineMatcher, ParamType, Param)
AST_MATCHER_P(Type, DefineMatcher, ParamType, Param) { ... } defines a single-parameter function name...
#define SM(sm)
Definition: Cuda.cpp:84
const Decl * D
Expr * E
llvm::APSInt APSInt
Definition: Compiler.cpp:23
static Decl::Kind getKind(const Decl *D)
Definition: DeclBase.cpp:1172
StringRef Text
Definition: Format.cpp:3052
unsigned Iter
Definition: HTMLLogger.cpp:153
static const Decl * getCanonicalDecl(const Decl *D)
llvm::MachO::Target Target
Definition: MachO.h:51
Defines the clang::Preprocessor interface.
static bool hasAttr(const Decl *D, bool IgnoreImplicitAttr)
Definition: SemaCUDA.cpp:109
SourceRange Range
Definition: SemaObjC.cpp:758
SourceLocation Loc
Definition: SemaObjC.cpp:759
Defines the clang::SourceLocation class and associated facilities.
static QualType getPointeeType(const MemRegion *R)
C Language Family Type Representation.
SourceLocation Begin
static std::string getUserFillPlaceHolder(StringRef HintTextToUser="placeholder")
static FixItList fixVariableWithSpan(const VarDecl *VD, const DeclUseTracker &Tracker, ASTContext &Ctx, UnsafeBufferUsageHandler &Handler)
static std::optional< FixItList > fixUPCAddressofArraySubscriptWithSpan(const UnaryOperator *Node)
static std::optional< StringRef > getExprText(const Expr *E, const SourceManager &SM, const LangOptions &LangOpts)
static WarningGadgetSets groupWarningGadgetsByVar(const WarningGadgetList &AllUnsafeOperations)
static StringRef getEndOfLine()
static std::optional< FixItList > FixVarInitializerWithSpan(const Expr *Init, ASTContext &Ctx, const StringRef UserFillPlaceHolder)
#define NEXT
static std::optional< SourceLocation > getEndCharLoc(const NodeTy *Node, const SourceManager &SM, const LangOptions &LangOpts)
static FixItList fixVariableWithArray(const VarDecl *VD, const DeclUseTracker &Tracker, const ASTContext &Ctx, UnsafeBufferUsageHandler &Handler)
static std::string getSpanTypeText(StringRef EltTyText, std::optional< Qualifiers > Quals=std::nullopt)
static SourceRange getSourceRangeToTokenEnd(const Decl *D, const SourceManager &SM, const LangOptions &LangOpts)
static FixItList fixLocalVarDeclWithSpan(const VarDecl *D, ASTContext &Ctx, const StringRef UserFillPlaceHolder, UnsafeBufferUsageHandler &Handler)
static std::optional< FixItList > createDataFixit(const ASTContext &Ctx, const DeclRefExpr *DRE)
static FixItList createFunctionOverloadsForParms(std::map< const VarDecl *, FixItList > &FixItsForVariable, const VariableGroupsManager &VarGrpMgr, const FunctionDecl *FD, const FixitStrategy &S, ASTContext &Ctx, UnsafeBufferUsageHandler &Handler)
#define FIXABLE_GADGET(name)
#define WARNING_OPTIONAL_GADGET(x)
static FixItList fixVarDeclWithArray(const VarDecl *D, const ASTContext &Ctx, UnsafeBufferUsageHandler &Handler)
void applyGadgets(const Decl *D, FixableGadgetList FixableGadgets, WarningGadgetList WarningGadgets, DeclUseTracker Tracker, UnsafeBufferUsageHandler &Handler, bool EmitSuggestions)
#define WARNING_GADGET(name)
static FixItList fixVariable(const VarDecl *VD, FixitStrategy::Kind K, const Decl *D, const DeclUseTracker &Tracker, ASTContext &Ctx, UnsafeBufferUsageHandler &Handler)
static FixItList fixParamWithSpan(const ParmVarDecl *PVD, const ASTContext &Ctx, UnsafeBufferUsageHandler &Handler)
static std::optional< StringRef > getRangeText(SourceRange SR, const SourceManager &SM, const LangOptions &LangOpts)
static FixitStrategy getNaiveStrategy(llvm::iterator_range< VarDeclIterTy > UnsafeVars)
static std::optional< std::string > createSpanTypeForVarDecl(const VarDecl *VD, const ASTContext &Ctx)
static SourceLocation getVarDeclIdentifierLoc(const VarDecl *VD)
static std::optional< SourceLocation > getPastLoc(const NodeTy *Node, const SourceManager &SM, const LangOptions &LangOpts)
static bool hasConflictingOverload(const FunctionDecl *FD)
static std::optional< StringRef > getVarDeclIdentifierText(const VarDecl *VD, const SourceManager &SM, const LangOptions &LangOpts)
static std::optional< std::string > getPointeeTypeText(const VarDecl *VD, const SourceManager &SM, const LangOptions &LangOpts, std::optional< Qualifiers > *QualifiersToAppend)
static bool isNonNegativeIntegerExpr(const Expr *Expr, const VarDecl *VD, const ASTContext &Ctx)
static bool overlapWithMacro(const FixItList &FixIts)
static bool hasUnsupportedSpecifiers(const VarDecl *VD, const SourceManager &SM)
#define DEBUG_NOTE_DECL_FAIL(D, Msg)
static void findGadgets(const Stmt *S, ASTContext &Ctx, const UnsafeBufferUsageHandler &Handler, bool EmitSuggestions, FixableGadgetList &FixableGadgets, WarningGadgetList &WarningGadgets, DeclUseTracker &Tracker)
Scan the function and return a list of gadgets found with provided kits.
static std::map< const VarDecl *, FixItList > getFixIts(FixableGadgetSets &FixablesForAllVars, const FixitStrategy &S, ASTContext &Ctx, const Decl *D, const DeclUseTracker &Tracker, UnsafeBufferUsageHandler &Handler, const VariableGroupsManager &VarGrpMgr)
static std::optional< FixItList > createOverloadsForFixedParams(const FixitStrategy &S, const FunctionDecl *FD, const ASTContext &Ctx, UnsafeBufferUsageHandler &Handler)
static void eraseVarsForUnfixableGroupMates(std::map< const VarDecl *, FixItList > &FixItsForVariable, const VariableGroupsManager &VarGrpMgr)
static FixableGadgetSets groupFixablesByVar(FixableGadgetList &&AllFixableOperations)
static bool isParameterOf(const VarDecl *VD, const Decl *D)
static std::optional< StringRef > getFunNameText(const FunctionDecl *FD, const SourceManager &SM, const LangOptions &LangOpts)
__device__ __2f16 float __ockl_bool s
virtual std::optional< FixItList > getFixits(const FixitStrategy &s) const final
DerefSimplePtrArithFixableGadget(const MatchFinder::MatchResult &Result)
SourceLocation getSourceLoc() const override
virtual DeclUseList getClaimedVarUseSites() const final
virtual std::optional< FixItList > getFixits(const FixitStrategy &S) const override
SourceLocation getSourceLoc() const override
virtual DeclUseList getClaimedVarUseSites() const override
static bool classof(const Gadget *G)
UPCPreIncrementGadget(const MatchFinder::MatchResult &Result)
static bool classof(const Gadget *G)
static Matcher matcher()
UUCAddAssignGadget(const MatchFinder::MatchResult &Result)
virtual std::optional< FixItList > getFixits(const FixitStrategy &S) const override
virtual DeclUseList getClaimedVarUseSites() const override
SourceLocation getSourceLoc() const override
VariableGroupsManagerImpl(const std::vector< VarGrpTy > &Groups, const std::map< const VarDecl *, unsigned > &VarGrpMap, const llvm::SetVector< const VarDecl * > &GrpsUnionForParms)
VarGrpRef getGroupOfVar(const VarDecl *Var, bool *HasParm) const override
Returns the set of variables (including Var) that need to be fixed together in one step.
VarGrpRef getGroupOfParms() const override
Returns the non-empty group of variables that include parameters of the analyzing function,...
APSInt & getInt()
Definition: APValue.h:465
Holds long-lived AST nodes (such as types and decls) that can be referred to throughout the semantic ...
Definition: ASTContext.h:188
SourceManager & getSourceManager()
Definition: ASTContext.h:741
const ConstantArrayType * getAsConstantArrayType(QualType T) const
Definition: ASTContext.h:2915
DynTypedNodeList getParents(const NodeT &Node)
Forwards to get node parents from the ParentMapContext.
QualType getFILEType() const
Retrieve the C FILE type.
Definition: ASTContext.h:2089
const LangOptions & getLangOpts() const
Definition: ASTContext.h:834
const TargetInfo & getTargetInfo() const
Definition: ASTContext.h:799
ArraySubscriptExpr - [C99 6.5.2.1] Array Subscripting.
Definition: Expr.h:2718
SourceLocation getBeginLoc() const LLVM_READONLY
Definition: Expr.h:2761
Attr - This represents one attribute.
Definition: Attr.h:43
A builtin binary operation expression such as "x + y" or "x <= y".
Definition: Expr.h:3909
Expr * getLHS() const
Definition: Expr.h:3959
SourceLocation getBeginLoc() const LLVM_READONLY
Definition: Expr.h:3964
static StringRef getOpcodeStr(Opcode Op)
getOpcodeStr - Turn an Opcode enum value into the punctuation char it corresponds to,...
Definition: Expr.cpp:2149
Expr * getRHS() const
Definition: Expr.h:3961
Represents a call to a C++ constructor.
Definition: ExprCXX.h:1546
Expr * getArg(unsigned Arg)
Return the specified argument.
Definition: ExprCXX.h:1689
SourceLocation getBeginLoc() const LLVM_READONLY
Definition: ExprCXX.cpp:562
Represents a C++ base or member initializer.
Definition: DeclCXX.h:2318
A use of a default initializer in a constructor or in aggregate initialization.
Definition: ExprCXX.h:1375
Represents a static or instance method of a struct/union/class.
Definition: DeclCXX.h:2078
Represents a C++11 noexcept expression (C++ [expr.unary.noexcept]).
Definition: ExprCXX.h:4126
Represents a C++ struct/union/class.
Definition: DeclCXX.h:258
CXXRecordDecl * getCanonicalDecl() override
Retrieves the "canonical" declaration of the given declaration.
Definition: DeclCXX.h:524
A C++ typeid expression (C++ [expr.typeid]), which gets the type_info that corresponds to the supplie...
Definition: ExprCXX.h:845
CallExpr - Represents a function call (C99 6.5.2.2, C++ [expr.call]).
Definition: Expr.h:2874
CastExpr - Base class for type casts, including both implicit casts (ImplicitCastExpr) and explicit c...
Definition: Expr.h:3547
static const char * getCastKindName(CastKind CK)
Definition: Expr.cpp:1967
Represents a character-granular source range.
static CharSourceRange getCharRange(SourceRange R)
SourceLocation getEnd() const
ConstStmtVisitor - This class implements a simple visitor for Stmt subclasses.
Definition: StmtVisitor.h:195
lookup_result lookup(DeclarationName Name) const
lookup - Find the declarations (if any) with the given Name in this context.
Definition: DeclBase.cpp:1854
A reference to a declared variable, function, enum, etc.
Definition: Expr.h:1265
SourceLocation getBeginLoc() const LLVM_READONLY
Definition: Expr.cpp:550
ValueDecl * getDecl()
Definition: Expr.h:1333
DeclStmt - Adaptor class for mixing declarations with statements and expressions.
Definition: Stmt.h:1519
bool isSingleDecl() const
isSingleDecl - This method returns true if this DeclStmt refers to a single Decl.
Definition: Stmt.h:1532
decl_range decls()
Definition: Stmt.h:1567
Decl - This represents one declaration (or definition), e.g.
Definition: DeclBase.h:86
bool isInStdNamespace() const
Definition: DeclBase.cpp:422
SourceLocation getEndLoc() const LLVM_READONLY
Definition: DeclBase.h:438
ASTContext & getASTContext() const LLVM_READONLY
Definition: DeclBase.cpp:520
bool isImplicit() const
isImplicit - Indicates whether the declaration was implicitly generated by the implementation.
Definition: DeclBase.h:596
virtual Stmt * getBody() const
getBody - If this Decl represents a declaration for a body of code, such as a function or method defi...
Definition: DeclBase.h:1076
SourceLocation getLocation() const
Definition: DeclBase.h:442
DeclContext * getDeclContext()
Definition: DeclBase.h:451
attr_range attrs() const
Definition: DeclBase.h:538
SourceLocation getBeginLoc() const LLVM_READONLY
Definition: DeclBase.h:434
virtual SourceRange getSourceRange() const LLVM_READONLY
Source range that this declaration covers.
Definition: DeclBase.h:430
NestedNameSpecifier * getQualifier() const
Retrieve the nested-name-specifier that qualifies the name of this declaration, if it was present in ...
Definition: Decl.h:792
SourceLocation getBeginLoc() const LLVM_READONLY
Definition: Decl.h:786
NestedNameSpecifierLoc getQualifierLoc() const
Retrieve the nested-name-specifier (with source-location information) that qualifies the name of this...
Definition: Decl.h:800
TypeSourceInfo * getTypeSourceInfo() const
Definition: Decl.h:764
Container for either a single DynTypedNode or for an ArrayRef to DynTypedNode.
const DynTypedNode * begin() const
A dynamically typed AST node container.
SourceRange getSourceRange() const
For nodes which represent textual entities in the source code, return their SourceRange.
const T * get() const
Retrieve the stored node as type T.
static DynTypedNode create(const T &Node)
Creates a DynTypedNode from Node.
Recursive AST visitor that supports extension via dynamic dispatch.
virtual bool TraverseDecl(Decl *D)
Recursively visit a declaration, by dispatching to Traverse*Decl() based on the argument's dynamic ty...
virtual bool TraverseStmt(Stmt *S)
Recursively visit a statement or expression, by dispatching to Traverse*() based on the argument's dy...
bool ShouldVisitImplicitCode
Whether this visitor should recurse into implicit code, e.g.
bool ShouldVisitTemplateInstantiations
Whether this visitor should recurse into template instantiations.
ExplicitCastExpr - An explicit cast written in the source code.
Definition: Expr.h:3799
This represents one expression.
Definition: Expr.h:110
Expr * IgnoreParenImpCasts() LLVM_READONLY
Skip past any parentheses and implicit casts which might surround this expression until reaching a fi...
Definition: Expr.cpp:3097
Expr * IgnoreImplicit() LLVM_READONLY
Skip past any implicit AST nodes which might surround this expression until reaching a fixed point.
Definition: Expr.cpp:3085
Expr * IgnoreParens() LLVM_READONLY
Skip past any parentheses which might surround this expression until reaching a fixed point.
Definition: Expr.cpp:3093
NullPointerConstantValueDependence
Enumeration used to describe how isNullPointerConstant() should cope with value-dependent expressions...
Definition: Expr.h:820
std::optional< llvm::APSInt > getIntegerConstantExpr(const ASTContext &Ctx, SourceLocation *Loc=nullptr) const
isIntegerConstantExpr - Return the value if this expression is a valid integer constant expression.
QualType getType() const
Definition: Expr.h:142
Annotates a diagnostic with some code that should be inserted, removed, or replaced to fix the proble...
Definition: Diagnostic.h:75
CharSourceRange RemoveRange
Code that should be replaced to correct the error.
Definition: Diagnostic.h:79
static FixItHint CreateReplacement(CharSourceRange RemoveRange, StringRef Code)
Create a code modification hint that replaces the given source range with the given code string.
Definition: Diagnostic.h:138
static FixItHint CreateRemoval(CharSourceRange RemoveRange)
Create a code modification hint that removes the given source range.
Definition: Diagnostic.h:127
static FixItHint CreateInsertion(SourceLocation InsertionLoc, StringRef Code, bool BeforePreviousInsertions=false)
Create a code modification hint that inserts the given code string at a specific location.
Definition: Diagnostic.h:101
Represents a function declaration or definition.
Definition: Decl.h:1935
const ParmVarDecl * getParamDecl(unsigned i) const
Definition: Decl.h:2672
Stmt * getBody(const FunctionDecl *&Definition) const
Retrieve the body (definition) of the function.
Definition: Decl.cpp:3243
param_iterator param_begin()
Definition: Decl.h:2661
unsigned getNumParams() const
Return the number of parameters this function must have based on its FunctionType.
Definition: Decl.cpp:3702
DeclarationNameInfo getNameInfo() const
Definition: Decl.h:2146
Represents a C11 generic selection.
Definition: Expr.h:5966
One of these records is kept for each identifier that is lexed.
StringRef getName() const
Return the actual identifier string.
ImplicitCastExpr - Allows us to explicitly represent implicit type conversions, which have no direct ...
Definition: Expr.h:3724
Keeps track of the various options that can be enabled, which controls the dialect of C or C++ that i...
Definition: LangOptions.h:499
static StringRef getSourceText(CharSourceRange Range, const SourceManager &SM, const LangOptions &LangOpts, bool *Invalid=nullptr)
Returns a string for the source that the range encompasses.
Definition: Lexer.cpp:1023
static bool isAtEndOfMacroExpansion(SourceLocation loc, const SourceManager &SM, const LangOptions &LangOpts, SourceLocation *MacroEnd=nullptr)
Returns true if the given MacroID location points at the last token of the macro expansion.
Definition: Lexer.cpp:893
static unsigned MeasureTokenLength(SourceLocation Loc, const SourceManager &SM, const LangOptions &LangOpts)
MeasureTokenLength - Relex the token at the specified location and return its length in bytes in the ...
Definition: Lexer.cpp:498
static std::optional< Token > findNextToken(SourceLocation Loc, const SourceManager &SM, const LangOptions &LangOpts)
Finds the token that comes right after the given location.
Definition: Lexer.cpp:1324
static SourceLocation getLocForEndOfToken(SourceLocation Loc, unsigned Offset, const SourceManager &SM, const LangOptions &LangOpts)
Computes the source location just past the end of the token at this source location.
Definition: Lexer.cpp:849
IdentifierInfo * getIdentifier() const
Get the identifier that names this declaration, if there is one.
Definition: Decl.h:274
StringRef getName() const
Get the name of identifier for this declaration as a StringRef.
Definition: Decl.h:280
DeclarationName getDeclName() const
Get the actual, stored name of the declaration, which may be a special name.
Definition: Decl.h:319
std::string getNameAsString() const
Get a human-readable name for the declaration, even if it is one of the special kinds of names (C++ c...
Definition: Decl.h:296
SourceLocation getBeginLoc() const
Retrieve the location of the beginning of this nested-name-specifier.
Represents a parameter to a function.
Definition: Decl.h:1725
bool hasDefaultArg() const
Determines whether this parameter has a default argument, either parsed or not.
Definition: Decl.cpp:3023
SourceRange getSourceRange() const override LLVM_READONLY
Source range that this declaration covers.
Definition: Decl.cpp:2945
Wrapper for source info for pointers.
Definition: TypeLoc.h:1332
PointerType - C99 6.7.5.1 - Pointer Declarators.
Definition: Type.h:3198
A (possibly-)qualified type.
Definition: Type.h:929
bool hasQualifiers() const
Determine whether this type has any qualifiers.
Definition: Type.h:8025
bool isNull() const
Return true if this QualType doesn't point to a type yet.
Definition: Type.h:996
Qualifiers getQualifiers() const
Retrieve the set of qualifiers applied to this type.
Definition: Type.h:7976
QualType getCanonicalType() const
Definition: Type.h:7988
bool isConstQualified() const
Determine whether this type is const-qualified.
Definition: Type.h:8009
std::string getAsString() const
redecl_range redecls() const
Returns an iterator range for all the redeclarations of the same decl.
Definition: Redeclarable.h:295
Encodes a location in the source.
bool isValid() const
Return true if this is a valid SourceLocation object.
SourceLocation getLocWithOffset(IntTy Offset) const
Return a source location with the specified offset from this SourceLocation.
This class handles loading and caching of source files into memory.
A trivial tuple used to represent a source range.
SourceLocation getEnd() const
SourceLocation getBegin() const
bool isValid() const
Stmt - This represents one statement.
Definition: Stmt.h:84
SourceLocation getEndLoc() const LLVM_READONLY
Definition: Stmt.cpp:357
StmtClass getStmtClass() const
Definition: Stmt.h:1380
SourceLocation getBeginLoc() const LLVM_READONLY
Definition: Stmt.cpp:345
Exposes information about the current target.
Definition: TargetInfo.h:220
Base wrapper for a particular "section" of type source info.
Definition: TypeLoc.h:59
UnqualTypeLoc getUnqualifiedLoc() const
Skips past any qualifiers, if this is qualified.
Definition: TypeLoc.h:338
TypeLoc getNextTypeLoc() const
Get the next TypeLoc pointed by this TypeLoc, e.g for "int*" the TypeLoc is a PointerLoc and next Typ...
Definition: TypeLoc.h:170
T castAs() const
Convert to the specified TypeLoc type, asserting that this TypeLoc is of the desired type.
Definition: TypeLoc.h:78
SourceRange getSourceRange() const LLVM_READONLY
Get the full source range.
Definition: TypeLoc.h:153
TypeLocClass getTypeLocClass() const
Definition: TypeLoc.h:116
bool isNull() const
Definition: TypeLoc.h:121
SourceLocation getEndLoc() const
Get the end source location.
Definition: TypeLoc.cpp:235
SourceLocation getBeginLoc() const
Get the begin source location.
Definition: TypeLoc.cpp:192
TypeLoc getTypeLoc() const
Return the TypeLoc wrapper for the type source info.
Definition: TypeLoc.h:256
bool isFunctionPointerType() const
Definition: Type.h:8231
bool isPointerType() const
Definition: Type.h:8191
bool isIntegerType() const
isIntegerType() does not include complex integers (a GCC extension).
Definition: Type.h:8555
const T * castAs() const
Member-template castAs<specific type>.
Definition: Type.h:8805
QualType getPointeeType() const
If this is a pointer, ObjC object pointer, or block pointer, this returns the respective pointee.
Definition: Type.cpp:738
bool isUnsignedIntegerType() const
Return true if this is an integer type that is unsigned, according to C99 6.2.5p6 [which returns true...
Definition: Type.cpp:2230
UnaryExprOrTypeTraitExpr - expression with either a type or (unevaluated) expression operand.
Definition: Expr.h:2622
UnaryOperator - This represents the unary-expression's (except sizeof and alignof),...
Definition: Expr.h:2232
SourceLocation getOperatorLoc() const
getOperatorLoc - Return the location of the operator.
Definition: Expr.h:2281
Expr * getSubExpr() const
Definition: Expr.h:2277
Opcode getOpcode() const
Definition: Expr.h:2272
SourceLocation getBeginLoc() const LLVM_READONLY
Definition: Expr.h:2354
static StringRef getOpcodeStr(Opcode Op)
getOpcodeStr - Turn an Opcode enum value into the punctuation char it corresponds to,...
Definition: Expr.cpp:1408
The interface that lets the caller handle unsafe buffer usage analysis results by overriding this cla...
void addDebugNoteForVar(const VarDecl *VD, SourceLocation Loc, std::string Text)
virtual std::string getUnsafeBufferUsageAttributeTextAt(SourceLocation Loc, StringRef WSSuffix="") const =0
virtual void handleUnsafeOperation(const Stmt *Operation, bool IsRelatedToDecl, ASTContext &Ctx)=0
Invoked when an unsafe operation over raw pointers is found.
virtual void handleUnsafeVariableGroup(const VarDecl *Variable, const VariableGroupsManager &VarGrpMgr, FixItList &&Fixes, const Decl *D, const FixitStrategy &VarTargetTypes)=0
Invoked when a fix is suggested against a variable.
virtual void handleUnsafeOperationInContainer(const Stmt *Operation, bool IsRelatedToDecl, ASTContext &Ctx)=0
Invoked when an unsafe operation with a std container is found.
virtual void handleUnsafeLibcCall(const CallExpr *Call, unsigned PrintfInfo, ASTContext &Ctx, const Expr *UnsafeArg=nullptr)=0
Invoked when a call to an unsafe libc function is found.
QualType getType() const
Definition: Decl.h:682
Represents a variable declaration or definition.
Definition: Decl.h:882
bool isConstexpr() const
Whether this variable is (C++11) constexpr.
Definition: Decl.h:1513
VarDecl * getCanonicalDecl() override
Retrieves the "canonical" declaration of the given declaration.
Definition: Decl.cpp:2246
bool isInlineSpecified() const
Definition: Decl.h:1498
bool hasConstantInitialization() const
Determine whether this variable has constant initialization.
Definition: Decl.cpp:2620
bool hasLocalStorage() const
Returns true if a variable with function scope is a non-static local variable.
Definition: Decl.h:1135
bool isLocalVarDecl() const
Returns true for local variable declarations other than parameters.
Definition: Decl.h:1204
virtual VarGrpRef getGroupOfVar(const VarDecl *Var, bool *HasParm=nullptr) const =0
Returns the set of variables (including Var) that need to be fixed together in one step.
virtual VarGrpRef getGroupOfParms() const =0
Returns the non-empty group of variables that include parameters of the analyzing function,...
bool findMatch(const DynTypedNode &DynNode)
bool TraverseCXXNoexceptExpr(CXXNoexceptExpr *Node) override
bool TraverseDecltypeTypeLoc(DecltypeTypeLoc Node) override
bool TraverseCXXDefaultInitExpr(CXXDefaultInitExpr *Node) override
bool TraverseUnaryExprOrTypeTraitExpr(UnaryExprOrTypeTraitExpr *Node) override
bool TraverseGenericSelectionExpr(GenericSelectionExpr *Node) override
bool TraverseTypeOfExprTypeLoc(TypeOfExprTypeLoc Node) override
bool TraverseStmt(Stmt *Node) override
Recursively visit a statement or expression, by dispatching to Traverse*() based on the argument's dy...
bool TraverseCXXTypeidExpr(CXXTypeidExpr *Node) override
MatchDescendantVisitor(const internal::DynTypedMatcher *Matcher, internal::ASTMatchFinder *Finder, internal::BoundNodesTreeBuilder *Builder, internal::ASTMatchFinder::BindKind Bind, const bool ignoreUnevaluatedContext)
bool TraverseDecl(Decl *Node) override
Recursively visit a declaration, by dispatching to Traverse*Decl() based on the argument's dynamic ty...
Called when the Match registered for it was successfully found in the AST.
virtual void run(const MatchResult &Result)=0
Called on every match by the MatchFinder.
A class to allow finding matches over the Clang AST.
void addMatcher(const DeclarationMatcher &NodeMatch, MatchCallback *Action)
Adds a matcher to execute when running over the AST.
void match(const T &Node, ASTContext &Context)
Calls the registered callbacks on all matches on the given Node.
bool ParsePrintfString(FormatStringHandler &H, const char *beg, const char *end, const LangOptions &LO, const TargetInfo &Target, bool isFreeBSDKPrintf)
static bool isNullTermPointer(const Expr *Ptr)
static bool hasUnsafeFormatOrSArg(const CallExpr *Call, const Expr *&UnsafeArg, const unsigned FmtArgIdx, ASTContext &Ctx, bool isKprintf=false)
const internal::VariadicDynCastAllOfMatcher< Decl, VarDecl > varDecl
Matches variable declarations.
const internal::VariadicDynCastAllOfMatcher< Stmt, DeclRefExpr > declRefExpr
Matches expressions that refer to declarations.
const AstTypeMatcher< EnumType > enumType
Matches enum types.
static auto isInUnspecifiedLvalueContext(internal::Matcher< Expr > innerMatcher)
const internal::VariadicOperatorMatcherFunc< 1, 1 > unless
Matches if the provided matcher does not match.
const internal::VariadicDynCastAllOfMatcher< Stmt, ImplicitCastExpr > implicitCastExpr
Matches the implicit cast nodes of Clang's AST.
const internal::VariadicDynCastAllOfMatcher< Stmt, StringLiteral > stringLiteral
Matches string literals (also matches wide string literals).
const AstTypeMatcher< PointerType > pointerType
Matches pointer types, but does not match Objective-C object pointer types.
const internal::VariadicDynCastAllOfMatcher< Decl, BindingDecl > bindingDecl
Matches binding declarations Example matches foo and bar (matcher = bindingDecl()
internal::Matcher< NamedDecl > hasName(StringRef Name)
Matches NamedDecl nodes that have the specified name.
Definition: ASTMatchers.h:3099
const internal::VariadicDynCastAllOfMatcher< Stmt, CallExpr > callExpr
Matches call expressions.
const internal::VariadicDynCastAllOfMatcher< Stmt, CompoundStmt > compoundStmt
Matches compound statements.
const internal::ArgumentAdaptingMatcherFunc< internal::ForEachMatcher > forEach
Matches AST nodes that have child AST nodes that match the provided matcher.
const AstTypeMatcher< ArrayType > arrayType
Matches all kinds of arrays.
const internal::VariadicDynCastAllOfMatcher< Stmt, UnaryOperator > unaryOperator
Matches unary operator expressions.
const internal::VariadicDynCastAllOfMatcher< Stmt, ArraySubscriptExpr > arraySubscriptExpr
Matches array subscript expressions.
static internal::Matcher< Stmt > isInUnspecifiedUntypedContext(internal::Matcher< Stmt > InnerMatcher)
const internal::VariadicDynCastAllOfMatcher< Stmt, CXXMemberCallExpr > cxxMemberCallExpr
Matches member call expressions.
const internal::VariadicDynCastAllOfMatcher< Decl, CXXConstructorDecl > cxxConstructorDecl
Matches C++ constructor declarations.
const internal::VariadicDynCastAllOfMatcher< Stmt, ArrayInitIndexExpr > arrayInitIndexExpr
The arrayInitIndexExpr consists of two subexpressions: a common expression (the source array) that is...
const internal::VariadicDynCastAllOfMatcher< Stmt, BinaryOperator > binaryOperator
Matches binary operator expressions.
const internal::VariadicDynCastAllOfMatcher< Stmt, ParenExpr > parenExpr
Matches parentheses used in expressions.
const internal::ArgumentAdaptingMatcherFunc< internal::HasMatcher > has
Matches AST nodes that have child AST nodes that match the provided matcher.
const internal::VariadicDynCastAllOfMatcher< Stmt, ExplicitCastExpr > explicitCastExpr
Matches explicit cast expressions.
internal::PolymorphicMatcher< internal::ValueEqualsMatcher, void(internal::AllNodeBaseTypes), ValueT > equals(const ValueT &Value)
Matches literals that are equal to the given value of type ValueT.
Definition: ASTMatchers.h:5891
const AstTypeMatcher< ConstantArrayType > constantArrayType
Matches C arrays with a specified constant size.
const internal::VariadicOperatorMatcherFunc< 2, std::numeric_limits< unsigned >::max()> eachOf
Matches if any of the given matchers matches.
const internal::VariadicDynCastAllOfMatcher< Stmt, CXXConstructExpr > cxxConstructExpr
Matches constructor call expressions (including implicit ones).
const internal::VariadicDynCastAllOfMatcher< Decl, FieldDecl > fieldDecl
Matches field declarations.
static internal::Matcher< Stmt > isInUnspecifiedPointerContext(internal::Matcher< Stmt > InnerMatcher)
const internal::VariadicOperatorMatcherFunc< 2, std::numeric_limits< unsigned >::max()> allOf
Matches if all given matchers match.
const internal::VariadicDynCastAllOfMatcher< Decl, FunctionDecl > functionDecl
Matches function declarations.
const internal::VariadicDynCastAllOfMatcher< Stmt, MemberExpr > memberExpr
Matches member expressions.
static auto hasPointerType()
const internal::VariadicDynCastAllOfMatcher< Stmt, IntegerLiteral > integerLiteral
Matches integer literals of all sizes / encodings, e.g.
internal::PolymorphicMatcher< internal::HasDeclarationMatcher, void(internal::HasDeclarationSupportedTypes), internal::Matcher< Decl > > hasDeclaration(const internal::Matcher< Decl > &InnerMatcher)
Matches a node if the declaration associated with that node matches the given matcher.
Definition: ASTMatchers.h:3696
const internal::VariadicDynCastAllOfMatcher< Stmt, DeclStmt > declStmt
Matches declaration statements.
const internal::VariadicAllOfMatcher< Stmt > stmt
Matches statements.
const internal::VariadicDynCastAllOfMatcher< Stmt, Expr > expr
Matches expressions.
const internal::VariadicOperatorMatcherFunc< 2, std::numeric_limits< unsigned >::max()> anyOf
Matches if any of the given matchers matches.
const internal::VariadicFunction< internal::PolymorphicMatcher< internal::HasAnyOperatorNameMatcher, AST_POLYMORPHIC_SUPPORTED_TYPES(BinaryOperator, CXXOperatorCallExpr, CXXRewrittenBinaryOperator, UnaryOperator), std::vector< std::string > >, StringRef, internal::hasAnyOperatorNameFunc > hasAnyOperatorName
Matches operator expressions (binary or unary) that have any of the specified names.
const internal::VariadicDynCastAllOfMatcher< Decl, CXXMethodDecl > cxxMethodDecl
Matches method declarations.
const internal::VariadicDynCastAllOfMatcher< Stmt, CastExpr > castExpr
Matches any cast nodes of Clang's AST.
const internal::VariadicDynCastAllOfMatcher< Stmt, IfStmt > ifStmt
Matches if statements.
bool anyConflict(const llvm::SmallVectorImpl< FixItHint > &FixIts, const SourceManager &SM)
bool Call(InterpState &S, CodePtr OpPC, const Function *Func, uint32_t VarArgSize)
Definition: Interp.cpp:1270
RangeSelector member(std::string ID)
Given a MemberExpr, selects the member token.
The JSON file list parser is used to communicate input to InstallAPI.
void checkUnsafeBufferUsage(const Decl *D, UnsafeBufferUsageHandler &Handler, bool EmitSuggestions)
std::vector< const VarDecl * > VarGrpTy
const FunctionProtoType * T
Diagnostic wrappers for TextAPI types for error reporting.
Definition: Dominators.h:30
#define false
Definition: stdbool.h:26
bool operator()(const NodeTy *N1, const NodeTy *N2) const
std::map< const VarDecl *, std::set< const FixableGadget * >, CompareNode< VarDecl > > byVar
std::map< const VarDecl *, std::set< const WarningGadget * >, CompareNode< VarDecl > > byVar
llvm::SmallVector< const WarningGadget *, 16 > noVar
SourceLocation getBeginLoc() const
getBeginLoc - Retrieve the location of the first token.
SourceLocation getEndLoc() const LLVM_READONLY
EvalResult is a struct with detailed info about an evaluated expression.
Definition: Expr.h:642
APValue Val
Val - This is the value the expression can be folded to.
Definition: Expr.h:644
Wraps an identifier and optional source location for the identifier.
Definition: ParsedAttr.h:103
Contains all information for a given match.