clang 23.0.0git
Origins.cpp
Go to the documentation of this file.
1//===- Origins.cpp - Origin Implementation -----------------------*- C++-*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
11#include "clang/AST/Attr.h"
12#include "clang/AST/Decl.h"
13#include "clang/AST/DeclCXX.h"
15#include "clang/AST/Expr.h"
16#include "clang/AST/ExprCXX.h"
18#include "clang/AST/TypeBase.h"
22#include "llvm/ADT/StringMap.h"
23
25namespace {
26/// A utility class to traverse the function body in the analysis
27/// context and collect the count of expressions with missing origins.
28class MissingOriginCollector
29 : public RecursiveASTVisitor<MissingOriginCollector> {
30public:
31 MissingOriginCollector(
32 const llvm::DenseMap<const clang::Expr *, OriginList *> &ExprToOriginList,
33 const OriginManager &OM, LifetimeSafetyStats &LSStats)
34 : ExprToOriginList(ExprToOriginList), OM(OM), LSStats(LSStats) {}
35 bool VisitExpr(Expr *E) {
36 if (!OM.hasOrigins(E))
37 return true;
38 // Check if we have an origin for this expression.
39 if (!ExprToOriginList.contains(E)) {
40 // No origin found: count this as missing origin.
41 LSStats.ExprTypeToMissingOriginCount[E->getType().getTypePtr()]++;
42 LSStats.ExprStmtClassToMissingOriginCount[std::string(
43 E->getStmtClassName())]++;
44 }
45 return true;
46 }
47
48private:
49 const llvm::DenseMap<const clang::Expr *, OriginList *> &ExprToOriginList;
50 const OriginManager &OM;
51 LifetimeSafetyStats &LSStats;
52};
53
54class LifetimeAnnotatedOriginTypeCollector
55 : public RecursiveASTVisitor<LifetimeAnnotatedOriginTypeCollector> {
56public:
57 bool VisitCallExpr(const CallExpr *CE) {
58 // Indirect calls (e.g., function pointers) are skipped because lifetime
59 // annotations currently apply to declarations, not types.
60 if (const auto *FD = CE->getDirectCallee())
61 collect(FD, FD->getReturnType());
62 return true;
63 }
64
65 bool VisitCXXConstructExpr(const CXXConstructExpr *CCE) {
66 collect(CCE->getConstructor(), CCE->getType());
67 return true;
68 }
69
70 bool shouldVisitLambdaBody() const { return false; }
71 bool shouldVisitTemplateInstantiations() const { return true; }
72
73 const llvm::SmallVector<QualType> &getCollectedTypes() const {
74 return CollectedTypes;
75 }
76
77private:
78 llvm::SmallVector<QualType> CollectedTypes;
79
80 void collect(const FunctionDecl *FD, QualType RetType) {
81 if (!FD)
82 return;
84
85 if (const auto *MD = dyn_cast<CXXMethodDecl>(FD);
86 MD && MD->isInstance() && !isa<CXXConstructorDecl>(MD) &&
88 CollectedTypes.push_back(RetType);
89 return;
90 }
91
92 for (const auto *Param : FD->parameters()) {
93 if (Param->hasAttr<LifetimeBoundAttr>()) {
94 CollectedTypes.push_back(RetType);
95 return;
96 }
97 }
98 }
99};
100
101} // namespace
102
103bool OriginManager::hasOrigins(QualType QT, bool IntrinsicOnly) const {
105 return true;
106 if (!IntrinsicOnly &&
107 LifetimeAnnotatedOriginTypes.contains(QT.getCanonicalType().getTypePtr()))
108 return true;
109 const auto *RD = QT->getAsCXXRecordDecl();
110 if (!RD)
111 return false;
112 // Standard library callable wrappers (e.g., std::function) can propagate the
113 // stored lambda's origins.
115 return true;
116 // TODO: Limit to lambdas for now. This will be extended to user-defined
117 // structs with pointer-like fields.
118 if (!RD->isLambda())
119 return false;
120 for (const auto *FD : RD->fields())
121 if (hasOrigins(FD->getType(), IntrinsicOnly))
122 return true;
123 return false;
124}
125
126/// Determines if an expression has origins that need to be tracked.
127///
128/// An expression has origins if:
129/// - It's a glvalue (has addressable storage), OR
130/// - Its type is pointer-like (pointer, reference, or gsl::Pointer), OR
131/// - Its type is registered for origin tracking (e.g., return type of a
132/// [[clang::lifetimebound]] function)
133///
134/// Examples:
135/// - `int x; x` : has origin (glvalue)
136/// - `int* p; p` : has 2 origins (1 for glvalue and 1 for pointer type)
137/// - `std::string_view{}` : has 1 origin (prvalue of pointer type)
138/// - `42` : no origin (prvalue of non-pointer type)
139/// - `x + y` : (where x, y are int) → no origin (prvalue of non-pointer type)
140bool OriginManager::hasOrigins(const Expr *E) const {
141 return E->isGLValue() || hasOrigins(E->getType());
142}
143
144/// Returns true if the declaration has its own storage that can be borrowed.
145///
146/// References generally have no storage - they are aliases to other storage.
147/// For example:
148/// int x; // has storage (can issue loans to x's storage)
149/// int& r = x; // no storage (r is an alias to x's storage)
150/// int* p; // has storage (the pointer variable p itself has storage)
151///
152/// TODO: Handle lifetime extension. References initialized by temporaries
153/// can have storage when the temporary's lifetime is extended:
154/// const int& r = 42; // temporary has storage, lifetime extended
155/// Foo&& f = Foo{}; // temporary has storage, lifetime extended
156/// Currently, this function returns false for all reference types.
158 return !D->getType()->isReferenceType();
159}
160
162 : AST(AC.getASTContext()) {
163 collectLifetimeAnnotatedOriginTypes(AC);
164 initializeThisOrigins(AC.getDecl());
165}
166
167void OriginManager::initializeThisOrigins(const Decl *D) {
168 const auto *MD = llvm::dyn_cast_or_null<CXXMethodDecl>(D);
169 if (!MD || !MD->isInstance())
170 return;
171 // Lambdas can capture 'this' from the surrounding context, but in that case
172 // 'this' does not refer to the lambda object itself.
173 if (const CXXRecordDecl *P = MD->getParent(); P && P->isLambda())
174 return;
175 ThisOrigins = buildListForType(MD->getThisType(), MD);
176}
177
178OriginList *OriginManager::createNode(const ValueDecl *D, QualType QT) {
179 OriginID NewID = getNextOriginID();
180 AllOrigins.emplace_back(NewID, D, QT.getTypePtrOrNull());
181 return new (ListAllocator.Allocate<OriginList>()) OriginList(NewID);
182}
183
184OriginList *OriginManager::createNode(const Expr *E, QualType QT) {
185 OriginID NewID = getNextOriginID();
186 AllOrigins.emplace_back(NewID, E, QT.getTypePtrOrNull());
187 return new (ListAllocator.Allocate<OriginList>()) OriginList(NewID);
188}
189
191 return new (ListAllocator.Allocate<OriginList>()) OriginList(OID);
192}
193
194template <typename T>
195OriginList *OriginManager::buildListForType(QualType QT, const T *Node) {
196 assert(hasOrigins(QT) && "buildListForType called for non-pointer type");
197 OriginList *Head = createNode(Node, QT);
198
199 if (QT->isPointerOrReferenceType()) {
200 QualType PointeeTy = QT->getPointeeType();
201 // We recurse if the pointee type is pointer-like, to build the next
202 // level in the origin tree. E.g., for T*& / View&.
203 if (hasOrigins(PointeeTy))
204 Head->setInnerOriginList(buildListForType(PointeeTy, Node));
205 }
206 return Head;
207}
208
210 if (!hasOrigins(D->getType()))
211 return nullptr;
212 auto It = DeclToList.find(D);
213 if (It != DeclToList.end())
214 return It->second;
215 return DeclToList[D] = buildListForType(D->getType(), D);
216}
217
219 if (auto *ParenIgnored = E->IgnoreParens(); ParenIgnored != E)
220 return getOrCreateList(ParenIgnored);
221 // We do not see CFG stmts for ExprWithCleanups. Simply peel them.
222 if (const ExprWithCleanups *EWC = dyn_cast<ExprWithCleanups>(E))
223 return getOrCreateList(EWC->getSubExpr());
224
225 // An OpaqueValueExpr is a placeholder for an already-evaluated subexpression
226 // (e.g. the common operand of `a ?: b`) and is not itself a CFG statement, so
227 // reuse its source's origins rather than flowing into a fresh node.
228 if (const auto *OVE = dyn_cast<OpaqueValueExpr>(E))
229 if (const Expr *Src = OVE->getSourceExpr())
230 return getOrCreateList(Src);
231
232 if (!hasOrigins(E))
233 return nullptr;
234
235 auto It = ExprToList.find(E);
236 if (It != ExprToList.end())
237 return It->second;
238
239 QualType Type = E->getType();
240 // Special handling for 'this' expressions to share origins with the method's
241 // implicit object parameter.
242 if (isa<CXXThisExpr>(E) && ThisOrigins)
243 return *ThisOrigins;
244
245 // Special handling for expressions referring to a decl to share origins with
246 // the underlying decl.
247 const ValueDecl *ReferencedDecl = nullptr;
248 if (auto *DRE = dyn_cast<DeclRefExpr>(E))
249 ReferencedDecl = DRE->getDecl();
250 else if (auto *ME = dyn_cast<MemberExpr>(E))
251 if (auto *Field = dyn_cast<FieldDecl>(ME->getMemberDecl());
252 Field && isa<CXXThisExpr>(ME->getBase()->IgnoreParenImpCasts()))
253 ReferencedDecl = Field;
254 if (ReferencedDecl) {
255 OriginList *Head = nullptr;
256 // For non-reference declarations (e.g., `int* p`), the expression is an
257 // lvalue (addressable) that can be borrowed, so we create an outer origin
258 // for the lvalue itself, with the pointee being the declaration's list.
259 // This models taking the address: `&p` borrows the storage of `p`, not what
260 // `p` points to.
261 if (doesDeclHaveStorage(ReferencedDecl)) {
262 Head = createNode(E, QualType{});
263 // This ensures origin sharing: multiple expressions to the same
264 // declaration share the same underlying origins.
265 Head->setInnerOriginList(getOrCreateList(ReferencedDecl));
266 } else {
267 // For reference-typed declarations (e.g., `int& r = p`) which have no
268 // storage, the DeclRefExpr directly reuses the declaration's list since
269 // references don't add an extra level of indirection at the expression
270 // level.
271 Head = getOrCreateList(ReferencedDecl);
272 }
273 return ExprToList[E] = Head;
274 }
275
276 // If E is an lvalue , it refers to storage. We model this storage as the
277 // first level of origin list, as if it were a reference, because l-values are
278 // addressable.
279 if (E->isGLValue() && !Type->isReferenceType())
280 Type = AST.getLValueReferenceType(Type);
281 return ExprToList[E] = buildListForType(Type, E);
282}
283
284void OriginManager::dump(OriginID OID, llvm::raw_ostream &OS) const {
285 OS << OID << " (";
286 Origin O = getOrigin(OID);
287 if (const ValueDecl *VD = O.getDecl()) {
288 OS << "Decl: " << VD->getNameAsString();
289 } else if (const Expr *E = O.getExpr()) {
290 OS << "Expr: " << E->getStmtClassName();
291 if (auto *DRE = dyn_cast<DeclRefExpr>(E)) {
292 if (const ValueDecl *VD = DRE->getDecl())
293 OS << ", Decl: " << VD->getNameAsString();
294 }
295 } else {
296 OS << "Unknown";
297 }
298 if (O.Ty)
299 OS << ", Type : " << QualType(O.Ty, 0).getAsString();
300 OS << ")";
301}
302
304 assert(ID.Value < AllOrigins.size());
305 return AllOrigins[ID.Value];
306}
307
309 LifetimeSafetyStats &LSStats) {
310 MissingOriginCollector Collector(this->ExprToList, *this, LSStats);
311 Collector.TraverseStmt(const_cast<Stmt *>(&FunctionBody));
312}
313
314void OriginManager::collectLifetimeAnnotatedOriginTypes(
315 const AnalysisDeclContext &AC) {
316 LifetimeAnnotatedOriginTypeCollector Collector;
317 if (Stmt *Body = AC.getBody())
318 Collector.TraverseStmt(Body);
319 if (const auto *CD = dyn_cast<CXXConstructorDecl>(AC.getDecl()))
320 for (const auto *Init : CD->inits())
321 Collector.TraverseStmt(Init->getInit());
322 for (QualType QT : Collector.getCollectedTypes())
323 registerLifetimeAnnotatedOriginType(QT);
324}
325
326void OriginManager::registerLifetimeAnnotatedOriginType(QualType QT) {
327 if (!QT->getAsCXXRecordDecl() || hasOrigins(QT))
328 return;
329
330 LifetimeAnnotatedOriginTypes.insert(QT.getCanonicalType().getTypePtr());
331}
332
333} // namespace clang::lifetimes::internal
Defines the clang::ASTContext interface.
This file defines AnalysisDeclContext, a class that manages the analysis context data for context sen...
Defines the C++ Decl subclasses, other than those for templates (found in DeclTemplate....
Defines the C++ template declaration subclasses.
Defines the clang::Expr interface and subclasses for C++ expressions.
C Language Family Type Representation.
AnalysisDeclContext contains the context data for the function, method or block under analysis.
Represents a C++ struct/union/class.
Definition DeclCXX.h:258
DeclContext * getParent()
getParent - Returns the containing DeclContext.
Definition DeclBase.h:2122
Decl - This represents one declaration (or definition), e.g.
Definition DeclBase.h:86
Represents an expression – generally a full-expression – that introduces cleanups to be run at the en...
Definition ExprCXX.h:3661
This represents one expression.
Definition Expr.h:112
bool isGLValue() const
Definition Expr.h:287
Expr * IgnoreParens() LLVM_READONLY
Skip past any parentheses which might surround this expression until reaching a fixed point.
Definition Expr.cpp:3095
QualType getType() const
Definition Expr.h:144
A (possibly-)qualified type.
Definition TypeBase.h:937
const Type * getTypePtr() const
Retrieves a pointer to the underlying (unqualified) type.
Definition TypeBase.h:8447
QualType getCanonicalType() const
Definition TypeBase.h:8499
const Type * getTypePtrOrNull() const
Definition TypeBase.h:8451
static std::string getAsString(SplitQualType split, const PrintingPolicy &Policy)
Definition TypeBase.h:1347
Stmt - This represents one statement.
Definition Stmt.h:86
const char * getStmtClassName() const
Definition Stmt.cpp:86
The base class of the type hierarchy.
Definition TypeBase.h:1875
CXXRecordDecl * getAsCXXRecordDecl() const
Retrieves the CXXRecordDecl that this type refers to, either because the type is a RecordType or beca...
Definition Type.h:26
bool isReferenceType() const
Definition TypeBase.h:8708
QualType getPointeeType() const
If this is a pointer, ObjC object pointer, or block pointer, this returns the respective pointee.
Definition Type.cpp:789
bool isPointerOrReferenceType() const
Definition TypeBase.h:8688
Represent the declaration of a variable (in which case it is an lvalue) a function (in which case it ...
Definition Decl.h:712
QualType getType() const
Definition Decl.h:723
A list of origins representing levels of indirection for pointer-like types.
Definition Origins.h:95
void setInnerOriginList(OriginList *Inner)
Definition Origins.h:102
OriginList * getOrCreateList(const ValueDecl *D)
Gets or creates the OriginList for a given ValueDecl.
Definition Origins.cpp:209
OriginList * createSingleOriginList(OriginID OID)
Wraps an existing OriginID in a new single-element OriginList, so a fact can refer to a single level ...
Definition Origins.cpp:190
const Origin & getOrigin(OriginID ID) const
Definition Origins.cpp:303
void collectMissingOrigins(Stmt &FunctionBody, LifetimeSafetyStats &LSStats)
Collects statistics about expressions that lack associated origins.
Definition Origins.cpp:308
OriginManager(const AnalysisDeclContext &AC)
Definition Origins.cpp:161
void dump(OriginID OID, llvm::raw_ostream &OS) const
Definition Origins.cpp:284
bool hasOrigins(QualType QT, bool IntrinsicOnly=false) const
Determines whether a type can carry lifetime origins.
Definition Origins.cpp:103
utils::ID< struct OriginTag > OriginID
Definition Origins.h:28
bool doesDeclHaveStorage(const ValueDecl *D)
Returns true if the declaration has its own storage that can be borrowed.
Definition Origins.cpp:157
bool isGslPointerType(QualType QT)
bool isStdCallableWrapperType(const CXXRecordDecl *RD)
bool implicitObjectParamIsLifetimeBound(const FunctionDecl *FD)
const FunctionDecl * getDeclWithMergedLifetimeBoundAttrs(const FunctionDecl *FD)
bool isa(CodeGen::Address addr)
Definition Address.h:330
A structure to hold the statistics related to LifetimeAnalysis.
An Origin is a symbolic identifier that represents the set of possible loans a pointer-like object co...
Definition Origins.h:40
const clang::Expr * getExpr() const
Definition Origins.h:64
const clang::ValueDecl * getDecl() const
Definition Origins.h:61
const Type * Ty
The type at this indirection level.
Definition Origins.h:54