clang 23.0.0git
Origins.cpp
Go to the documentation of this file.
1//===- Origins.cpp - Origin Implementation -----------------------*- C++-*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
11#include "clang/AST/Attr.h"
12#include "clang/AST/Decl.h"
13#include "clang/AST/DeclCXX.h"
15#include "clang/AST/Expr.h"
16#include "clang/AST/ExprCXX.h"
18#include "clang/AST/TypeBase.h"
22#include "llvm/ADT/StringMap.h"
23
25namespace {
26/// A utility class to traverse the function body in the analysis
27/// context and collect the count of expressions with missing origins.
28class MissingOriginCollector
29 : public RecursiveASTVisitor<MissingOriginCollector> {
30public:
31 MissingOriginCollector(
32 const llvm::DenseMap<const clang::Expr *, OriginList *> &ExprToOriginList,
33 const OriginManager &OM, LifetimeSafetyStats &LSStats)
34 : ExprToOriginList(ExprToOriginList), OM(OM), LSStats(LSStats) {}
35 bool VisitExpr(Expr *E) {
36 if (!OM.hasOrigins(E))
37 return true;
38 // Check if we have an origin for this expression.
39 if (!ExprToOriginList.contains(E)) {
40 // No origin found: count this as missing origin.
41 LSStats.ExprTypeToMissingOriginCount[E->getType().getTypePtr()]++;
42 LSStats.ExprStmtClassToMissingOriginCount[std::string(
43 E->getStmtClassName())]++;
44 }
45 return true;
46 }
47
48private:
49 const llvm::DenseMap<const clang::Expr *, OriginList *> &ExprToOriginList;
50 const OriginManager &OM;
51 LifetimeSafetyStats &LSStats;
52};
53
54class LifetimeAnnotatedOriginTypeCollector
55 : public RecursiveASTVisitor<LifetimeAnnotatedOriginTypeCollector> {
56public:
57 bool VisitCallExpr(const CallExpr *CE) {
58 // Indirect calls (e.g., function pointers) are skipped because lifetime
59 // annotations currently apply to declarations, not types.
60 if (const auto *FD = CE->getDirectCallee())
61 collect(FD, FD->getReturnType());
62 return true;
63 }
64
65 bool VisitCXXConstructExpr(const CXXConstructExpr *CCE) {
66 collect(CCE->getConstructor(), CCE->getType());
67 return true;
68 }
69
70 bool shouldVisitLambdaBody() const { return false; }
71
72 const llvm::SmallVector<QualType> &getCollectedTypes() const {
73 return CollectedTypes;
74 }
75
76private:
77 llvm::SmallVector<QualType> CollectedTypes;
78
79 void collect(const FunctionDecl *FD, QualType RetType) {
80 if (!FD)
81 return;
83
84 if (const auto *MD = dyn_cast<CXXMethodDecl>(FD);
85 MD && MD->isInstance() && !isa<CXXConstructorDecl>(MD) &&
87 CollectedTypes.push_back(RetType);
88 return;
89 }
90
91 for (const auto *Param : FD->parameters()) {
92 if (Param->hasAttr<LifetimeBoundAttr>()) {
93 CollectedTypes.push_back(RetType);
94 return;
95 }
96 }
97 }
98};
99
100} // namespace
101
104 return true;
105 if (LifetimeAnnotatedOriginTypes.contains(QT.getCanonicalType().getTypePtr()))
106 return true;
107 const auto *RD = QT->getAsCXXRecordDecl();
108 if (!RD)
109 return false;
110 // Standard library callable wrappers (e.g., std::function) can propagate the
111 // stored lambda's origins.
113 return true;
114 // TODO: Limit to lambdas for now. This will be extended to user-defined
115 // structs with pointer-like fields.
116 if (!RD->isLambda())
117 return false;
118 for (const auto *FD : RD->fields())
119 if (hasOrigins(FD->getType()))
120 return true;
121 return false;
122}
123
124/// Determines if an expression has origins that need to be tracked.
125///
126/// An expression has origins if:
127/// - It's a glvalue (has addressable storage), OR
128/// - Its type is pointer-like (pointer, reference, or gsl::Pointer), OR
129/// - Its type is registered for origin tracking (e.g., return type of a
130/// [[clang::lifetimebound]] function)
131///
132/// Examples:
133/// - `int x; x` : has origin (glvalue)
134/// - `int* p; p` : has 2 origins (1 for glvalue and 1 for pointer type)
135/// - `std::string_view{}` : has 1 origin (prvalue of pointer type)
136/// - `42` : no origin (prvalue of non-pointer type)
137/// - `x + y` : (where x, y are int) → no origin (prvalue of non-pointer type)
138bool OriginManager::hasOrigins(const Expr *E) const {
139 return E->isGLValue() || hasOrigins(E->getType());
140}
141
142/// Returns true if the declaration has its own storage that can be borrowed.
143///
144/// References generally have no storage - they are aliases to other storage.
145/// For example:
146/// int x; // has storage (can issue loans to x's storage)
147/// int& r = x; // no storage (r is an alias to x's storage)
148/// int* p; // has storage (the pointer variable p itself has storage)
149///
150/// TODO: Handle lifetime extension. References initialized by temporaries
151/// can have storage when the temporary's lifetime is extended:
152/// const int& r = 42; // temporary has storage, lifetime extended
153/// Foo&& f = Foo{}; // temporary has storage, lifetime extended
154/// Currently, this function returns false for all reference types.
156 return !D->getType()->isReferenceType();
157}
158
160 : AST(AC.getASTContext()) {
161 collectLifetimeAnnotatedOriginTypes(AC);
162 initializeThisOrigins(AC.getDecl());
163}
164
165void OriginManager::initializeThisOrigins(const Decl *D) {
166 const auto *MD = llvm::dyn_cast_or_null<CXXMethodDecl>(D);
167 if (!MD || !MD->isInstance())
168 return;
169 // Lambdas can capture 'this' from the surrounding context, but in that case
170 // 'this' does not refer to the lambda object itself.
171 if (const CXXRecordDecl *P = MD->getParent(); P && P->isLambda())
172 return;
173 ThisOrigins = buildListForType(MD->getThisType(), MD);
174}
175
176OriginList *OriginManager::createNode(const ValueDecl *D, QualType QT) {
177 OriginID NewID = getNextOriginID();
178 AllOrigins.emplace_back(NewID, D, QT.getTypePtrOrNull());
179 return new (ListAllocator.Allocate<OriginList>()) OriginList(NewID);
180}
181
182OriginList *OriginManager::createNode(const Expr *E, QualType QT) {
183 OriginID NewID = getNextOriginID();
184 AllOrigins.emplace_back(NewID, E, QT.getTypePtrOrNull());
185 return new (ListAllocator.Allocate<OriginList>()) OriginList(NewID);
186}
187
189 return new (ListAllocator.Allocate<OriginList>()) OriginList(OID);
190}
191
192template <typename T>
193OriginList *OriginManager::buildListForType(QualType QT, const T *Node) {
194 assert(hasOrigins(QT) && "buildListForType called for non-pointer type");
195 OriginList *Head = createNode(Node, QT);
196
197 if (QT->isPointerOrReferenceType()) {
198 QualType PointeeTy = QT->getPointeeType();
199 // We recurse if the pointee type is pointer-like, to build the next
200 // level in the origin tree. E.g., for T*& / View&.
201 if (hasOrigins(PointeeTy))
202 Head->setInnerOriginList(buildListForType(PointeeTy, Node));
203 }
204 return Head;
205}
206
208 if (!hasOrigins(D->getType()))
209 return nullptr;
210 auto It = DeclToList.find(D);
211 if (It != DeclToList.end())
212 return It->second;
213 return DeclToList[D] = buildListForType(D->getType(), D);
214}
215
217 if (auto *ParenIgnored = E->IgnoreParens(); ParenIgnored != E)
218 return getOrCreateList(ParenIgnored);
219 // We do not see CFG stmts for ExprWithCleanups. Simply peel them.
220 if (const ExprWithCleanups *EWC = dyn_cast<ExprWithCleanups>(E))
221 return getOrCreateList(EWC->getSubExpr());
222
223 if (!hasOrigins(E))
224 return nullptr;
225
226 auto It = ExprToList.find(E);
227 if (It != ExprToList.end())
228 return It->second;
229
230 QualType Type = E->getType();
231 // Special handling for 'this' expressions to share origins with the method's
232 // implicit object parameter.
233 if (isa<CXXThisExpr>(E) && ThisOrigins)
234 return *ThisOrigins;
235
236 // Special handling for expressions referring to a decl to share origins with
237 // the underlying decl.
238 const ValueDecl *ReferencedDecl = nullptr;
239 if (auto *DRE = dyn_cast<DeclRefExpr>(E))
240 ReferencedDecl = DRE->getDecl();
241 else if (auto *ME = dyn_cast<MemberExpr>(E))
242 if (auto *Field = dyn_cast<FieldDecl>(ME->getMemberDecl());
243 Field && isa<CXXThisExpr>(ME->getBase()->IgnoreParenImpCasts()))
244 ReferencedDecl = Field;
245 if (ReferencedDecl) {
246 OriginList *Head = nullptr;
247 // For non-reference declarations (e.g., `int* p`), the expression is an
248 // lvalue (addressable) that can be borrowed, so we create an outer origin
249 // for the lvalue itself, with the pointee being the declaration's list.
250 // This models taking the address: `&p` borrows the storage of `p`, not what
251 // `p` points to.
252 if (doesDeclHaveStorage(ReferencedDecl)) {
253 Head = createNode(E, QualType{});
254 // This ensures origin sharing: multiple expressions to the same
255 // declaration share the same underlying origins.
256 Head->setInnerOriginList(getOrCreateList(ReferencedDecl));
257 } else {
258 // For reference-typed declarations (e.g., `int& r = p`) which have no
259 // storage, the DeclRefExpr directly reuses the declaration's list since
260 // references don't add an extra level of indirection at the expression
261 // level.
262 Head = getOrCreateList(ReferencedDecl);
263 }
264 return ExprToList[E] = Head;
265 }
266
267 // If E is an lvalue , it refers to storage. We model this storage as the
268 // first level of origin list, as if it were a reference, because l-values are
269 // addressable.
270 if (E->isGLValue() && !Type->isReferenceType())
271 Type = AST.getLValueReferenceType(Type);
272 return ExprToList[E] = buildListForType(Type, E);
273}
274
275void OriginManager::dump(OriginID OID, llvm::raw_ostream &OS) const {
276 OS << OID << " (";
277 Origin O = getOrigin(OID);
278 if (const ValueDecl *VD = O.getDecl()) {
279 OS << "Decl: " << VD->getNameAsString();
280 } else if (const Expr *E = O.getExpr()) {
281 OS << "Expr: " << E->getStmtClassName();
282 if (auto *DRE = dyn_cast<DeclRefExpr>(E)) {
283 if (const ValueDecl *VD = DRE->getDecl())
284 OS << ", Decl: " << VD->getNameAsString();
285 }
286 } else {
287 OS << "Unknown";
288 }
289 if (O.Ty)
290 OS << ", Type : " << QualType(O.Ty, 0).getAsString();
291 OS << ")";
292}
293
295 assert(ID.Value < AllOrigins.size());
296 return AllOrigins[ID.Value];
297}
298
300 LifetimeSafetyStats &LSStats) {
301 MissingOriginCollector Collector(this->ExprToList, *this, LSStats);
302 Collector.TraverseStmt(const_cast<Stmt *>(&FunctionBody));
303}
304
305void OriginManager::collectLifetimeAnnotatedOriginTypes(
306 const AnalysisDeclContext &AC) {
307 LifetimeAnnotatedOriginTypeCollector Collector;
308 if (Stmt *Body = AC.getBody())
309 Collector.TraverseStmt(Body);
310 if (const auto *CD = dyn_cast<CXXConstructorDecl>(AC.getDecl()))
311 for (const auto *Init : CD->inits())
312 Collector.TraverseStmt(Init->getInit());
313 for (QualType QT : Collector.getCollectedTypes())
314 registerLifetimeAnnotatedOriginType(QT);
315}
316
317void OriginManager::registerLifetimeAnnotatedOriginType(QualType QT) {
318 if (!QT->getAsCXXRecordDecl() || hasOrigins(QT))
319 return;
320
321 LifetimeAnnotatedOriginTypes.insert(QT.getCanonicalType().getTypePtr());
322}
323
324} // namespace clang::lifetimes::internal
Defines the clang::ASTContext interface.
This file defines AnalysisDeclContext, a class that manages the analysis context data for context sen...
Defines the C++ Decl subclasses, other than those for templates (found in DeclTemplate....
Defines the C++ template declaration subclasses.
Defines the clang::Expr interface and subclasses for C++ expressions.
C Language Family Type Representation.
AnalysisDeclContext contains the context data for the function, method or block under analysis.
Represents a C++ struct/union/class.
Definition DeclCXX.h:258
DeclContext * getParent()
getParent - Returns the containing DeclContext.
Definition DeclBase.h:2122
Decl - This represents one declaration (or definition), e.g.
Definition DeclBase.h:86
Represents an expression – generally a full-expression – that introduces cleanups to be run at the en...
Definition ExprCXX.h:3658
This represents one expression.
Definition Expr.h:112
bool isGLValue() const
Definition Expr.h:287
Expr * IgnoreParens() LLVM_READONLY
Skip past any parentheses which might surround this expression until reaching a fixed point.
Definition Expr.cpp:3086
QualType getType() const
Definition Expr.h:144
A (possibly-)qualified type.
Definition TypeBase.h:937
const Type * getTypePtr() const
Retrieves a pointer to the underlying (unqualified) type.
Definition TypeBase.h:8431
QualType getCanonicalType() const
Definition TypeBase.h:8483
const Type * getTypePtrOrNull() const
Definition TypeBase.h:8435
static std::string getAsString(SplitQualType split, const PrintingPolicy &Policy)
Definition TypeBase.h:1338
Stmt - This represents one statement.
Definition Stmt.h:86
const char * getStmtClassName() const
Definition Stmt.cpp:86
The base class of the type hierarchy.
Definition TypeBase.h:1866
CXXRecordDecl * getAsCXXRecordDecl() const
Retrieves the CXXRecordDecl that this type refers to, either because the type is a RecordType or beca...
Definition Type.h:26
bool isReferenceType() const
Definition TypeBase.h:8692
QualType getPointeeType() const
If this is a pointer, ObjC object pointer, or block pointer, this returns the respective pointee.
Definition Type.cpp:754
bool isPointerOrReferenceType() const
Definition TypeBase.h:8672
Represent the declaration of a variable (in which case it is an lvalue) a function (in which case it ...
Definition Decl.h:712
QualType getType() const
Definition Decl.h:723
A list of origins representing levels of indirection for pointer-like types.
Definition Origins.h:95
void setInnerOriginList(OriginList *Inner)
Definition Origins.h:102
OriginList * getOrCreateList(const ValueDecl *D)
Gets or creates the OriginList for a given ValueDecl.
Definition Origins.cpp:207
OriginList * createSingleOriginList(OriginID OID)
Wraps an existing OriginID in a new single-element OriginList, so a fact can refer to a single level ...
Definition Origins.cpp:188
const Origin & getOrigin(OriginID ID) const
Definition Origins.cpp:294
void collectMissingOrigins(Stmt &FunctionBody, LifetimeSafetyStats &LSStats)
Collects statistics about expressions that lack associated origins.
Definition Origins.cpp:299
OriginManager(const AnalysisDeclContext &AC)
Definition Origins.cpp:159
void dump(OriginID OID, llvm::raw_ostream &OS) const
Definition Origins.cpp:275
utils::ID< struct OriginTag > OriginID
Definition Origins.h:28
bool doesDeclHaveStorage(const ValueDecl *D)
Returns true if the declaration has its own storage that can be borrowed.
Definition Origins.cpp:155
bool isGslPointerType(QualType QT)
bool isStdCallableWrapperType(const CXXRecordDecl *RD)
bool implicitObjectParamIsLifetimeBound(const FunctionDecl *FD)
const FunctionDecl * getDeclWithMergedLifetimeBoundAttrs(const FunctionDecl *FD)
bool isa(CodeGen::Address addr)
Definition Address.h:330
A structure to hold the statistics related to LifetimeAnalysis.
An Origin is a symbolic identifier that represents the set of possible loans a pointer-like object co...
Definition Origins.h:40
const clang::Expr * getExpr() const
Definition Origins.h:64
const clang::ValueDecl * getDecl() const
Definition Origins.h:61
const Type * Ty
The type at this indirection level.
Definition Origins.h:54