clang 23.0.0git
Origins.cpp
Go to the documentation of this file.
1//===- Origins.cpp - Origin Implementation -----------------------*- C++-*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
11#include "clang/AST/Attr.h"
12#include "clang/AST/Decl.h"
13#include "clang/AST/DeclCXX.h"
15#include "clang/AST/Expr.h"
16#include "clang/AST/ExprCXX.h"
18#include "clang/AST/TypeBase.h"
22#include "llvm/ADT/StringMap.h"
23
25namespace {
26/// A utility class to traverse the function body in the analysis
27/// context and collect the count of expressions with missing origins.
28class MissingOriginCollector
29 : public RecursiveASTVisitor<MissingOriginCollector> {
30public:
31 MissingOriginCollector(
32 const llvm::DenseMap<const clang::Expr *, OriginList *> &ExprToOriginList,
33 const OriginManager &OM, LifetimeSafetyStats &LSStats)
34 : ExprToOriginList(ExprToOriginList), OM(OM), LSStats(LSStats) {}
35 bool VisitExpr(Expr *E) {
36 if (!OM.hasOrigins(E))
37 return true;
38 // Check if we have an origin for this expression.
39 if (!ExprToOriginList.contains(E)) {
40 // No origin found: count this as missing origin.
41 LSStats.ExprTypeToMissingOriginCount[E->getType().getTypePtr()]++;
42 LSStats.ExprStmtClassToMissingOriginCount[std::string(
43 E->getStmtClassName())]++;
44 }
45 return true;
46 }
47
48private:
49 const llvm::DenseMap<const clang::Expr *, OriginList *> &ExprToOriginList;
50 const OriginManager &OM;
51 LifetimeSafetyStats &LSStats;
52};
53
54class LifetimeAnnotatedOriginTypeCollector
55 : public RecursiveASTVisitor<LifetimeAnnotatedOriginTypeCollector> {
56public:
57 bool VisitCallExpr(const CallExpr *CE) {
58 // Indirect calls (e.g., function pointers) are skipped because lifetime
59 // annotations currently apply to declarations, not types.
60 if (const auto *FD = CE->getDirectCallee())
61 collect(FD, FD->getReturnType());
62 return true;
63 }
64
65 bool VisitCXXConstructExpr(const CXXConstructExpr *CCE) {
66 collect(CCE->getConstructor(), CCE->getType());
67 return true;
68 }
69
70 bool shouldVisitLambdaBody() const { return false; }
71 bool shouldVisitTemplateInstantiations() const { return true; }
72
73 const llvm::SmallVector<QualType> &getCollectedTypes() const {
74 return CollectedTypes;
75 }
76
77private:
78 llvm::SmallVector<QualType> CollectedTypes;
79
80 void collect(const FunctionDecl *FD, QualType RetType) {
81 if (!FD)
82 return;
84
85 if (const auto *MD = dyn_cast<CXXMethodDecl>(FD);
86 MD && MD->isInstance() && !isa<CXXConstructorDecl>(MD) &&
88 CollectedTypes.push_back(RetType);
89 return;
90 }
91
92 for (const auto *Param : FD->parameters()) {
93 if (Param->hasAttr<LifetimeBoundAttr>()) {
94 CollectedTypes.push_back(RetType);
95 return;
96 }
97 }
98 }
99};
100
101} // namespace
102
103bool OriginManager::hasOrigins(QualType QT, bool IntrinsicOnly) const {
105 return true;
106 if (!IntrinsicOnly &&
107 LifetimeAnnotatedOriginTypes.contains(QT.getCanonicalType().getTypePtr()))
108 return true;
109 const auto *RD = QT->getAsCXXRecordDecl();
110 if (!RD)
111 return false;
112 // Standard library callable wrappers (e.g., std::function) can propagate the
113 // stored lambda's origins.
115 return true;
116 // TODO: Limit to lambdas for now. This will be extended to user-defined
117 // structs with pointer-like fields.
118 if (!RD->isLambda())
119 return false;
120 for (const auto *FD : RD->fields())
121 if (hasOrigins(FD->getType(), IntrinsicOnly))
122 return true;
123 return false;
124}
125
126/// Determines if an expression has origins that need to be tracked.
127///
128/// An expression has origins if:
129/// - It's a glvalue (has addressable storage), OR
130/// - Its type is pointer-like (pointer, reference, or gsl::Pointer), OR
131/// - Its type is registered for origin tracking (e.g., return type of a
132/// [[clang::lifetimebound]] function)
133///
134/// Examples:
135/// - `int x; x` : has origin (glvalue)
136/// - `int* p; p` : has 2 origins (1 for glvalue and 1 for pointer type)
137/// - `std::string_view{}` : has 1 origin (prvalue of pointer type)
138/// - `42` : no origin (prvalue of non-pointer type)
139/// - `x + y` : (where x, y are int) → no origin (prvalue of non-pointer type)
140bool OriginManager::hasOrigins(const Expr *E) const {
141 return E->isGLValue() || hasOrigins(E->getType());
142}
143
144/// Returns true if the declaration has its own storage that can be borrowed.
145///
146/// References generally have no storage - they are aliases to other storage.
147/// For example:
148/// int x; // has storage (can issue loans to x's storage)
149/// int& r = x; // no storage (r is an alias to x's storage)
150/// int* p; // has storage (the pointer variable p itself has storage)
151///
152/// TODO: Handle lifetime extension. References initialized by temporaries
153/// can have storage when the temporary's lifetime is extended:
154/// const int& r = 42; // temporary has storage, lifetime extended
155/// Foo&& f = Foo{}; // temporary has storage, lifetime extended
156/// Currently, this function returns false for all reference types.
158 return !D->getType()->isReferenceType();
159}
160
162 : AST(AC.getASTContext()) {
163 collectLifetimeAnnotatedOriginTypes(AC);
164 initializeThisOrigins(AC.getDecl());
165}
166
167void OriginManager::initializeThisOrigins(const Decl *D) {
168 const auto *MD = llvm::dyn_cast_or_null<CXXMethodDecl>(D);
169 if (!MD || !MD->isInstance())
170 return;
171 // Lambdas can capture 'this' from the surrounding context, but in that case
172 // 'this' does not refer to the lambda object itself.
173 if (const CXXRecordDecl *P = MD->getParent(); P && P->isLambda())
174 return;
175 ThisOrigins = buildListForType(MD->getThisType(), MD);
176}
177
178OriginList *OriginManager::createNode(const ValueDecl *D, QualType QT) {
179 OriginID NewID = getNextOriginID();
180 AllOrigins.emplace_back(NewID, D, QT.getTypePtrOrNull());
181 return new (ListAllocator.Allocate<OriginList>()) OriginList(NewID);
182}
183
184OriginList *OriginManager::createNode(const Expr *E, QualType QT) {
185 OriginID NewID = getNextOriginID();
186 AllOrigins.emplace_back(NewID, E, QT.getTypePtrOrNull());
187 return new (ListAllocator.Allocate<OriginList>()) OriginList(NewID);
188}
189
191 return new (ListAllocator.Allocate<OriginList>()) OriginList(OID);
192}
193
194template <typename T>
195OriginList *OriginManager::buildListForType(QualType QT, const T *Node) {
196 assert(hasOrigins(QT) && "buildListForType called for non-pointer type");
197 OriginList *Head = createNode(Node, QT);
198
199 if (QT->isPointerOrReferenceType()) {
200 QualType PointeeTy = QT->getPointeeType();
201 // We recurse if the pointee type is pointer-like, to build the next
202 // level in the origin tree. E.g., for T*& / View&.
203 if (hasOrigins(PointeeTy))
204 Head->setInnerOriginList(buildListForType(PointeeTy, Node));
205 }
206 return Head;
207}
208
210 if (!hasOrigins(D->getType()))
211 return nullptr;
212 auto It = DeclToList.find(D);
213 if (It != DeclToList.end())
214 return It->second;
215 return DeclToList[D] = buildListForType(D->getType(), D);
216}
217
219 if (auto *ParenIgnored = E->IgnoreParens(); ParenIgnored != E)
220 return getOrCreateList(ParenIgnored);
221 // We do not see CFG stmts for ExprWithCleanups. Simply peel them.
222 if (const ExprWithCleanups *EWC = dyn_cast<ExprWithCleanups>(E))
223 return getOrCreateList(EWC->getSubExpr());
224
225 if (!hasOrigins(E))
226 return nullptr;
227
228 auto It = ExprToList.find(E);
229 if (It != ExprToList.end())
230 return It->second;
231
232 QualType Type = E->getType();
233 // Special handling for 'this' expressions to share origins with the method's
234 // implicit object parameter.
235 if (isa<CXXThisExpr>(E) && ThisOrigins)
236 return *ThisOrigins;
237
238 // Special handling for expressions referring to a decl to share origins with
239 // the underlying decl.
240 const ValueDecl *ReferencedDecl = nullptr;
241 if (auto *DRE = dyn_cast<DeclRefExpr>(E))
242 ReferencedDecl = DRE->getDecl();
243 else if (auto *ME = dyn_cast<MemberExpr>(E))
244 if (auto *Field = dyn_cast<FieldDecl>(ME->getMemberDecl());
245 Field && isa<CXXThisExpr>(ME->getBase()->IgnoreParenImpCasts()))
246 ReferencedDecl = Field;
247 if (ReferencedDecl) {
248 OriginList *Head = nullptr;
249 // For non-reference declarations (e.g., `int* p`), the expression is an
250 // lvalue (addressable) that can be borrowed, so we create an outer origin
251 // for the lvalue itself, with the pointee being the declaration's list.
252 // This models taking the address: `&p` borrows the storage of `p`, not what
253 // `p` points to.
254 if (doesDeclHaveStorage(ReferencedDecl)) {
255 Head = createNode(E, QualType{});
256 // This ensures origin sharing: multiple expressions to the same
257 // declaration share the same underlying origins.
258 Head->setInnerOriginList(getOrCreateList(ReferencedDecl));
259 } else {
260 // For reference-typed declarations (e.g., `int& r = p`) which have no
261 // storage, the DeclRefExpr directly reuses the declaration's list since
262 // references don't add an extra level of indirection at the expression
263 // level.
264 Head = getOrCreateList(ReferencedDecl);
265 }
266 return ExprToList[E] = Head;
267 }
268
269 // If E is an lvalue , it refers to storage. We model this storage as the
270 // first level of origin list, as if it were a reference, because l-values are
271 // addressable.
272 if (E->isGLValue() && !Type->isReferenceType())
273 Type = AST.getLValueReferenceType(Type);
274 return ExprToList[E] = buildListForType(Type, E);
275}
276
277void OriginManager::dump(OriginID OID, llvm::raw_ostream &OS) const {
278 OS << OID << " (";
279 Origin O = getOrigin(OID);
280 if (const ValueDecl *VD = O.getDecl()) {
281 OS << "Decl: " << VD->getNameAsString();
282 } else if (const Expr *E = O.getExpr()) {
283 OS << "Expr: " << E->getStmtClassName();
284 if (auto *DRE = dyn_cast<DeclRefExpr>(E)) {
285 if (const ValueDecl *VD = DRE->getDecl())
286 OS << ", Decl: " << VD->getNameAsString();
287 }
288 } else {
289 OS << "Unknown";
290 }
291 if (O.Ty)
292 OS << ", Type : " << QualType(O.Ty, 0).getAsString();
293 OS << ")";
294}
295
297 assert(ID.Value < AllOrigins.size());
298 return AllOrigins[ID.Value];
299}
300
302 LifetimeSafetyStats &LSStats) {
303 MissingOriginCollector Collector(this->ExprToList, *this, LSStats);
304 Collector.TraverseStmt(const_cast<Stmt *>(&FunctionBody));
305}
306
307void OriginManager::collectLifetimeAnnotatedOriginTypes(
308 const AnalysisDeclContext &AC) {
309 LifetimeAnnotatedOriginTypeCollector Collector;
310 if (Stmt *Body = AC.getBody())
311 Collector.TraverseStmt(Body);
312 if (const auto *CD = dyn_cast<CXXConstructorDecl>(AC.getDecl()))
313 for (const auto *Init : CD->inits())
314 Collector.TraverseStmt(Init->getInit());
315 for (QualType QT : Collector.getCollectedTypes())
316 registerLifetimeAnnotatedOriginType(QT);
317}
318
319void OriginManager::registerLifetimeAnnotatedOriginType(QualType QT) {
320 if (!QT->getAsCXXRecordDecl() || hasOrigins(QT))
321 return;
322
323 LifetimeAnnotatedOriginTypes.insert(QT.getCanonicalType().getTypePtr());
324}
325
326} // namespace clang::lifetimes::internal
Defines the clang::ASTContext interface.
This file defines AnalysisDeclContext, a class that manages the analysis context data for context sen...
Defines the C++ Decl subclasses, other than those for templates (found in DeclTemplate....
Defines the C++ template declaration subclasses.
Defines the clang::Expr interface and subclasses for C++ expressions.
C Language Family Type Representation.
AnalysisDeclContext contains the context data for the function, method or block under analysis.
Represents a C++ struct/union/class.
Definition DeclCXX.h:258
DeclContext * getParent()
getParent - Returns the containing DeclContext.
Definition DeclBase.h:2122
Decl - This represents one declaration (or definition), e.g.
Definition DeclBase.h:86
Represents an expression – generally a full-expression – that introduces cleanups to be run at the en...
Definition ExprCXX.h:3661
This represents one expression.
Definition Expr.h:112
bool isGLValue() const
Definition Expr.h:287
Expr * IgnoreParens() LLVM_READONLY
Skip past any parentheses which might surround this expression until reaching a fixed point.
Definition Expr.cpp:3095
QualType getType() const
Definition Expr.h:144
A (possibly-)qualified type.
Definition TypeBase.h:937
const Type * getTypePtr() const
Retrieves a pointer to the underlying (unqualified) type.
Definition TypeBase.h:8447
QualType getCanonicalType() const
Definition TypeBase.h:8499
const Type * getTypePtrOrNull() const
Definition TypeBase.h:8451
static std::string getAsString(SplitQualType split, const PrintingPolicy &Policy)
Definition TypeBase.h:1347
Stmt - This represents one statement.
Definition Stmt.h:86
const char * getStmtClassName() const
Definition Stmt.cpp:86
The base class of the type hierarchy.
Definition TypeBase.h:1875
CXXRecordDecl * getAsCXXRecordDecl() const
Retrieves the CXXRecordDecl that this type refers to, either because the type is a RecordType or beca...
Definition Type.h:26
bool isReferenceType() const
Definition TypeBase.h:8708
QualType getPointeeType() const
If this is a pointer, ObjC object pointer, or block pointer, this returns the respective pointee.
Definition Type.cpp:789
bool isPointerOrReferenceType() const
Definition TypeBase.h:8688
Represent the declaration of a variable (in which case it is an lvalue) a function (in which case it ...
Definition Decl.h:712
QualType getType() const
Definition Decl.h:723
A list of origins representing levels of indirection for pointer-like types.
Definition Origins.h:95
void setInnerOriginList(OriginList *Inner)
Definition Origins.h:102
OriginList * getOrCreateList(const ValueDecl *D)
Gets or creates the OriginList for a given ValueDecl.
Definition Origins.cpp:209
OriginList * createSingleOriginList(OriginID OID)
Wraps an existing OriginID in a new single-element OriginList, so a fact can refer to a single level ...
Definition Origins.cpp:190
const Origin & getOrigin(OriginID ID) const
Definition Origins.cpp:296
void collectMissingOrigins(Stmt &FunctionBody, LifetimeSafetyStats &LSStats)
Collects statistics about expressions that lack associated origins.
Definition Origins.cpp:301
OriginManager(const AnalysisDeclContext &AC)
Definition Origins.cpp:161
void dump(OriginID OID, llvm::raw_ostream &OS) const
Definition Origins.cpp:277
bool hasOrigins(QualType QT, bool IntrinsicOnly=false) const
Determines whether a type can carry lifetime origins.
Definition Origins.cpp:103
utils::ID< struct OriginTag > OriginID
Definition Origins.h:28
bool doesDeclHaveStorage(const ValueDecl *D)
Returns true if the declaration has its own storage that can be borrowed.
Definition Origins.cpp:157
bool isGslPointerType(QualType QT)
bool isStdCallableWrapperType(const CXXRecordDecl *RD)
bool implicitObjectParamIsLifetimeBound(const FunctionDecl *FD)
const FunctionDecl * getDeclWithMergedLifetimeBoundAttrs(const FunctionDecl *FD)
bool isa(CodeGen::Address addr)
Definition Address.h:330
A structure to hold the statistics related to LifetimeAnalysis.
An Origin is a symbolic identifier that represents the set of possible loans a pointer-like object co...
Definition Origins.h:40
const clang::Expr * getExpr() const
Definition Origins.h:64
const clang::ValueDecl * getDecl() const
Definition Origins.h:61
const Type * Ty
The type at this indirection level.
Definition Origins.h:54