Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
45 commits
Select commit Hold shift + click to select a range
75bfb7a
[𝘀𝗽𝗿] changes to main this commit is based on
melver Sep 4, 2025
b689546
[𝘀𝗽𝗿] initial version
melver Sep 4, 2025
68b4783
[𝘀𝗽𝗿] changes introduced through rebase
melver Sep 4, 2025
cb3d52d
fixup! Insert AllocToken into index.rst
melver Sep 4, 2025
5397b6b
[𝘀𝗽𝗿] changes introduced through rebase
melver Sep 5, 2025
33d18b2
fixup! Switch to fixed MD
melver Sep 5, 2025
14c7544
fixup! fix for incomplete types
melver Sep 8, 2025
7f70661
fixup!
melver Sep 8, 2025
22570af
[𝘀𝗽𝗿] changes introduced through rebase
melver Sep 18, 2025
1358f5a
fixup! address reviewer comments
melver Sep 18, 2025
01f8d55
[𝘀𝗽𝗿] changes introduced through rebase
melver Sep 19, 2025
3b64919
fixup! address reviewer comments round 2
melver Sep 19, 2025
69aad6d
[𝘀𝗽𝗿] changes introduced through rebase
melver Sep 22, 2025
b0e9549
fixup! use update_test_checks.py for opt tests
melver Sep 22, 2025
d5a42a1
[𝘀𝗽𝗿] changes introduced through rebase
melver Sep 23, 2025
ebab546
fixup! do not strip _
melver Sep 23, 2025
7ba5526
[𝘀𝗽𝗿] changes introduced through rebase
melver Sep 26, 2025
fb160db
fixup! address some comments
melver Sep 26, 2025
25ac802
[𝘀𝗽𝗿] changes introduced through rebase
melver Sep 26, 2025
8281324
fixup! address more comments
melver Sep 26, 2025
cb25798
[𝘀𝗽𝗿] changes introduced through rebase
melver Sep 29, 2025
2fa07d7
rebase
melver Sep 29, 2025
8641f7f
[𝘀𝗽𝗿] changes introduced through rebase
melver Sep 30, 2025
9979bca
fixup! address comments
melver Sep 30, 2025
37031e1
[𝘀𝗽𝗿] changes introduced through rebase
melver Oct 2, 2025
ca51a2b
fixup!
melver Oct 2, 2025
946afaa
[𝘀𝗽𝗿] changes introduced through rebase
melver Oct 2, 2025
0cebd94
fixup! switch clang tests back to manually written
melver Oct 2, 2025
f3e8076
[𝘀𝗽𝗿] changes introduced through rebase
melver Oct 7, 2025
fecfe67
rebase
melver Oct 7, 2025
6e1451c
[𝘀𝗽𝗿] changes introduced through rebase
melver Oct 7, 2025
fa2bb2c
rebase
melver Oct 7, 2025
10a1b88
[𝘀𝗽𝗿] changes introduced through rebase
melver Oct 7, 2025
6f6aa54
rebase
melver Oct 7, 2025
8502fcf
[𝘀𝗽𝗿] changes introduced through rebase
melver Oct 7, 2025
6ed5fe6
rebase
melver Oct 7, 2025
5e9458c
[𝘀𝗽𝗿] changes introduced through rebase
melver Oct 7, 2025
346e06d
rebase
melver Oct 7, 2025
fbc5f29
[𝘀𝗽𝗿] changes introduced through rebase
melver Oct 7, 2025
45fb47d
rebase
melver Oct 7, 2025
cfc9648
[𝘀𝗽𝗿] changes introduced through rebase
melver Oct 7, 2025
6225eb5
rebase
melver Oct 7, 2025
43b6898
[𝘀𝗽𝗿] changes introduced through rebase
melver Oct 8, 2025
9574188
rebase
melver Oct 8, 2025
dc6551a
rebase
melver Oct 8, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 7 additions & 2 deletions clang/docs/AllocToken.rst
Original file line number Diff line number Diff line change
Expand Up @@ -31,13 +31,18 @@ Token Assignment Mode

The default mode to calculate tokens is:

* ``typehash``: This mode assigns a token ID based on the hash of the allocated
type's name.
* ``typehashpointersplit``: This mode assigns a token ID based on the hash of
the allocated type's name, where the top half ID-space is reserved for types
that contain pointers and the bottom half for types that do not contain
pointers.

Other token ID assignment modes are supported, but they may be subject to
change or removal. These may (experimentally) be selected with ``-mllvm
-alloc-token-mode=<mode>``:

* ``typehash``: This mode assigns a token ID based on the hash of the allocated
type's name.

* ``random``: This mode assigns a statically-determined random token ID to each
allocation site.

Expand Down
70 changes: 67 additions & 3 deletions clang/lib/CodeGen/CGExpr.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1272,20 +1272,84 @@ void CodeGenFunction::EmitBoundsCheckImpl(const Expr *E, llvm::Value *Bound,
EmitCheck(std::make_pair(Check, CheckKind), CheckHandler, StaticData, Index);
}

static bool
typeContainsPointer(QualType T,
llvm::SmallPtrSet<const RecordDecl *, 4> &VisitedRD,
bool &IncompleteType) {
QualType CanonicalType = T.getCanonicalType();
if (CanonicalType->isPointerType())
return true; // base case

// Look through typedef chain to check for special types.
for (QualType CurrentT = T; const auto *TT = CurrentT->getAs<TypedefType>();
CurrentT = TT->getDecl()->getUnderlyingType()) {
const IdentifierInfo *II = TT->getDecl()->getIdentifier();
// Special Case: Syntactically uintptr_t is not a pointer; semantically,
// however, very likely used as such. Therefore, classify uintptr_t as a
// pointer, too.
if (II && II->isStr("uintptr_t"))
return true;
}

// The type is an array; check the element type.
if (const ArrayType *AT = dyn_cast<ArrayType>(CanonicalType))
return typeContainsPointer(AT->getElementType(), VisitedRD, IncompleteType);
// The type is a struct, class, or union.
if (const RecordDecl *RD = CanonicalType->getAsRecordDecl()) {
if (!RD->isCompleteDefinition()) {
IncompleteType = true;
return false;
}
if (!VisitedRD.insert(RD).second)
return false; // already visited
// Check all fields.
for (const FieldDecl *Field : RD->fields()) {
if (typeContainsPointer(Field->getType(), VisitedRD, IncompleteType))
return true;
}
// For C++ classes, also check base classes.
if (const CXXRecordDecl *CXXRD = dyn_cast<CXXRecordDecl>(RD)) {
// Polymorphic types require a vptr.
if (CXXRD->isDynamicClass())
return true;
for (const CXXBaseSpecifier &Base : CXXRD->bases()) {
if (typeContainsPointer(Base.getType(), VisitedRD, IncompleteType))
return true;
}
}
}
return false;
}

void CodeGenFunction::EmitAllocToken(llvm::CallBase *CB, QualType AllocType) {
assert(SanOpts.has(SanitizerKind::AllocToken) &&
"Only needed with -fsanitize=alloc-token");

llvm::MDBuilder MDB(getLLVMContext());

// Get unique type name.
PrintingPolicy Policy(CGM.getContext().getLangOpts());
Policy.SuppressTagKeyword = true;
Policy.FullyQualifiedName = true;
SmallString<64> TypeName;
llvm::raw_svector_ostream TypeNameOS(TypeName);
AllocType.getCanonicalType().print(TypeNameOS, Policy);
auto *TypeMDS = llvm::MDString::get(CGM.getLLVMContext(), TypeNameOS.str());
auto *TypeNameMD = MDB.createString(TypeNameOS.str());

// Check if QualType contains a pointer. Implements a simple DFS to
// recursively check if a type contains a pointer type.
llvm::SmallPtrSet<const RecordDecl *, 4> VisitedRD;
bool IncompleteType = false;
const bool ContainsPtr =
typeContainsPointer(AllocType, VisitedRD, IncompleteType);
if (!ContainsPtr && IncompleteType)
return;
auto *ContainsPtrC = Builder.getInt1(ContainsPtr);
auto *ContainsPtrMD = MDB.createConstant(ContainsPtrC);

// Format: !{<type-name>}
auto *MDN = llvm::MDNode::get(CGM.getLLVMContext(), {TypeMDS});
// Format: !{<type-name>, <contains-pointer>}
auto *MDN =
llvm::MDNode::get(CGM.getLLVMContext(), {TypeNameMD, ContainsPtrMD});
CB->setMetadata(llvm::LLVMContext::MD_alloc_token, MDN);
}

Expand Down
175 changes: 175 additions & 0 deletions clang/test/CodeGenCXX/alloc-token-pointer.cpp
Original file line number Diff line number Diff line change
@@ -0,0 +1,175 @@
// RUN: %clang_cc1 -fsanitize=alloc-token -triple x86_64-linux-gnu -std=c++20 -emit-llvm -disable-llvm-passes %s -o - | FileCheck %s

#include "../Analysis/Inputs/system-header-simulator-cxx.h"

typedef __UINTPTR_TYPE__ uintptr_t;

extern "C" {
void *malloc(size_t size);
}

// CHECK-LABEL: define dso_local noundef ptr @_Z15test_malloc_intv(
// CHECK: call ptr @malloc(i64 noundef 4)
void *test_malloc_int() {
int *a = (int *)malloc(sizeof(int));
*a = 42;
return a;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z15test_malloc_ptrv(
// CHECK: call ptr @malloc(i64 noundef 8)
int **test_malloc_ptr() {
int **a = (int **)malloc(sizeof(int*));
*a = nullptr;
return a;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z12test_new_intv(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 4){{.*}} !alloc_token [[META_INT:![0-9]+]]
int *test_new_int() {
return new int;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z20test_new_ulong_arrayv(
// CHECK: call noalias noundef nonnull ptr @_Znam(i64 noundef 80){{.*}} !alloc_token [[META_ULONG:![0-9]+]]
unsigned long *test_new_ulong_array() {
return new unsigned long[10];
}

// CHECK-LABEL: define dso_local noundef ptr @_Z12test_new_ptrv(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 8){{.*}} !alloc_token [[META_INTPTR:![0-9]+]]
int **test_new_ptr() {
return new int*;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z18test_new_ptr_arrayv(
// CHECK: call noalias noundef nonnull ptr @_Znam(i64 noundef 80){{.*}} !alloc_token [[META_INTPTR]]
int **test_new_ptr_array() {
return new int*[10];
}

struct ContainsPtr {
int a;
char *buf;
};

// CHECK-LABEL: define dso_local noundef ptr @_Z27test_malloc_struct_with_ptrv(
// CHECK: call ptr @malloc(i64 noundef 16)
ContainsPtr *test_malloc_struct_with_ptr() {
ContainsPtr *c = (ContainsPtr *)malloc(sizeof(ContainsPtr));
return c;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z33test_malloc_struct_array_with_ptrv(
// CHECK: call ptr @malloc(i64 noundef 160)
ContainsPtr *test_malloc_struct_array_with_ptr() {
ContainsPtr *c = (ContainsPtr *)malloc(10 * sizeof(ContainsPtr));
return c;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z32test_operatornew_struct_with_ptrv(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 16)
ContainsPtr *test_operatornew_struct_with_ptr() {
ContainsPtr *c = (ContainsPtr *)__builtin_operator_new(sizeof(ContainsPtr));
return c;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z38test_operatornew_struct_array_with_ptrv(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 160)
ContainsPtr *test_operatornew_struct_array_with_ptr() {
ContainsPtr *c = (ContainsPtr *)__builtin_operator_new(10 * sizeof(ContainsPtr));
return c;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z33test_operatornew_struct_with_ptr2v(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 16)
ContainsPtr *test_operatornew_struct_with_ptr2() {
ContainsPtr *c = (ContainsPtr *)__builtin_operator_new(sizeof(*c));
return c;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z39test_operatornew_struct_array_with_ptr2v(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 160)
ContainsPtr *test_operatornew_struct_array_with_ptr2() {
ContainsPtr *c = (ContainsPtr *)__builtin_operator_new(10 * sizeof(*c));
return c;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z24test_new_struct_with_ptrv(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 16){{.*}} !alloc_token [[META_CONTAINSPTR:![0-9]+]]
ContainsPtr *test_new_struct_with_ptr() {
return new ContainsPtr;
}

// CHECK-LABEL: define dso_local noundef ptr @_Z30test_new_struct_array_with_ptrv(
// CHECK: call noalias noundef nonnull ptr @_Znam(i64 noundef 160){{.*}} !alloc_token [[META_CONTAINSPTR]]
ContainsPtr *test_new_struct_array_with_ptr() {
return new ContainsPtr[10];
}

class TestClass {
public:
void Foo();
~TestClass();
int data[16];
};

// CHECK-LABEL: define dso_local noundef ptr @_Z14test_new_classv(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 64){{.*}} !alloc_token [[META_TESTCLASS:![0-9]+]]
TestClass *test_new_class() {
return new TestClass();
}

// CHECK-LABEL: define dso_local noundef ptr @_Z20test_new_class_arrayv(
// CHECK: call noalias noundef nonnull ptr @_Znam(i64 noundef 648){{.*}} !alloc_token [[META_TESTCLASS]]
TestClass *test_new_class_array() {
return new TestClass[10];
}

// Test that we detect that virtual classes have implicit vtable pointer.
class VirtualTestClass {
public:
virtual void Foo();
virtual ~VirtualTestClass();
int data[16];
};

// CHECK-LABEL: define dso_local noundef ptr @_Z22test_new_virtual_classv(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 72){{.*}} !alloc_token [[META_VIRTUALTESTCLASS:![0-9]+]]
VirtualTestClass *test_new_virtual_class() {
return new VirtualTestClass();
}

// CHECK-LABEL: define dso_local noundef ptr @_Z28test_new_virtual_class_arrayv(
// CHECK: call noalias noundef nonnull ptr @_Znam(i64 noundef 728){{.*}} !alloc_token [[META_VIRTUALTESTCLASS]]
VirtualTestClass *test_new_virtual_class_array() {
return new VirtualTestClass[10];
}

// uintptr_t is treated as a pointer.
struct MyStructUintptr {
int a;
uintptr_t ptr;
};

// CHECK-LABEL: define dso_local noundef ptr @_Z18test_uintptr_isptrv(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 16){{.*}} !alloc_token [[META_MYSTRUCTUINTPTR:![0-9]+]]
MyStructUintptr *test_uintptr_isptr() {
return new MyStructUintptr;
}

using uptr = uintptr_t;
// CHECK-LABEL: define dso_local noundef ptr @_Z19test_uintptr_isptr2v(
// CHECK: call noalias noundef nonnull ptr @_Znwm(i64 noundef 8){{.*}} !alloc_token [[META_UINTPTR:![0-9]+]]
uptr *test_uintptr_isptr2() {
return new uptr;
}

// CHECK: [[META_INT]] = !{!"int", i1 false}
// CHECK: [[META_ULONG]] = !{!"unsigned long", i1 false}
// CHECK: [[META_INTPTR]] = !{!"int *", i1 true}
// CHECK: [[META_CONTAINSPTR]] = !{!"ContainsPtr", i1 true}
// CHECK: [[META_TESTCLASS]] = !{!"TestClass", i1 false}
// CHECK: [[META_VIRTUALTESTCLASS]] = !{!"VirtualTestClass", i1 true}
// CHECK: [[META_MYSTRUCTUINTPTR]] = !{!"MyStructUintptr", i1 true}
// CHECK: [[META_UINTPTR]] = !{!"unsigned long", i1 true}
4 changes: 2 additions & 2 deletions clang/test/CodeGenCXX/alloc-token.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -137,5 +137,5 @@ TestClass *test_new_class_array() {
return arr;
}

// CHECK: [[META_INT]] = !{!"int"}
// CHECK: [[META_TESTCLASS]] = !{!"TestClass"}
// CHECK: [[META_INT]] = !{!"int", i1 false}
// CHECK: [[META_TESTCLASS]] = !{!"TestClass", i1 true}
5 changes: 3 additions & 2 deletions llvm/docs/LangRef.rst
Original file line number Diff line number Diff line change
Expand Up @@ -8588,13 +8588,14 @@ functions, and contains richer semantic information about the type of the
allocation. This information is consumed by the ``alloc-token`` pass to
instrument such calls with allocation token IDs.

The metadata contains a string with the type of an allocation.
The metadata contains: string with the type of an allocation, and a boolean
denoting if the type contains a pointer.

.. code-block:: none

call ptr @malloc(i64 64), !alloc_token !0

!0 = !{!"<type-name>"}
!0 = !{!"<type-name>", i1 <contains-pointer>}

Module Flags Metadata
=====================
Expand Down
4 changes: 3 additions & 1 deletion llvm/lib/IR/Verifier.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -5398,8 +5398,10 @@ void Verifier::visitCapturesMetadata(Instruction &I, const MDNode *Captures) {

void Verifier::visitAllocTokenMetadata(Instruction &I, MDNode *MD) {
Check(isa<CallBase>(I), "!alloc_token should only exist on calls", &I);
Check(MD->getNumOperands() == 1, "!alloc_token must have 1 operand", MD);
Check(MD->getNumOperands() == 2, "!alloc_token must have 2 operands", MD);
Check(isa<MDString>(MD->getOperand(0)), "expected string", MD);
Check(mdconst::dyn_extract_or_null<ConstantInt>(MD->getOperand(1)),
"expected integer constant", MD);
}

/// verifyInstruction - Verify that an instruction is well formed.
Expand Down
Loading