Skip to content

Commit 16c9b4f

Browse files
orbirilanza
authored andcommitted
[CIR][CIRGen] Add dynamic builtin alloca intrinsics support (llvm#547)
This patch adds the CIRGen for the following builtin functions: - `alloca`; - `_alloca`; - `__builtin_alloca`; - `__builtin_alloca_uninitialized`. Missing support to add in the future: - Non-default auto initialization setting. The default is to not initialize the allocated buffer, which is simpler to implement. This commit is leaving the skeleton to implement this feature following clang's codegen pattern. - It may be possible that the frontend has set non-default address space for the alloca's return value. This is the case for OpenCL or AMDGPU codes for example. This is handled in clang codegen via address space cast, and is left for future implementation. This commit introduces a guard-rail around this behaviour.
1 parent 3715ad9 commit 16c9b4f

File tree

6 files changed

+182
-12
lines changed

6 files changed

+182
-12
lines changed

clang/include/clang/CIR/Dialect/Builder/CIRBaseBuilder.h

+30
Original file line numberDiff line numberDiff line change
@@ -160,6 +160,36 @@ class CIRBaseBuilderTy : public mlir::OpBuilder {
160160
return create<mlir::cir::StoreOp>(loc, val, dst, _volatile, order);
161161
}
162162

163+
mlir::Value createAlloca(mlir::Location loc, mlir::cir::PointerType addrType,
164+
mlir::Type type, llvm::StringRef name,
165+
mlir::IntegerAttr alignment,
166+
mlir::Value dynAllocSize) {
167+
return create<mlir::cir::AllocaOp>(loc, addrType, type, name, alignment,
168+
dynAllocSize);
169+
}
170+
171+
mlir::Value createAlloca(mlir::Location loc, mlir::cir::PointerType addrType,
172+
mlir::Type type, llvm::StringRef name,
173+
clang::CharUnits alignment,
174+
mlir::Value dynAllocSize) {
175+
auto alignmentIntAttr = getSizeFromCharUnits(getContext(), alignment);
176+
return createAlloca(loc, addrType, type, name, alignmentIntAttr,
177+
dynAllocSize);
178+
}
179+
180+
mlir::Value createAlloca(mlir::Location loc, mlir::cir::PointerType addrType,
181+
mlir::Type type, llvm::StringRef name,
182+
mlir::IntegerAttr alignment) {
183+
return create<mlir::cir::AllocaOp>(loc, addrType, type, name, alignment);
184+
}
185+
186+
mlir::Value createAlloca(mlir::Location loc, mlir::cir::PointerType addrType,
187+
mlir::Type type, llvm::StringRef name,
188+
clang::CharUnits alignment) {
189+
auto alignmentIntAttr = getSizeFromCharUnits(getContext(), alignment);
190+
return createAlloca(loc, addrType, type, name, alignmentIntAttr);
191+
}
192+
163193
mlir::Value createSub(mlir::Value lhs, mlir::Value rhs, bool hasNUW = false,
164194
bool hasNSW = false) {
165195
auto op = create<mlir::cir::BinOp>(lhs.getLoc(), lhs.getType(),

clang/lib/CIR/CodeGen/CIRGenBuiltin.cpp

+61
Original file line numberDiff line numberDiff line change
@@ -71,6 +71,24 @@ buildBuiltinBitOp(CIRGenFunction &CGF, const CallExpr *E,
7171
return RValue::get(op);
7272
}
7373

74+
// Initialize the alloca with the given size and alignment according to the lang
75+
// opts. Supporting only the trivial non-initialization for now.
76+
static void initializeAlloca(CIRGenFunction &CGF,
77+
[[maybe_unused]] mlir::Value AllocaAddr,
78+
[[maybe_unused]] mlir::Value Size,
79+
[[maybe_unused]] CharUnits AlignmentInBytes) {
80+
81+
switch (CGF.getLangOpts().getTrivialAutoVarInit()) {
82+
case LangOptions::TrivialAutoVarInitKind::Uninitialized:
83+
// Nothing to initialize.
84+
return;
85+
case LangOptions::TrivialAutoVarInitKind::Zero:
86+
case LangOptions::TrivialAutoVarInitKind::Pattern:
87+
assert(false && "unexpected trivial auto var init kind NYI");
88+
return;
89+
}
90+
}
91+
7492
RValue CIRGenFunction::buildBuiltinExpr(const GlobalDecl GD, unsigned BuiltinID,
7593
const CallExpr *E,
7694
ReturnValueSlot ReturnValue) {
@@ -642,6 +660,49 @@ RValue CIRGenFunction::buildBuiltinExpr(const GlobalDecl GD, unsigned BuiltinID,
642660
Result = builder.createBoolToInt(Result, ResultType);
643661
return RValue::get(Result);
644662
}
663+
664+
case Builtin::BIalloca:
665+
case Builtin::BI_alloca:
666+
case Builtin::BI__builtin_alloca_uninitialized:
667+
case Builtin::BI__builtin_alloca: {
668+
// Get alloca size input
669+
mlir::Value Size = buildScalarExpr(E->getArg(0));
670+
671+
// The alignment of the alloca should correspond to __BIGGEST_ALIGNMENT__.
672+
const TargetInfo &TI = getContext().getTargetInfo();
673+
const CharUnits SuitableAlignmentInBytes =
674+
getContext().toCharUnitsFromBits(TI.getSuitableAlign());
675+
676+
// Emit the alloca op with type `u8 *` to match the semantics of
677+
// `llvm.alloca`. We later bitcast the type to `void *` to match the
678+
// semantics of C/C++
679+
// FIXME(cir): It may make sense to allow AllocaOp of type `u8` to return a
680+
// pointer of type `void *`. This will require a change to the allocaOp
681+
// verifier.
682+
auto AllocaAddr = builder.createAlloca(
683+
getLoc(E->getSourceRange()), builder.getUInt8PtrTy(),
684+
builder.getUInt8Ty(), "bi_alloca", SuitableAlignmentInBytes, Size);
685+
686+
// Initialize the allocated buffer if required.
687+
if (BuiltinID != Builtin::BI__builtin_alloca_uninitialized)
688+
initializeAlloca(*this, AllocaAddr, Size, SuitableAlignmentInBytes);
689+
690+
// An alloca will always return a pointer to the alloca (stack) address
691+
// space. This address space need not be the same as the AST / Language
692+
// default (e.g. in C / C++ auto vars are in the generic address space). At
693+
// the AST level this is handled within CreateTempAlloca et al., but for the
694+
// builtin / dynamic alloca we have to handle it here.
695+
assert(!UnimplementedFeature::addressSpace());
696+
LangAS AAS = getASTAllocaAddressSpace();
697+
LangAS EAS = E->getType()->getPointeeType().getAddressSpace();
698+
if (EAS != AAS) {
699+
assert(false && "Non-default address space for alloca NYI");
700+
}
701+
702+
// Bitcast the alloca to the expected type.
703+
return RValue::get(
704+
builder.createBitcast(AllocaAddr, builder.getVoidPtrTy()));
705+
}
645706
}
646707

647708
// If this is an alias for a lib function (e.g. __builtin_sin), emit

clang/lib/CIR/CodeGen/CIRGenExpr.cpp

+2-3
Original file line numberDiff line numberDiff line change
@@ -2479,9 +2479,8 @@ mlir::Value CIRGenFunction::buildAlloca(StringRef name, mlir::Type ty,
24792479
{
24802480
mlir::OpBuilder::InsertionGuard guard(builder);
24812481
builder.restoreInsertionPoint(ip);
2482-
addr = builder.create<mlir::cir::AllocaOp>(loc, /*addr type*/ localVarPtrTy,
2483-
/*var type*/ ty, name,
2484-
alignIntAttr, arraySize);
2482+
addr = builder.createAlloca(loc, /*addr type*/ localVarPtrTy,
2483+
/*var type*/ ty, name, alignIntAttr, arraySize);
24852484
if (currVarDecl) {
24862485
auto alloca = cast<mlir::cir::AllocaOp>(addr.getDefiningOp());
24872486
alloca.setAstAttr(ASTVarDeclAttr::get(builder.getContext(), currVarDecl));

clang/lib/CIR/Dialect/Transforms/LoweringPrepare.cpp

+4-9
Original file line numberDiff line numberDiff line change
@@ -497,29 +497,24 @@ static void lowerArrayDtorCtorIntoLoop(CIRBaseBuilderTy &builder,
497497
mlir::Value end = builder.create<mlir::cir::PtrStrideOp>(
498498
loc, eltTy, begin, numArrayElementsConst);
499499

500-
auto tmpAddr = builder.create<mlir::cir::AllocaOp>(
500+
auto tmpAddr = builder.createAlloca(
501501
loc, /*addr type*/ builder.getPointerTo(eltTy),
502-
/*var type*/ eltTy, "__array_idx",
503-
builder.getSizeFromCharUnits(builder.getContext(),
504-
clang::CharUnits::One()),
505-
nullptr);
502+
/*var type*/ eltTy, "__array_idx", clang::CharUnits::One());
506503
builder.createStore(loc, begin, tmpAddr);
507504

508505
auto loop = builder.createDoWhile(
509506
loc,
510507
/*condBuilder=*/
511508
[&](mlir::OpBuilder &b, mlir::Location loc) {
512-
auto currentElement =
513-
b.create<mlir::cir::LoadOp>(loc, eltTy, tmpAddr.getResult());
509+
auto currentElement = b.create<mlir::cir::LoadOp>(loc, eltTy, tmpAddr);
514510
mlir::Type boolTy = mlir::cir::BoolType::get(b.getContext());
515511
auto cmp = builder.create<mlir::cir::CmpOp>(
516512
loc, boolTy, mlir::cir::CmpOpKind::eq, currentElement, end);
517513
builder.createCondition(cmp);
518514
},
519515
/*bodyBuilder=*/
520516
[&](mlir::OpBuilder &b, mlir::Location loc) {
521-
auto currentElement =
522-
b.create<mlir::cir::LoadOp>(loc, eltTy, tmpAddr.getResult());
517+
auto currentElement = b.create<mlir::cir::LoadOp>(loc, eltTy, tmpAddr);
523518

524519
CallOp ctorCall;
525520
op->walk([&](CallOp c) { ctorCall = c; });
+62
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,62 @@
1+
// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -emit-cir %s -o - | FileCheck %s --check-prefix=CIR
2+
// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -fclangir -emit-llvm %s -o - | FileCheck %s -check-prefix=LLVM
3+
4+
typedef __SIZE_TYPE__ size_t;
5+
void *alloca(size_t size);
6+
void *_alloca(size_t size);
7+
8+
void my_alloca(size_t n)
9+
{
10+
int *c1 = alloca(n);
11+
}
12+
// CIR: cir.func @my_alloca([[ALLOCA_SIZE:%.*]]: !u64i
13+
// CIR: cir.store [[ALLOCA_SIZE]], [[LOCAL_VAR_ALLOCA_SIZE:%.*]] : !u64i, cir.ptr <!u64i>
14+
// CIR: [[TMP_ALLOCA_SIZE:%.*]] = cir.load [[LOCAL_VAR_ALLOCA_SIZE]] : cir.ptr <!u64i>, !u64i
15+
// CIR: [[ALLOCA_RES:%.*]] = cir.alloca !u8i, cir.ptr <!u8i>, [[TMP_ALLOCA_SIZE]] : !u64i, ["bi_alloca"] {alignment = 16 : i64}
16+
// CIR-NEXT: cir.cast(bitcast, [[ALLOCA_RES]] : !cir.ptr<!u8i>), !cir.ptr<!void>
17+
// CIR: }
18+
19+
20+
// LLVM: define void @my_alloca(i64 [[ALLOCA_SIZE:%.*]])
21+
// LLVM: store i64 [[ALLOCA_SIZE]], ptr [[LOCAL_VAR_ALLOCA_SIZE:%.*]],
22+
// LLVM: [[TMP_ALLOCA_SIZE:%.*]] = load i64, ptr [[LOCAL_VAR_ALLOCA_SIZE]],
23+
// LLVM: [[ALLOCA_RES:%.*]] = alloca i8, i64 [[TMP_ALLOCA_SIZE]], align 16
24+
// LLVM: }
25+
26+
void my___builtin_alloca(size_t n)
27+
{
28+
int *c1 = (int *)__builtin_alloca(n);
29+
}
30+
31+
// CIR: cir.func @my___builtin_alloca([[ALLOCA_SIZE:%.*]]: !u64i
32+
// CIR: cir.store [[ALLOCA_SIZE]], [[LOCAL_VAR_ALLOCA_SIZE:%.*]] : !u64i, cir.ptr <!u64i>
33+
// CIR: [[TMP_ALLOCA_SIZE:%.*]] = cir.load [[LOCAL_VAR_ALLOCA_SIZE]] : cir.ptr <!u64i>, !u64i
34+
// CIR: [[ALLOCA_RES:%.*]] = cir.alloca !u8i, cir.ptr <!u8i>, [[TMP_ALLOCA_SIZE]] : !u64i, ["bi_alloca"] {alignment = 16 : i64}
35+
// CIR-NEXT: cir.cast(bitcast, [[ALLOCA_RES]] : !cir.ptr<!u8i>), !cir.ptr<!void>
36+
// CIR: }
37+
38+
39+
// LLVM: define void @my___builtin_alloca(i64 [[ALLOCA_SIZE:%.*]])
40+
// LLVM: store i64 [[ALLOCA_SIZE]], ptr [[LOCAL_VAR_ALLOCA_SIZE:%.*]],
41+
// LLVM: [[TMP_ALLOCA_SIZE:%.*]] = load i64, ptr [[LOCAL_VAR_ALLOCA_SIZE]],
42+
// LLVM: [[ALLOCA_RES:%.*]] = alloca i8, i64 [[TMP_ALLOCA_SIZE]], align 16
43+
// LLVM: }
44+
45+
void my__builtin_alloca_uninitialized(size_t n)
46+
{
47+
int *c1 = (int *)__builtin_alloca_uninitialized(n);
48+
}
49+
50+
// CIR: cir.func @my__builtin_alloca_uninitialized([[ALLOCA_SIZE:%.*]]: !u64i
51+
// CIR: cir.store [[ALLOCA_SIZE]], [[LOCAL_VAR_ALLOCA_SIZE:%.*]] : !u64i, cir.ptr <!u64i>
52+
// CIR: [[TMP_ALLOCA_SIZE:%.*]] = cir.load [[LOCAL_VAR_ALLOCA_SIZE]] : cir.ptr <!u64i>, !u64i
53+
// CIR: [[ALLOCA_RES:%.*]] = cir.alloca !u8i, cir.ptr <!u8i>, [[TMP_ALLOCA_SIZE]] : !u64i, ["bi_alloca"] {alignment = 16 : i64}
54+
// CIR-NEXT: cir.cast(bitcast, [[ALLOCA_RES]] : !cir.ptr<!u8i>), !cir.ptr<!void>
55+
// CIR: }
56+
57+
58+
// LLVM: define void @my__builtin_alloca_uninitialized(i64 [[ALLOCA_SIZE:%.*]])
59+
// LLVM: store i64 [[ALLOCA_SIZE]], ptr [[LOCAL_VAR_ALLOCA_SIZE:%.*]],
60+
// LLVM: [[TMP_ALLOCA_SIZE:%.*]] = load i64, ptr [[LOCAL_VAR_ALLOCA_SIZE]],
61+
// LLVM: [[ALLOCA_RES:%.*]] = alloca i8, i64 [[TMP_ALLOCA_SIZE]], align 16
62+
// LLVM: }
+23
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -fms-extensions -emit-cir %s -o - | FileCheck %s --check-prefix=CIR
2+
// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -fms-extensions -fclangir -emit-llvm %s -o - | FileCheck %s -check-prefix=LLVM
3+
4+
typedef __SIZE_TYPE__ size_t;
5+
6+
void my_win_alloca(size_t n)
7+
{
8+
int *c1 = (int *)_alloca(n);
9+
}
10+
11+
// CIR: cir.func @my_win_alloca([[ALLOCA_SIZE:%.*]]: !u64i
12+
// CIR: cir.store [[ALLOCA_SIZE]], [[LOCAL_VAR_ALLOCA_SIZE:%.*]] : !u64i, cir.ptr <!u64i>
13+
// CIR: [[TMP_ALLOCA_SIZE:%.*]] = cir.load [[LOCAL_VAR_ALLOCA_SIZE]] : cir.ptr <!u64i>, !u64i
14+
// CIR: [[ALLOCA_RES:%.*]] = cir.alloca !u8i, cir.ptr <!u8i>, [[TMP_ALLOCA_SIZE]] : !u64i, ["bi_alloca"] {alignment = 16 : i64}
15+
// CIR-NEXT: cir.cast(bitcast, [[ALLOCA_RES]] : !cir.ptr<!u8i>), !cir.ptr<!void>
16+
// CIR: }
17+
18+
19+
// LLVM: define void @my_win_alloca(i64 [[ALLOCA_SIZE:%.*]])
20+
// LLVM: store i64 [[ALLOCA_SIZE]], ptr [[LOCAL_VAR_ALLOCA_SIZE:%.*]],
21+
// LLVM: [[TMP_ALLOCA_SIZE:%.*]] = load i64, ptr [[LOCAL_VAR_ALLOCA_SIZE]],
22+
// LLVM: [[ALLOCA_RES:%.*]] = alloca i8, i64 [[TMP_ALLOCA_SIZE]], align 16
23+
// LLVM: }

0 commit comments

Comments
 (0)