Skip to content

Commit bee6966

Browse files
efriedma-quictstellar
authored andcommitted
[Arm64EC] Improve alignment mangling in arm64ec thunks. (#90115)
In some cases, MSVC's mangling for arm64ec thunks includes the alignment of a struct. I added some code to try to match... but it never really worked right. The issues: - Alignment is only mangled if it's 16 or more (I guess the default is supposed to be 8). - Alignment isn't mangled on return values (since the memory is allocated by the caller). The current patch leaves hooks to make alignment mangling work... but doesn't actually ever mangle alignment: clang never actually encodes a relevant alignment into the IR. Once we get clang to emit the real size/alignment of structs, we can start emitting it.
1 parent 6456ebb commit bee6966

File tree

3 files changed

+12
-11
lines changed

3 files changed

+12
-11
lines changed

llvm/lib/Target/AArch64/AArch64Arm64ECCallLowering.cpp

+4-3
Original file line numberDiff line numberDiff line change
@@ -181,13 +181,14 @@ void AArch64Arm64ECCallLowering::getThunkArgTypes(
181181
}
182182

183183
for (unsigned E = FT->getNumParams(); I != E; ++I) {
184-
Align ParamAlign = AttrList.getParamAlignment(I).valueOrOne();
185184
#if 0
186185
// FIXME: Need more information about argument size; see
187186
// https://reviews.llvm.org/D132926
188187
uint64_t ArgSizeBytes = AttrList.getParamArm64ECArgSizeBytes(I);
188+
Align ParamAlign = AttrList.getParamAlignment(I).valueOrOne();
189189
#else
190190
uint64_t ArgSizeBytes = 0;
191+
Align ParamAlign = Align();
191192
#endif
192193
Type *Arm64Ty, *X64Ty;
193194
canonicalizeThunkType(FT->getParamType(I), ParamAlign,
@@ -297,7 +298,7 @@ void AArch64Arm64ECCallLowering::canonicalizeThunkType(
297298
uint64_t TotalSizeBytes = ElementCnt * ElementSizePerBytes;
298299
if (ElementTy->isFloatTy() || ElementTy->isDoubleTy()) {
299300
Out << (ElementTy->isFloatTy() ? "F" : "D") << TotalSizeBytes;
300-
if (Alignment.value() >= 8 && !T->isPointerTy())
301+
if (Alignment.value() >= 16 && !Ret)
301302
Out << "a" << Alignment.value();
302303
Arm64Ty = T;
303304
if (TotalSizeBytes <= 8) {
@@ -328,7 +329,7 @@ void AArch64Arm64ECCallLowering::canonicalizeThunkType(
328329
Out << "m";
329330
if (TypeSize != 4)
330331
Out << TypeSize;
331-
if (Alignment.value() >= 8 && !T->isPointerTy())
332+
if (Alignment.value() >= 16 && !Ret)
332333
Out << "a" << Alignment.value();
333334
// FIXME: Try to canonicalize Arm64Ty more thoroughly?
334335
Arm64Ty = T;

llvm/test/CodeGen/AArch64/arm64ec-entry-thunks.ll

+3-3
Original file line numberDiff line numberDiff line change
@@ -223,8 +223,8 @@ define i8 @matches_has_sret() nounwind {
223223

224224
%TSRet = type { i64, i64 }
225225
define void @has_aligned_sret(ptr align 32 sret(%TSRet)) nounwind {
226-
; CHECK-LABEL: .def $ientry_thunk$cdecl$m16a32$v;
227-
; CHECK: .section .wowthk$aa,"xr",discard,$ientry_thunk$cdecl$m16a32$v
226+
; CHECK-LABEL: .def $ientry_thunk$cdecl$m16$v;
227+
; CHECK: .section .wowthk$aa,"xr",discard,$ientry_thunk$cdecl$m16$v
228228
; CHECK: // %bb.0:
229229
; CHECK-NEXT: stp q6, q7, [sp, #-176]! // 32-byte Folded Spill
230230
; CHECK-NEXT: .seh_save_any_reg_px q6, 176
@@ -457,7 +457,7 @@ define %T2 @simple_struct(%T1 %0, %T2 %1, %T3, %T4) nounwind {
457457
; CHECK-NEXT: .symidx $ientry_thunk$cdecl$i8$v
458458
; CHECK-NEXT: .word 1
459459
; CHECK-NEXT: .symidx "#has_aligned_sret"
460-
; CHECK-NEXT: .symidx $ientry_thunk$cdecl$m16a32$v
460+
; CHECK-NEXT: .symidx $ientry_thunk$cdecl$m16$v
461461
; CHECK-NEXT: .word 1
462462
; CHECK-NEXT: .symidx "#small_array"
463463
; CHECK-NEXT: .symidx $ientry_thunk$cdecl$m2$m2F8

llvm/test/CodeGen/AArch64/arm64ec-exit-thunks.ll

+5-5
Original file line numberDiff line numberDiff line change
@@ -236,8 +236,8 @@ declare void @has_sret(ptr sret([100 x i8])) nounwind;
236236

237237
%TSRet = type { i64, i64 }
238238
declare void @has_aligned_sret(ptr align 32 sret(%TSRet)) nounwind;
239-
; CHECK-LABEL: .def $iexit_thunk$cdecl$m16a32$v;
240-
; CHECK: .section .wowthk$aa,"xr",discard,$iexit_thunk$cdecl$m16a32$v
239+
; CHECK-LABEL: .def $iexit_thunk$cdecl$m16$v;
240+
; CHECK: .section .wowthk$aa,"xr",discard,$iexit_thunk$cdecl$m16$v
241241
; CHECK: // %bb.0:
242242
; CHECK-NEXT: sub sp, sp, #48
243243
; CHECK-NEXT: .seh_stackalloc 48
@@ -271,8 +271,8 @@ declare void @has_aligned_sret(ptr align 32 sret(%TSRet)) nounwind;
271271
; CHECK: adrp x11, has_aligned_sret
272272
; CHECK: add x11, x11, :lo12:has_aligned_sret
273273
; CHECK: ldr x9, [x9, :lo12:__os_arm64x_check_icall]
274-
; CHECK: adrp x10, ($iexit_thunk$cdecl$m16a32$v)
275-
; CHECK: add x10, x10, :lo12:($iexit_thunk$cdecl$m16a32$v)
274+
; CHECK: adrp x10, ($iexit_thunk$cdecl$m16$v)
275+
; CHECK: add x10, x10, :lo12:($iexit_thunk$cdecl$m16$v)
276276
; CHECK: blr x9
277277
; CHECK: .seh_startepilogue
278278
; CHECK: ldr x30, [sp], #16 // 8-byte Folded Reload
@@ -492,7 +492,7 @@ declare %T2 @simple_struct(%T1, %T2, %T3, %T4) nounwind;
492492
; CHECK-NEXT: .symidx has_sret
493493
; CHECK-NEXT: .word 0
494494
; CHECK-NEXT: .symidx has_aligned_sret
495-
; CHECK-NEXT: .symidx $iexit_thunk$cdecl$m16a32$v
495+
; CHECK-NEXT: .symidx $iexit_thunk$cdecl$m16$v
496496
; CHECK-NEXT: .word 4
497497
; CHECK-NEXT: .symidx "#has_aligned_sret$exit_thunk"
498498
; CHECK-NEXT: .symidx has_aligned_sret

0 commit comments

Comments
 (0)