AArch64: modify Swift async frame record storage on Windows

The frame layout on Windows differs from that on other platforms. It
will spill the registers in descending numeric value (i.e. x30, x29,
...). Furthermore, the x29, x30 pair is particularly important as it
is used for the fast stack walking. As a result, we cannot simply
insert the Swift async frame record in between the store. To provide
the simplistic search mechanism, always spill the async frame record
prior to the spilled registers.

This was caught by the assertion failure in the frame lowering code when
building the runtime for Windows AArch64.

Fixes: #55058

Differential Revision: https://reviews.llvm.org/D124498
Reviewed By: mstorsjo
This commit is contained in:
Saleem Abdulrasool 2022-04-26 20:12:48 -07:00
parent a9d68a5524
commit 24ba1302b3
2 changed files with 73 additions and 1 deletions

View File

@ -2993,6 +2993,15 @@ bool AArch64FrameLowering::assignCalleeSavedSpillSlots(
// stack slots for them.
MachineFrameInfo &MFI = MF.getFrameInfo();
auto *AFI = MF.getInfo<AArch64FunctionInfo>();
bool UsesWinAAPCS = isTargetWindows(MF);
if (UsesWinAAPCS && hasFP(MF) && AFI->hasSwiftAsyncContext()) {
int FrameIdx = MFI.CreateStackObject(8, Align(16), true);
AFI->setSwiftAsyncContextFrameIdx(FrameIdx);
if ((unsigned)FrameIdx < MinCSFrameIndex) MinCSFrameIndex = FrameIdx;
if ((unsigned)FrameIdx > MaxCSFrameIndex) MaxCSFrameIndex = FrameIdx;
}
for (auto &CS : CSI) {
Register Reg = CS.getReg();
const TargetRegisterClass *RC = RegInfo->getMinimalPhysRegClass(Reg);
@ -3006,7 +3015,8 @@ bool AArch64FrameLowering::assignCalleeSavedSpillSlots(
if ((unsigned)FrameIdx > MaxCSFrameIndex) MaxCSFrameIndex = FrameIdx;
// Grab 8 bytes below FP for the extended asynchronous frame info.
if (hasFP(MF) && AFI->hasSwiftAsyncContext() && Reg == AArch64::FP) {
if (hasFP(MF) && AFI->hasSwiftAsyncContext() && !UsesWinAAPCS &&
Reg == AArch64::FP) {
FrameIdx = MFI.CreateStackObject(8, Alignment, true);
AFI->setSwiftAsyncContextFrameIdx(FrameIdx);
if ((unsigned)FrameIdx < MinCSFrameIndex) MinCSFrameIndex = FrameIdx;

View File

@ -0,0 +1,62 @@
; RUN: llc -mtriple aarch64-unknown-windows -swift-async-fp=never -filetype asm -o - %s | FileCheck %s
; ModuleID = '_Concurrency.ll'
source_filename = "_Concurrency.ll"
target datalayout = "e-m:w-p:64:64-i32:32-i64:64-i128:128-n32:64-S128"
target triple = "aarch64-unknown-windows-msvc19.32.31302"
%swift.context = type { %swift.context*, void (%swift.context*)* }
; Function Attrs: argmemonly nofree nosync nounwind willreturn
declare void @llvm.lifetime.end.p0i8(i64 immarg, i8* nocapture) #0
; Function Attrs: nounwind
define hidden swifttailcc void @"$ss23withCheckedContinuation8function_xSS_yScCyxs5NeverOGXEtYalFTQ0_"(i8* nocapture readonly %0) #1 {
entryresume.0:
%1 = bitcast i8* %0 to i8**
%2 = load i8*, i8** %1, align 8
%3 = tail call i8** @llvm.swift.async.context.addr() #4
store i8* %2, i8** %3, align 8
%async.ctx.frameptr1 = getelementptr inbounds i8, i8* %2, i64 16
%.reload.addr4 = getelementptr inbounds i8, i8* %2, i64 24
%4 = bitcast i8* %.reload.addr4 to i8**
%.reload5 = load i8*, i8** %4, align 8
%.reload.addr = bitcast i8* %async.ctx.frameptr1 to i8**
%.reload = load i8*, i8** %.reload.addr, align 8
%5 = load i8*, i8** %1, align 8
store i8* %5, i8** %3, align 8
tail call swiftcc void @swift_task_dealloc(i8* %.reload5) #4
tail call void @llvm.lifetime.end.p0i8(i64 -1, i8* %.reload5)
tail call swiftcc void @swift_task_dealloc(i8* %.reload) #4
%6 = getelementptr inbounds i8, i8* %5, i64 8
%7 = bitcast i8* %6 to void (%swift.context*)**
%8 = load void (%swift.context*)*, void (%swift.context*)** %7, align 8
%9 = bitcast i8* %5 to %swift.context*
musttail call swifttailcc void %8(%swift.context* %9) #4
ret void
}
; NOTE: we do not see the canonical windows frame setup due to the `nounwind`
; attribtue on the function.
; CHECK: sub sp, sp, #64
; CHECK: stp x30, x29, [sp, #16]
; CHECK: add x29, sp, #16
; CHECK: stp x22, x21, [sp, #32]
; CHECK: sub x8, x29, #8
; CHECK: stp x20, x19, [sp, #48]
; CHECK: ldr x9, [x0]
; CHECK: str x9, [x8]
; Function Attrs: nounwind readnone
declare i8** @llvm.swift.async.context.addr() #2
; Function Attrs: argmemonly nounwind
declare dllimport swiftcc void @swift_task_dealloc(i8*) local_unnamed_addr #3
attributes #0 = { argmemonly nofree nosync nounwind willreturn }
attributes #1 = { nounwind "frame-pointer"="none" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="generic" "target-features"="+neon" }
attributes #2 = { nounwind readnone }
attributes #3 = { argmemonly nounwind }
attributes #4 = { nounwind }