forked from OSchip/llvm-project
AArch64: modify Swift async frame record storage on Windows
The frame layout on Windows differs from that on other platforms. It will spill the registers in descending numeric value (i.e. x30, x29, ...). Furthermore, the x29, x30 pair is particularly important as it is used for the fast stack walking. As a result, we cannot simply insert the Swift async frame record in between the store. To provide the simplistic search mechanism, always spill the async frame record prior to the spilled registers. This was caught by the assertion failure in the frame lowering code when building the runtime for Windows AArch64. Fixes: #55058 Differential Revision: https://reviews.llvm.org/D124498 Reviewed By: mstorsjo
This commit is contained in:
parent
a9d68a5524
commit
24ba1302b3
|
@ -2993,6 +2993,15 @@ bool AArch64FrameLowering::assignCalleeSavedSpillSlots(
|
|||
// stack slots for them.
|
||||
MachineFrameInfo &MFI = MF.getFrameInfo();
|
||||
auto *AFI = MF.getInfo<AArch64FunctionInfo>();
|
||||
|
||||
bool UsesWinAAPCS = isTargetWindows(MF);
|
||||
if (UsesWinAAPCS && hasFP(MF) && AFI->hasSwiftAsyncContext()) {
|
||||
int FrameIdx = MFI.CreateStackObject(8, Align(16), true);
|
||||
AFI->setSwiftAsyncContextFrameIdx(FrameIdx);
|
||||
if ((unsigned)FrameIdx < MinCSFrameIndex) MinCSFrameIndex = FrameIdx;
|
||||
if ((unsigned)FrameIdx > MaxCSFrameIndex) MaxCSFrameIndex = FrameIdx;
|
||||
}
|
||||
|
||||
for (auto &CS : CSI) {
|
||||
Register Reg = CS.getReg();
|
||||
const TargetRegisterClass *RC = RegInfo->getMinimalPhysRegClass(Reg);
|
||||
|
@ -3006,7 +3015,8 @@ bool AArch64FrameLowering::assignCalleeSavedSpillSlots(
|
|||
if ((unsigned)FrameIdx > MaxCSFrameIndex) MaxCSFrameIndex = FrameIdx;
|
||||
|
||||
// Grab 8 bytes below FP for the extended asynchronous frame info.
|
||||
if (hasFP(MF) && AFI->hasSwiftAsyncContext() && Reg == AArch64::FP) {
|
||||
if (hasFP(MF) && AFI->hasSwiftAsyncContext() && !UsesWinAAPCS &&
|
||||
Reg == AArch64::FP) {
|
||||
FrameIdx = MFI.CreateStackObject(8, Alignment, true);
|
||||
AFI->setSwiftAsyncContextFrameIdx(FrameIdx);
|
||||
if ((unsigned)FrameIdx < MinCSFrameIndex) MinCSFrameIndex = FrameIdx;
|
||||
|
|
|
@ -0,0 +1,62 @@
|
|||
; RUN: llc -mtriple aarch64-unknown-windows -swift-async-fp=never -filetype asm -o - %s | FileCheck %s
|
||||
|
||||
; ModuleID = '_Concurrency.ll'
|
||||
source_filename = "_Concurrency.ll"
|
||||
target datalayout = "e-m:w-p:64:64-i32:32-i64:64-i128:128-n32:64-S128"
|
||||
target triple = "aarch64-unknown-windows-msvc19.32.31302"
|
||||
|
||||
%swift.context = type { %swift.context*, void (%swift.context*)* }
|
||||
|
||||
; Function Attrs: argmemonly nofree nosync nounwind willreturn
|
||||
declare void @llvm.lifetime.end.p0i8(i64 immarg, i8* nocapture) #0
|
||||
|
||||
; Function Attrs: nounwind
|
||||
define hidden swifttailcc void @"$ss23withCheckedContinuation8function_xSS_yScCyxs5NeverOGXEtYalFTQ0_"(i8* nocapture readonly %0) #1 {
|
||||
entryresume.0:
|
||||
%1 = bitcast i8* %0 to i8**
|
||||
%2 = load i8*, i8** %1, align 8
|
||||
%3 = tail call i8** @llvm.swift.async.context.addr() #4
|
||||
store i8* %2, i8** %3, align 8
|
||||
%async.ctx.frameptr1 = getelementptr inbounds i8, i8* %2, i64 16
|
||||
%.reload.addr4 = getelementptr inbounds i8, i8* %2, i64 24
|
||||
%4 = bitcast i8* %.reload.addr4 to i8**
|
||||
%.reload5 = load i8*, i8** %4, align 8
|
||||
%.reload.addr = bitcast i8* %async.ctx.frameptr1 to i8**
|
||||
%.reload = load i8*, i8** %.reload.addr, align 8
|
||||
%5 = load i8*, i8** %1, align 8
|
||||
store i8* %5, i8** %3, align 8
|
||||
tail call swiftcc void @swift_task_dealloc(i8* %.reload5) #4
|
||||
tail call void @llvm.lifetime.end.p0i8(i64 -1, i8* %.reload5)
|
||||
tail call swiftcc void @swift_task_dealloc(i8* %.reload) #4
|
||||
%6 = getelementptr inbounds i8, i8* %5, i64 8
|
||||
%7 = bitcast i8* %6 to void (%swift.context*)**
|
||||
%8 = load void (%swift.context*)*, void (%swift.context*)** %7, align 8
|
||||
%9 = bitcast i8* %5 to %swift.context*
|
||||
musttail call swifttailcc void %8(%swift.context* %9) #4
|
||||
ret void
|
||||
}
|
||||
|
||||
; NOTE: we do not see the canonical windows frame setup due to the `nounwind`
|
||||
; attribtue on the function.
|
||||
|
||||
; CHECK: sub sp, sp, #64
|
||||
; CHECK: stp x30, x29, [sp, #16]
|
||||
; CHECK: add x29, sp, #16
|
||||
; CHECK: stp x22, x21, [sp, #32]
|
||||
; CHECK: sub x8, x29, #8
|
||||
; CHECK: stp x20, x19, [sp, #48]
|
||||
; CHECK: ldr x9, [x0]
|
||||
; CHECK: str x9, [x8]
|
||||
|
||||
; Function Attrs: nounwind readnone
|
||||
declare i8** @llvm.swift.async.context.addr() #2
|
||||
|
||||
; Function Attrs: argmemonly nounwind
|
||||
declare dllimport swiftcc void @swift_task_dealloc(i8*) local_unnamed_addr #3
|
||||
|
||||
attributes #0 = { argmemonly nofree nosync nounwind willreturn }
|
||||
attributes #1 = { nounwind "frame-pointer"="none" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="generic" "target-features"="+neon" }
|
||||
attributes #2 = { nounwind readnone }
|
||||
attributes #3 = { argmemonly nounwind }
|
||||
attributes #4 = { nounwind }
|
||||
|
Loading…
Reference in New Issue