diff --git a/llvm/test/Transforms/Coroutines/coro-split-musttail6.ll b/llvm/test/Transforms/Coroutines/coro-split-musttail6.ll new file mode 100644 index 0000000000000..f139b8fb58843 --- /dev/null +++ b/llvm/test/Transforms/Coroutines/coro-split-musttail6.ll @@ -0,0 +1,116 @@ +; Tests that sinked lifetime markers wouldn't provent optimization +; to convert a resuming call to a musttail call. +; The difference between this and coro-split-musttail5.ll is that there is +; an extra bitcast instruction in the path, which makes it harder to +; optimize. +; RUN: opt < %s -passes='cgscc(coro-split),simplifycfg,early-cse' -S | FileCheck %s + +declare void @fakeresume1(i64* align 8) + +define void @g() #0 { +entry: + %id = call token @llvm.coro.id(i32 0, i8* null, i8* null, i8* null) + %alloc = call i8* @malloc(i64 16) #3 + %alloc.var = alloca i64 + %alloca.var.i8 = bitcast i64* %alloc.var to i8* + call void @llvm.lifetime.start.p0i8(i64 1, i8* %alloca.var.i8) + %vFrame = call noalias nonnull i8* @llvm.coro.begin(token %id, i8* %alloc) + + %save = call token @llvm.coro.save(i8* null) + %suspend = call i8 @llvm.coro.suspend(token %save, i1 false) + + switch i8 %suspend, label %exit [ + i8 0, label %await.suspend + i8 1, label %exit + ] +await.suspend: + %save2 = call token @llvm.coro.save(i8* null) + call fastcc void @fakeresume1(i64* align 8 null) + %suspend2 = call i8 @llvm.coro.suspend(token %save2, i1 false) + switch i8 %suspend2, label %exit [ + i8 0, label %await.ready + i8 1, label %exit + ] +await.ready: + call void @consume(i64* %alloc.var) + call void @llvm.lifetime.end.p0i8(i64 1, i8* %alloca.var.i8) + br label %exit +exit: + call i1 @llvm.coro.end(i8* null, i1 false) + ret void +} + +; FIXME: The fakeresume1 here should be marked as musttail. +; Verify that in the resume part resume call is marked with musttail. +; CHECK-LABEL: @g.resume( +; CHECK-NOT: musttail call fastcc void @fakeresume1(i64* align 8 null) + +; It has a cleanup bb. +define void @f() #0 { +entry: + %id = call token @llvm.coro.id(i32 0, i8* null, i8* null, i8* null) + %alloc = call i8* @malloc(i64 16) #3 + %alloc.var = alloca i64 + %alloca.var.i8 = bitcast i64* %alloc.var to i8* + call void @llvm.lifetime.start.p0i8(i64 1, i8* %alloca.var.i8) + %vFrame = call noalias nonnull i8* @llvm.coro.begin(token %id, i8* %alloc) + + %save = call token @llvm.coro.save(i8* null) + %suspend = call i8 @llvm.coro.suspend(token %save, i1 false) + + switch i8 %suspend, label %exit [ + i8 0, label %await.suspend + i8 1, label %exit + ] +await.suspend: + %save2 = call token @llvm.coro.save(i8* null) + call fastcc void @fakeresume1(i64* align 8 null) + %suspend2 = call i8 @llvm.coro.suspend(token %save2, i1 false) + switch i8 %suspend2, label %exit [ + i8 0, label %await.ready + i8 1, label %cleanup + ] +await.ready: + call void @consume(i64* %alloc.var) + call void @llvm.lifetime.end.p0i8(i64 1, i8* %alloca.var.i8) + br label %exit + +cleanup: + %free.handle = call i8* @llvm.coro.free(token %id, i8* %vFrame) + %.not = icmp eq i8* %free.handle, null + br i1 %.not, label %exit, label %coro.free + +coro.free: + call void @delete(i8* nonnull %free.handle) #2 + br label %exit + +exit: + call i1 @llvm.coro.end(i8* null, i1 false) + ret void +} + +; FIXME: The fakeresume1 here should be marked as musttail. +; Verify that in the resume part resume call is marked with musttail. +; CHECK-LABEL: @f.resume( +; CHECK-NOT: musttail call fastcc void @fakeresume1(i64* align 8 null) + +declare token @llvm.coro.id(i32, i8* readnone, i8* nocapture readonly, i8*) #1 +declare i1 @llvm.coro.alloc(token) #2 +declare i64 @llvm.coro.size.i64() #3 +declare i8* @llvm.coro.begin(token, i8* writeonly) #2 +declare token @llvm.coro.save(i8*) #2 +declare i8* @llvm.coro.frame() #3 +declare i8 @llvm.coro.suspend(token, i1) #2 +declare i8* @llvm.coro.free(token, i8* nocapture readonly) #1 +declare i1 @llvm.coro.end(i8*, i1) #2 +declare i8* @llvm.coro.subfn.addr(i8* nocapture readonly, i8) #1 +declare i8* @malloc(i64) +declare void @delete(i8* nonnull) #2 +declare void @consume(i64*) +declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) +declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) + +attributes #0 = { "coroutine.presplit"="1" } +attributes #1 = { argmemonly nounwind readonly } +attributes #2 = { nounwind } +attributes #3 = { nounwind readnone } diff --git a/llvm/test/Transforms/Coroutines/coro-split-musttail7.ll b/llvm/test/Transforms/Coroutines/coro-split-musttail7.ll new file mode 100644 index 0000000000000..ce1f7203a0c7e --- /dev/null +++ b/llvm/test/Transforms/Coroutines/coro-split-musttail7.ll @@ -0,0 +1,118 @@ +; Tests that sinked lifetime markers wouldn't provent optimization +; to convert a resuming call to a musttail call. +; The difference between this and coro-split-musttail5.ll and coro-split-musttail5.ll +; is that this contains dead instruction generated during the transformation, +; which makes the optimization harder. +; RUN: opt < %s -passes='cgscc(coro-split),simplifycfg,early-cse' -S | FileCheck %s + +declare void @fakeresume1(i64* align 8) + +define void @g() #0 { +entry: + %id = call token @llvm.coro.id(i32 0, i8* null, i8* null, i8* null) + %alloc = call i8* @malloc(i64 16) #3 + %alloc.var = alloca i64 + %alloca.var.i8 = bitcast i64* %alloc.var to i8* + call void @llvm.lifetime.start.p0i8(i64 1, i8* %alloca.var.i8) + %vFrame = call noalias nonnull i8* @llvm.coro.begin(token %id, i8* %alloc) + + %save = call token @llvm.coro.save(i8* null) + %suspend = call i8 @llvm.coro.suspend(token %save, i1 false) + + switch i8 %suspend, label %exit [ + i8 0, label %await.suspend + i8 1, label %exit + ] +await.suspend: + %save2 = call token @llvm.coro.save(i8* null) + call fastcc void @fakeresume1(i64* align 8 null) + %suspend2 = call i8 @llvm.coro.suspend(token %save2, i1 false) + switch i8 %suspend2, label %exit [ + i8 0, label %await.ready + i8 1, label %exit + ] +await.ready: + call void @consume(i64* %alloc.var) + call void @llvm.lifetime.end.p0i8(i64 1, i8* %alloca.var.i8) + br label %exit +exit: + %.unused = getelementptr inbounds i8, i8* %vFrame, i32 0 + call i1 @llvm.coro.end(i8* null, i1 false) + ret void +} + +; FIXME: The fakeresume1 here should be marked as musttail. +; Verify that in the resume part resume call is marked with musttail. +; CHECK-LABEL: @g.resume( +; CHECK-NOT: musttail call fastcc void @fakeresume1(i64* align 8 null) + +; It has a cleanup bb. +define void @f() #0 { +entry: + %id = call token @llvm.coro.id(i32 0, i8* null, i8* null, i8* null) + %alloc = call i8* @malloc(i64 16) #3 + %alloc.var = alloca i64 + %alloca.var.i8 = bitcast i64* %alloc.var to i8* + call void @llvm.lifetime.start.p0i8(i64 1, i8* %alloca.var.i8) + %vFrame = call noalias nonnull i8* @llvm.coro.begin(token %id, i8* %alloc) + + %save = call token @llvm.coro.save(i8* null) + %suspend = call i8 @llvm.coro.suspend(token %save, i1 false) + + switch i8 %suspend, label %exit [ + i8 0, label %await.suspend + i8 1, label %exit + ] +await.suspend: + %save2 = call token @llvm.coro.save(i8* null) + call fastcc void @fakeresume1(i64* align 8 null) + %suspend2 = call i8 @llvm.coro.suspend(token %save2, i1 false) + switch i8 %suspend2, label %exit [ + i8 0, label %await.ready + i8 1, label %cleanup + ] +await.ready: + call void @consume(i64* %alloc.var) + call void @llvm.lifetime.end.p0i8(i64 1, i8* %alloca.var.i8) + br label %exit + +cleanup: + %free.handle = call i8* @llvm.coro.free(token %id, i8* %vFrame) + %.not = icmp eq i8* %free.handle, null + br i1 %.not, label %exit, label %coro.free + +coro.free: + call void @delete(i8* nonnull %free.handle) #2 + br label %exit + +exit: + %.unused = getelementptr inbounds i8, i8* %vFrame, i32 0 + call i1 @llvm.coro.end(i8* null, i1 false) + ret void +} + +; FIXME: The fakeresume1 here should be marked as musttail. +; Verify that in the resume part resume call is marked with musttail. +; CHECK-LABEL: @f.resume( +; CHECK-NOT: musttail call fastcc void @fakeresume1(i64* align 8 null) + +declare token @llvm.coro.id(i32, i8* readnone, i8* nocapture readonly, i8*) #1 +declare i1 @llvm.coro.alloc(token) #2 +declare i64 @llvm.coro.size.i64() #3 +declare i8* @llvm.coro.begin(token, i8* writeonly) #2 +declare token @llvm.coro.save(i8*) #2 +declare i8* @llvm.coro.frame() #3 +declare i8 @llvm.coro.suspend(token, i1) #2 +declare i8* @llvm.coro.free(token, i8* nocapture readonly) #1 +declare i1 @llvm.coro.end(i8*, i1) #2 +declare i8* @llvm.coro.subfn.addr(i8* nocapture readonly, i8) #1 +declare i8* @malloc(i64) +declare void @delete(i8* nonnull) #2 +declare void @consume(i64*) +declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) +declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) + +attributes #0 = { "coroutine.presplit"="1" } +attributes #1 = { argmemonly nounwind readonly } +attributes #2 = { nounwind } +attributes #3 = { nounwind readnone }