|
| 1 | +; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -mcpu=gfx942 -passes=amdgpu-attributor %s | FileCheck %s |
| 2 | + |
| 3 | +; CHECK-LABEL: define internal fastcc void @call1( |
| 4 | +; CHECK-SAME: ) #[[ATTR0:[0-9]+]] |
| 5 | +define internal fastcc void @call1() #0 { |
| 6 | + tail call fastcc void @call2() |
| 7 | + ret void |
| 8 | +} |
| 9 | + |
| 10 | +; CHECK-LABEL: define internal fastcc void @call2( |
| 11 | +; CHECK-SAME: ) #[[ATTR0]] |
| 12 | +define internal fastcc void @call2() #1 { |
| 13 | + tail call fastcc void @call5() |
| 14 | + ret void |
| 15 | +} |
| 16 | + |
| 17 | +; CHECK-LABEL: define { ptr addrspace(1), ptr } @call3( |
| 18 | +; CHECK-SAME:) #[[ATTR0]] |
| 19 | +define { ptr addrspace(1), ptr } @call3() #2 { |
| 20 | + tail call fastcc void @call5() |
| 21 | + ret { ptr addrspace(1), ptr } zeroinitializer |
| 22 | +} |
| 23 | + |
| 24 | +; CHECK-LABEL: define internal fastcc void @call5( |
| 25 | +; CHECK-SAME: ) #[[ATTR0]] |
| 26 | +define internal fastcc void @call5() { |
| 27 | + tail call fastcc void @call1() |
| 28 | + ret void |
| 29 | +} |
| 30 | + |
| 31 | +attributes #0 = {"amdgpu-flat-work-group-size"="1, 1024" "target-cpu"="gfx942" } |
| 32 | +attributes #1 = {"amdgpu-flat-work-group-size"="1, 1024" "target-cpu"="gfx942" } |
| 33 | +attributes #2 = {"amdgpu-flat-work-group-size"="1, 256" "target-cpu"="gfx942" } |
| 34 | + |
| 35 | +; CHECK: attributes #[[ATTR0]] = { "amdgpu-agpr-alloc"="0" "amdgpu-flat-work-group-size"="1,256" "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-flat-scratch-init" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-implicitarg-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "target-cpu"="gfx942" "uniform-work-group-size"="false" } |
0 commit comments