58 lines
1.5 KiB
LLVM
58 lines
1.5 KiB
LLVM
; RUN: llc -mtriple=amdgcn--amdhsa -mcpu=gfx908 < %s | FileCheck -check-prefixes=CHECK,GFX908 %s
|
|
; RUN: llc -mtriple=amdgcn--amdhsa -mcpu=gfx90a < %s | FileCheck -check-prefixes=CHECK,GFX90A %s
|
|
; RUN: llc -mtriple=amdgcn--amdhsa -mcpu=gfx801 < %s | FileCheck -check-prefixes=CHECK,GFX801 %s
|
|
|
|
; COM: Comments for each kernel
|
|
; CHECK: kernel_32_agprs
|
|
; GFX908: ; NumVgprs: 9
|
|
; GFX908: ; NumAgprs: 32
|
|
; GFX908: ; TotalNumVgprs: 32
|
|
|
|
; GFX90A: ; NumVgprs: 9
|
|
; GFX90A: ; NumAgprs: 32
|
|
; GFX90A: ; TotalNumVgprs: 44
|
|
|
|
; GFX801: ; NumVgprs: 9
|
|
|
|
; CHECK: kernel_40_vgprs
|
|
; GFX908: ; NumVgprs: 40
|
|
; GFX908: ; NumAgprs: 16
|
|
; GFX908: ; TotalNumVgprs: 40
|
|
|
|
; GFX90A: ; NumVgprs: 40
|
|
; GFX90A: ; NumAgprs: 16
|
|
; GFX90A: ; TotalNumVgprs: 56
|
|
|
|
; GFX801: ; NumVgprs: 40
|
|
|
|
; COM: Metadata
|
|
; GFX908: - .agpr_count: 32
|
|
; GFX908: .vgpr_count: 32
|
|
|
|
; GFX90A: - .agpr_count: 32
|
|
; GFX90A: .vgpr_count: 44
|
|
|
|
; GFX801: .vgpr_count: 9
|
|
; Kernel with no real work: its register usage comes solely from two empty
; inline-asm statements that list v8 and a31 as clobbers. The check lines in
; this file expect that to be reported as 9 VGPRs (v0-v8) and 32 AGPRs
; (a0-a31) on the targets that have AGPRs.
define amdgpu_kernel void @kernel_32_agprs() #0 {
entry:
  ; Empty asm body; only the clobber list matters.
  call void asm sideeffect "", "~{v8}"()
  call void asm sideeffect "", "~{a31}"()
  ret void
}
|
|
|
|
; GFX908: - .agpr_count: 16
|
|
; GFX908: .vgpr_count: 40
|
|
|
|
; GFX90A: - .agpr_count: 16
|
|
; GFX90A: .vgpr_count: 56
|
|
|
|
; GFX801: .vgpr_count: 40
|
|
; Kernel with no real work: its register usage comes solely from two empty
; inline-asm statements that list v39 and a15 as clobbers. The check lines in
; this file expect that to be reported as 40 VGPRs (v0-v39) and 16 AGPRs
; (a0-a15) on the targets that have AGPRs.
define amdgpu_kernel void @kernel_40_vgprs() #0 {
entry:
  ; Empty asm body; only the clobber list matters.
  call void asm sideeffect "", "~{v39}"()
  call void asm sideeffect "", "~{a15}"()
  ret void
}
|
|
|
|
; Attribute group shared by both kernels in this file (each is declared with #0).
; NOTE(review): the "1,512" value of "amdgpu-flat-work-group-size" is presumably
; a min,max work-group size bound -- confirm against the AMDGPU usage guide.
attributes #0 = { nounwind noinline "amdgpu-flat-work-group-size"="1,512" }
|