mirror of
https://github.com/RPCSX/llvm.git
synced 2024-11-23 19:59:57 +00:00
AMDGPU: Set call_convention bit in kernel_code_t
According to the documentation this is supposed to be -1 if indirect calls are not supported. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@293081 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
80b96e28e3
commit
d1c6dad551
@ -127,6 +127,11 @@ void initDefaultAMDKernelCodeT(amd_kernel_code_t &Header,
|
||||
Header.kernel_code_entry_byte_offset = sizeof(Header);
|
||||
// wavefront_size is specified as a power of 2: 2^6 = 64 threads.
|
||||
Header.wavefront_size = 6;
|
||||
|
||||
// If the code object does not support indirect functions, then the value must
|
||||
// be 0xffffffff.
|
||||
Header.call_convention = -1;
|
||||
|
||||
// These alignment values are specified in powers of two, so alignment =
|
||||
// 2^n. The minimum alignment is 2^4 = 16.
|
||||
Header.kernarg_segment_alignment = 4;
|
||||
|
@ -45,6 +45,8 @@
|
||||
; HSA: .amd_kernel_code_t
|
||||
; HSA: enable_sgpr_private_segment_buffer = 1
|
||||
; HSA: enable_sgpr_kernarg_segment_ptr = 1
|
||||
; HSA: wavefront_size = 6
|
||||
; HSA: call_convention = -1
|
||||
; HSA: .end_amd_kernel_code_t
|
||||
; HSA: s_load_dwordx2 s[{{[0-9]+:[0-9]+}}], s[4:5], 0x0
|
||||
|
||||
|
@ -124,6 +124,6 @@ amd_kernel_code_t_minimal:
|
||||
// ASM: group_segment_alignment = 4
|
||||
// ASM: private_segment_alignment = 4
|
||||
// ASM: wavefront_size = 6
|
||||
// ASM: call_convention = 0
|
||||
// ASM: call_convention = -1
|
||||
// ASM: runtime_loader_kernel_symbol = 0
|
||||
// ASM: .end_amd_kernel_code_t
|
||||
|
@ -273,6 +273,6 @@ amd_kernel_code_t_minimal:
|
||||
// ASM: group_segment_alignment = 4
|
||||
// ASM: private_segment_alignment = 4
|
||||
// ASM: wavefront_size = 6
|
||||
// ASM: call_convention = 0
|
||||
// ASM: call_convention = -1
|
||||
// ASM: runtime_loader_kernel_symbol = 0
|
||||
// ASM: .end_amd_kernel_code_t
|
||||
|
Loading…
Reference in New Issue
Block a user