Skip to content

Commit 624c37d

Browse files
masahi authored and tqchen committed
fixed rocm runtime. set default gcn arch to be gfx803 (#544)
1 parent acd48e9 commit 624c37d

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

src/codegen/llvm/codegen_amdgpu.cc

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -136,7 +136,7 @@ runtime::Module BuildAMDGPU(Array<LoweredFunc> funcs, std::string target) {
136 136   ) >= 4 &&
137 137   target.substr(0, 4) == "rocm");
138 138   llvm::TargetMachine* tm = \
139     - GetLLVMTargetMachine("-mtriple=amdgcn-amd-amdhsa-hcc -mcpu=gfx900" + \
    139 + GetLLVMTargetMachine("-mtriple=amdgcn-amd-amdhsa-hcc -mcpu=gfx803" + \
140 140   target.substr(4, target.length() - 4));
141 141
142 142   std::unique_ptr<CodeGenAMDGPU> cg(new CodeGenAMDGPU());

src/runtime/rocm/rocm_module.cc

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -152,7 +152,7 @@ class ROCMWrappedFunc {
152 152
153 153   ThreadWorkLoad wl = thread_axis_cfg_.Extract(args);
154 154   void* config[] = {
155     - HIP_LAUNCH_PARAM_BUFFER_POINTER, &packed_args,
    155 + HIP_LAUNCH_PARAM_BUFFER_POINTER, packed_args,
156 156   HIP_LAUNCH_PARAM_BUFFER_SIZE, &packed_nbytes,
157 157   HIP_LAUNCH_PARAM_END
158 158   };

0 commit comments

Comments
 (0)