Skip to content

Commit

Permalink
fixed rocm runtime. set default gcn arch to be gfx803 (#544)
Browse files Browse the repository at this point in the history
  • Loading branch information
masahi authored and tqchen committed Oct 12, 2017
1 parent acd48e9 commit 624c37d
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 2 deletions.
2 changes: 1 addition & 1 deletion src/codegen/llvm/codegen_amdgpu.cc
Original file line number Diff line number Diff line change
Expand Up @@ -136,7 +136,7 @@ runtime::Module BuildAMDGPU(Array<LoweredFunc> funcs, std::string target) {
) >= 4 &&
target.substr(0, 4) == "rocm");
llvm::TargetMachine* tm = \
- GetLLVMTargetMachine("-mtriple=amdgcn-amd-amdhsa-hcc -mcpu=gfx900" + \
+ GetLLVMTargetMachine("-mtriple=amdgcn-amd-amdhsa-hcc -mcpu=gfx803" + \
target.substr(4, target.length() - 4));

std::unique_ptr<CodeGenAMDGPU> cg(new CodeGenAMDGPU());
Expand Down
2 changes: 1 addition & 1 deletion src/runtime/rocm/rocm_module.cc
Original file line number Diff line number Diff line change
Expand Up @@ -152,7 +152,7 @@ class ROCMWrappedFunc {

ThreadWorkLoad wl = thread_axis_cfg_.Extract(args);
void* config[] = {
- HIP_LAUNCH_PARAM_BUFFER_POINTER, &packed_args,
+ HIP_LAUNCH_PARAM_BUFFER_POINTER, packed_args,
HIP_LAUNCH_PARAM_BUFFER_SIZE, &packed_nbytes,
HIP_LAUNCH_PARAM_END
};
Expand Down

0 comments on commit 624c37d

Please sign in to comment.