Commit 624c37df by masahi Committed by Tianqi Chen

Fixed ROCm runtime; set default GCN arch to gfx803 (#544)

parent acd48e9a
......@@ -136,7 +136,7 @@ runtime::Module BuildAMDGPU(Array<LoweredFunc> funcs, std::string target) {
) >= 4 &&
target.substr(0, 4) == "rocm");
llvm::TargetMachine* tm = \
GetLLVMTargetMachine("-mtriple=amdgcn-amd-amdhsa-hcc -mcpu=gfx900" + \
GetLLVMTargetMachine("-mtriple=amdgcn-amd-amdhsa-hcc -mcpu=gfx803" + \
target.substr(4, target.length() - 4));
std::unique_ptr<CodeGenAMDGPU> cg(new CodeGenAMDGPU());
......
......@@ -152,7 +152,7 @@ class ROCMWrappedFunc {
ThreadWorkLoad wl = thread_axis_cfg_.Extract(args);
void* config[] = {
HIP_LAUNCH_PARAM_BUFFER_POINTER, &packed_args,
HIP_LAUNCH_PARAM_BUFFER_POINTER, packed_args,
HIP_LAUNCH_PARAM_BUFFER_SIZE, &packed_nbytes,
HIP_LAUNCH_PARAM_END
};
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment