From 2b31e51d5a6939f6b398c4b8d76ea8b8d18b38b1 Mon Sep 17 00:00:00 2001
From: Peter Yeh
Date: Thu, 10 Oct 2019 14:09:33 -0700
Subject: [PATCH] force code object v2 for amd gpu backend

---
 src/codegen/llvm/codegen_amdgpu.cc | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/codegen/llvm/codegen_amdgpu.cc b/src/codegen/llvm/codegen_amdgpu.cc
index 58a2964c3d82..0b9b8e3c905b 100644
--- a/src/codegen/llvm/codegen_amdgpu.cc
+++ b/src/codegen/llvm/codegen_amdgpu.cc
@@ -189,6 +189,7 @@ runtime::Module BuildAMDGPU(Array funcs, std::string target) {
   std::ostringstream config;
   config << "-mtriple=amdgcn-amd-amdhsa-hcc -mcpu=gfx"
          << DetectROCMComputeVersion(target)
+         << " -mattr=-code-object-v3 "
          << target.substr(4, target.length() - 4);
   std::unique_ptr tm = GetLLVMTargetMachine(config.str());
   std::unique_ptr cg(new CodeGenAMDGPU());