Commit 786d7998 by Thomas Viehmann Committed by masahi

add GPU checking before compilation for rocm (#4394)

Previously, we relied on later compilation phases to error out
(often because the kernel used too much shared memory). This
enables the IR-level checks that already exist for CUDA and OpenCL
for ROCm as well.
parent 464ebb13
...@@ -227,7 +227,8 @@ class RPCRunner(Runner): ...@@ -227,7 +227,8 @@ class RPCRunner(Runner):
def get_build_kwargs(self): def get_build_kwargs(self):
kwargs = {} kwargs = {}
if 'cuda' in self.task.target.keys or 'opencl' in self.task.target.keys: if 'cuda' in self.task.target.keys or 'opencl' in self.task.target.keys or \
'rocm' in self.task.target.keys:
remote = request_remote(self.key, self.host, self.port) remote = request_remote(self.key, self.host, self.port)
ctx = remote.context(str(self.task.target), 0) ctx = remote.context(str(self.task.target), 0)
max_dims = ctx.max_thread_dimensions max_dims = ctx.max_thread_dimensions
...@@ -345,7 +346,6 @@ class LocalRunner(RPCRunner): ...@@ -345,7 +346,6 @@ class LocalRunner(RPCRunner):
def _build_func_common(measure_input, check_gpu=None, cuda_arch=None, build_option=None): def _build_func_common(measure_input, check_gpu=None, cuda_arch=None, build_option=None):
"""Common part for building a configuration""" """Common part for building a configuration"""
target, task, config = measure_input target, task, config = measure_input
with target: with target:
s, args = task.instantiate(config) s, args = task.instantiate(config)
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment