runtime error
python3.10/site-packages/deepspeed/module_inject/replace_module.py", line 310, in replace_fn
    new_module = replace_with_policy(child,
  File "/usr/local/lib/python3.10/site-packages/deepspeed/module_inject/replace_module.py", line 247, in replace_with_policy
    _container.create_module()
  File "/usr/local/lib/python3.10/site-packages/deepspeed/module_inject/containers/gpt2.py", line 20, in create_module
    self.module = DeepSpeedGPTInference(_config, mp_group=self.mp_group)
  File "/usr/local/lib/python3.10/site-packages/deepspeed/model_implementations/transformers/ds_gpt.py", line 20, in __init__
    super().__init__(config, mp_group, quantize_scales, quantize_groups, merge_count, mlp_extra_grouping)
  File "/usr/local/lib/python3.10/site-packages/deepspeed/model_implementations/transformers/ds_transformer.py", line 58, in __init__
    inference_module = builder.load()
  File "/usr/local/lib/python3.10/site-packages/deepspeed/ops/op_builder/builder.py", line 479, in load
    return self.jit_load(verbose)
  File "/usr/local/lib/python3.10/site-packages/deepspeed/ops/op_builder/builder.py", line 523, in jit_load
    op_module = load(name=self.name,
  File "/usr/local/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 1306, in load
    return _jit_compile(
  File "/usr/local/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 1710, in _jit_compile
    _write_ninja_file_and_build_library(
  File "/usr/local/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 1800, in _write_ninja_file_and_build_library
    extra_ldflags = _prepare_ldflags(
  File "/usr/local/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 1893, in _prepare_ldflags
    if (not os.path.exists(_join_cuda_home(extra_lib_dir)) and
  File "/usr/local/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 2407, in _join_cuda_home
    raise OSError('CUDA_HOME environment variable is not set. '
OSError: CUDA_HOME environment variable is not set. Please set it to your CUDA install root.
Container logs:
Fetching error logs...