Hugging Face's logo
Shamima
/
Runtime error

runtime error

, in replace_fn new_module = replace_with_policy(child, File "/home/user/.local/lib/python3.10/site-packages/deepspeed/module_inject/replace_module.py", line 247, in replace_with_policy _container.create_module() File "/home/user/.local/lib/python3.10/site-packages/deepspeed/module_inject/containers/gpt2.py", line 20, in create_module self.module = DeepSpeedGPTInference(_config, mp_group=self.mp_group) File "/home/user/.local/lib/python3.10/site-packages/deepspeed/model_implementations/transformers/ds_gpt.py", line 20, in __init__ super().__init__(config, mp_group, quantize_scales, quantize_groups, merge_count, mlp_extra_grouping) File "/home/user/.local/lib/python3.10/site-packages/deepspeed/model_implementations/transformers/ds_transformer.py", line 58, in __init__ inference_module = builder.load() File "/home/user/.local/lib/python3.10/site-packages/deepspeed/ops/op_builder/builder.py", line 458, in load return self.jit_load(verbose) File "/home/user/.local/lib/python3.10/site-packages/deepspeed/ops/op_builder/builder.py", line 502, in jit_load op_module = load(name=self.name, File "/home/user/.local/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 1308, in load return _jit_compile( File "/home/user/.local/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 1710, in _jit_compile _write_ninja_file_and_build_library( File "/home/user/.local/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 1800, in _write_ninja_file_and_build_library extra_ldflags = _prepare_ldflags( File "/home/user/.local/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 1899, in _prepare_ldflags if (not os.path.exists(_join_cuda_home(extra_lib_dir)) and File "/home/user/.local/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 2416, in _join_cuda_home raise OSError('CUDA_HOME environment variable is not set. ' OSError: CUDA_HOME environment variable is not set. Please set it to your CUDA install root.

Container logs:

Fetching error logs...