torch:2.3.1
torch_npu:2.3.1
cann:8.0rc2
modellink-master
Traceback (most recent call last):
File "/usr/local/python3.8.19/lib/python3.8/multiprocessing/process.py", line 315, in _bootstrap
self.run()
File "/usr/local/python3.8.19/lib/python3.8/multiprocessing/process.py", line 108, in run
self._target(*self._args, **self._kwargs)
File "/job/code/tools/checkpoint/saver_megatron.py", line 553, in save_model_checkpoint
models = get_models(args.target_tensor_parallel_size, md.params_dtype, True, post_process)
File "/job/code/tools/checkpoint/saver_megatron.py", line 515, in get_models
models = [model_provider(pre_process, post_process).to(dtype) for _ in range(count)]
File "/job/code/tools/checkpoint/saver_megatron.py", line 515, in <listcomp>
models = [model_provider(pre_process, post_process).to(dtype) for _ in range(count)]
File "/job/code/pretrain_gpt.py", line 87, in model_provider
model = megatron.legacy.model.GPTModel(
File "/job/code/modellink/model/gpt_model.py", line 43, in __init__
self.language_model, self._language_model_key = get_language_model(
File "/job/code/megatron/legacy/model/language_model.py", line 67, in get_language_model
language_model = TransformerLanguageModel(
File "/job/code/modellink/model/language_model.py", line 97, in transformer_language_model_init
self.rotary_pos_emb = RotaryEmbedding(
File "/tmp/MindSpeed/mindspeed/core/fusions/rotary_pos_embedding.py", line 30, in wrapper
fn(self, *args, **kwargs)
File "/job/code/megatron/core/models/common/embeddings/rotary_pos_embedding.py", line 77, in __init__
torch.arange(0, dim, 2, dtype=torch.float32, device=torch.cuda.current_device())
File "/usr/local/python3.8.19/lib/python3.8/site-packages/torch_npu/npu/utils.py", line 59, in current_device
torch_npu.npu._lazy_init()
File "/usr/local/python3.8.19/lib/python3.8/site-packages/torch_npu/npu/__init__.py", line 210, in _lazy_init
raise RuntimeError(
RuntimeError: Cannot re-initialize NPU in forked subprocess. To use NPU with multiprocessing, you must use the 'spawn' start method
报错信息已经说明了原因:不能在 fork 出来的子进程中重新初始化 NPU。建议改用 spawn 方式启动子进程,例如在创建子进程之前调用 multiprocessing.set_start_method('spawn')。
此处可能存在不合适展示的内容,页面不予展示。您可通过相关编辑功能自查并修改。
如您确认内容无涉及 不当用语 / 纯广告导流 / 暴力 / 低俗色情 / 侵权 / 盗版 / 虚假 / 无价值内容或违法国家有关法律法规的内容,可点击提交进行申诉,我们将尽快为您处理。
登录 后才可以发表评论