cd X1安装目录/Megatron-LM/megatron
vim checkpointing.py
import torch_mindio
optim_checkpoint = torch.load(optim_load_path, map_location=torch.device('cpu'))
替换后:
optim_checkpoint = torch_mindio.load(optim_load_path, map_location='cpu')
torch.save(state, save_path)
替换后:
torch_mindio.save(state, save_path)
with open(self._get_optimizer_ckpt_name(save_dir, tag, expp_rank), 'wb') as fd:
    torch.save(optimizer_state, fd)
    fd.flush()
替换后:
torch_mindio.save(optimizer_state, self._get_optimizer_ckpt_name(save_dir, tag, expp_rank))