We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 543579d, commit bfe8a04 (Copy full SHA for bfe8a04)
1 file changed
megatron/core/optimizer/distrib_optimizer.py
@@ -415,7 +415,9 @@ def _build_model_and_main_param_groups(
 
                 # fp32 params.
                 elif model_param.type() == 'torch.cuda.FloatTensor':
-                    shard_model_param = model_param.view(-1)[param_range.start : param_range.end]
+                    shard_model_param = model_param.detach().view(-1)[
+                        param_range.start : param_range.end
+                    ]
                     model_fp32_params_this_group.append(model_param)
                     shard_fp32_params_this_group.append(shard_model_param)
                     tensor_parallel.copy_tensor_model_parallel_attributes(
0 commit comments