diff --git a/nemo/collections/llm/recipes/mixtral_8x3b.py b/nemo/collections/llm/recipes/mixtral_8x3b.py index 6cea2ab30725a..d7aad37590961 100644 --- a/nemo/collections/llm/recipes/mixtral_8x3b.py +++ b/nemo/collections/llm/recipes/mixtral_8x3b.py @@ -12,9 +12,8 @@ from nemo.collections.llm.peft.lora import LoRA from nemo.collections.llm.recipes.log.default import default_log, default_resume, tensorboard_logger from nemo.collections.llm.recipes.optim.adam import distributed_fused_adam_with_cosine_annealing -from nemo.collections.llm.recipes.precision.mixed_precision import bf16_mixed_plugin +from nemo.collections.llm.recipes.precision.mixed_precision import bf16_mixed, bf16_mixed_plugin from nemo.collections.llm.utils import Config, Partial -from nemo.collections.llm.recipes.precision.mixed_precision import bf16_mixed from nemo.lightning.pytorch.callbacks.megatron_comm_overlap import MegatronCommOverlapCallback from nemo.lightning.pytorch.callbacks.moe_token_drop import MegatronTokenDropCallback from nemo.utils.exp_manager import TimingCallback