diff --git a/code/train_causal_mc.py b/code/train_causal_mc.py index 624b4d9..ed16e1b 100644 --- a/code/train_causal_mc.py +++ b/code/train_causal_mc.py @@ -305,7 +305,6 @@ def main(): quantization_config=q_config, use_flash_attention_2=True, trust_remote_code=True, - token="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", # pretraining_tp=1, ) tokenizer = AutoTokenizer.from_pretrained(cfg.model_name_or_path)