Add training_method validation, Literal method types, and style cleanups

VProv · VProv · commit bf0b180a5ab4 · 2025-03-11T05:50:43.000-07:00
diff --git a/src/together/resources/finetune.py b/src/together/resources/finetune.py
@@ -1,7 +1,7 @@
 from __future__ import annotations
 
 from pathlib import Path
-from typing import Literal, Union
+from typing import Literal
 
 from rich import print as rprint
 
@@ -57,6 +57,7 @@ def createFinetuneRequest(
     training_method: str = "sft",
     dpo_beta: float | None = None,
 ) -> FinetuneRequest:
+
     if batch_size == "max":
         log_warn_once(
             "Starting from together>=1.3.0, "
@@ -104,14 +105,21 @@ def createFinetuneRequest(
     if weight_decay is not None and (weight_decay < 0):
         raise ValueError("Weight decay should be non-negative")
 
+    AVAILABLE_TRAINING_METHODS = {
+        TrainingMethodSFT().method,
+        TrainingMethodDPO().method,
+    }
+    if training_method not in AVAILABLE_TRAINING_METHODS:
+        raise ValueError(
+            f"training_method must be one of {', '.join(AVAILABLE_TRAINING_METHODS)}"
+        )
+
     lrScheduler = FinetuneLRScheduler(
         lr_scheduler_type="linear",
         lr_scheduler_args=FinetuneLinearLRSchedulerArgs(min_lr_ratio=min_lr_ratio),
     )
 
-    training_method_cls: Union[TrainingMethodSFT, TrainingMethodDPO] = (
-        TrainingMethodSFT()
-    )
+    training_method_cls: TrainingMethodSFT | TrainingMethodDPO = TrainingMethodSFT()
     if training_method == "dpo":
         training_method_cls = TrainingMethodDPO(dpo_beta=dpo_beta)
 
diff --git a/src/together/types/finetune.py b/src/together/types/finetune.py
@@ -1,7 +1,7 @@
 from __future__ import annotations
 
 from enum import Enum
-from typing import List, Literal, Union
+from typing import List, Literal
 
 from pydantic import StrictBool, Field, validator, field_validator
 
@@ -148,15 +148,15 @@ class TrainingMethodSFT(TrainingMethod):
     Training method type for SFT training
     """
 
-    method: str = "sft"
+    method: Literal["sft"] = "sft"
 
 
 class TrainingMethodDPO(TrainingMethod):
     """
     Training method type for DPO training
     """
 
-    method: str = "dpo"
+    method: Literal["dpo"] = "dpo"
     dpo_beta: float | None = None
 
 
@@ -204,7 +204,7 @@ class FinetuneRequest(BaseModel):
     # train on inputs
     train_on_inputs: StrictBool | Literal["auto"] = "auto"
     # training method
-    training_method: Union[TrainingMethodSFT, TrainingMethodDPO] = Field(
+    training_method: TrainingMethodSFT | TrainingMethodDPO = Field(
         default_factory=TrainingMethodSFT
     )