fix: Add type field to DPOAlignmentConfig for remote provider serialization

Addresses review feedback to keep preference optimization APIs DPO-specific
rather than accepting all algorithm types.
This commit is contained in:
Nehanth 2025-06-25 16:40:37 -04:00
parent 40a0cef38e
commit 243fe37a67

View file

@@ -125,7 +125,7 @@ class PostTrainingRLHFRequest(BaseModel):
validation_dataset_id: str
algorithm: RLHFAlgorithm
-algorithm_config: AlgorithmConfig
+algorithm_config: DPOAlignmentConfig
optimizer_config: OptimizerConfig
training_config: TrainingConfig
@@ -202,7 +202,7 @@ class PostTraining(Protocol):
self,
job_uuid: str,
finetuned_model: str,
-algorithm_config: AlgorithmConfig,
+algorithm_config: DPOAlignmentConfig,
training_config: TrainingConfig,
hyperparam_search_config: dict[str, Any],
logger_config: dict[str, Any],