mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-06-27 18:50:41 +00:00
fix: Add type field to DPOAlignmentConfig for remote provider serialization
Addresses review feedback to keep preference optimization APIs DPO-specific rather than accepting all algorithm types.
This commit is contained in:
parent
40a0cef38e
commit
243fe37a67
1 changed file with 2 additions and 2 deletions
|
@ -125,7 +125,7 @@ class PostTrainingRLHFRequest(BaseModel):
|
|||
validation_dataset_id: str
|
||||
|
||||
algorithm: RLHFAlgorithm
|
||||
algorithm_config: AlgorithmConfig
|
||||
algorithm_config: DPOAlignmentConfig
|
||||
|
||||
optimizer_config: OptimizerConfig
|
||||
training_config: TrainingConfig
|
||||
|
@ -202,7 +202,7 @@ class PostTraining(Protocol):
|
|||
self,
|
||||
job_uuid: str,
|
||||
finetuned_model: str,
|
||||
algorithm_config: AlgorithmConfig,
|
||||
algorithm_config: DPOAlignmentConfig,
|
||||
training_config: TrainingConfig,
|
||||
hyperparam_search_config: dict[str, Any],
|
||||
logger_config: dict[str, Any],
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue