mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-03 19:57:35 +00:00
Merge 66f4af7fec
into d266c59c2a
This commit is contained in:
commit
31bbb2de18
2 changed files with 2 additions and 2 deletions
|
@ -71,7 +71,7 @@ class HuggingFacePostTrainingConfig(BaseModel):
|
|||
dpo_beta: float = 0.1
|
||||
use_reference_model: bool = True
|
||||
dpo_loss_type: Literal["sigmoid", "hinge", "ipo", "kto_pair"] = "sigmoid"
|
||||
dpo_output_dir: str
|
||||
dpo_output_dir: str | None = None
|
||||
|
||||
@classmethod
|
||||
def sample_run_config(cls, __distro_dir__: str, **kwargs: Any) -> dict[str, Any]:
|
||||
|
|
|
@ -135,7 +135,7 @@ class HuggingFacePostTrainingImpl:
|
|||
|
||||
resources_allocated, checkpoints = await recipe.train(
|
||||
model=finetuned_model,
|
||||
output_dir=f"{self.config.dpo_output_dir}/{job_uuid}",
|
||||
output_dir=f"{self.config.dpo_output_dir}/{job_uuid}" if self.config.dpo_output_dir else None,
|
||||
job_uuid=job_uuid,
|
||||
dpo_config=algorithm_config,
|
||||
config=training_config,
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue