This commit is contained in:
Botao Chen 2024-12-12 15:41:39 -08:00
parent 8132b4e177
commit 317e80dc2c
2 changed files with 3 additions and 3 deletions

View file

@@ -26,4 +26,4 @@ class Checkpoint(BaseModel):
epoch: int
post_training_job_id: str
path: str
-training_metric: Optional[PostTrainingMetric] = None
+training_metrics: Optional[PostTrainingMetric] = None

View file

@@ -544,13 +544,13 @@ class LoraFinetuningSingleDevice:
)
if self.training_config.data_config.validation_dataset_id:
validation_loss, perplexity = await self.validation()
-training_metreic = PostTrainingMetric(
+training_metrics = PostTrainingMetric(
epoch=curr_epoch,
train_loss=loss_to_log,
validation_loss=validation_loss,
perplexity=perplexity,
)
-checkpoint.training_metric = training_metreic
+checkpoint.training_metrics = training_metrics
checkpoints.append(checkpoint)
return (memory_stats, checkpoints)