From 27a165711865aa76b59a21b72f7fec97b01cf2ec Mon Sep 17 00:00:00 2001 From: raspawar Date: Wed, 2 Apr 2025 10:04:12 +0000 Subject: [PATCH] update documentation --- .../remote/post_training/nvidia/README.md | 14 ++++++++++++++ 1 file changed, 14 insertions(+) diff --git a/llama_stack/providers/remote/post_training/nvidia/README.md b/llama_stack/providers/remote/post_training/nvidia/README.md index 230587d66..015d6a5f9 100644 --- a/llama_stack/providers/remote/post_training/nvidia/README.md +++ b/llama_stack/providers/remote/post_training/nvidia/README.md @@ -125,6 +125,20 @@ client.post_training.job.cancel(job_uuid="your-job-id") ### Inference with the fine-tuned model +#### 1. Register the model + +```python +model = Model( + identifier="test-example-model@v1", + provider_id="nvidia", + provider_model_id="test-example-model@v1", + model_type=ModelType.llm, +) +client.register_model(model) +``` + +#### 2. Run inference with the fine-tuned model + ```python response = client.inference.completion( content="Complete the sentence using one word: Roses are red, violets are ",