diff --git a/docs/notebooks/Alpha_Llama_Stack_Post_Training.ipynb b/docs/notebooks/Alpha_Llama_Stack_Post_Training.ipynb index c7701cb16..b7d769b51 100644 --- a/docs/notebooks/Alpha_Llama_Stack_Post_Training.ipynb +++ b/docs/notebooks/Alpha_Llama_Stack_Post_Training.ipynb @@ -3535,14 +3535,12 @@ "\n", "# register the eval dataset\n", "response = client.datasets.register(\n", - " dataset_id=\"eval_dataset\",\n", - " provider_id=\"localfs\",\n", - " url={\"uri\": data_url},\n", - " dataset_schema={\n", - " \"input_query\": {\"type\": \"string\"},\n", - " \"chat_completion_input\": {\"type\": \"chat_completion_input\"},\n", - " \"expected_answer\": {\"type\": \"string\"},\n", + " purpose=\"eval/messages-answer\",\n", + " source={\n", + " \"type\": \"uri\",\n", + " \"uri\": data_url,\n", " },\n", + " dataset_id=\"eval_dataset\",\n", ")" ] }, @@ -4397,15 +4395,15 @@ "# register post training dataset\n", "# use the below commented out version for dialog dataset\n", "response = client.datasets.register(\n", - " dataset_id=\"post_training_dataset\",\n", - " provider_id=\"localfs\",\n", - " url={\"uri\": data_url},\n", - " dataset_schema={\n", - " \"chat_completion_input\": {\"type\": \"chat_completion_input\"},\n", - " \"expected_answer\": {\"type\": \"string\"},\n", + " purpose=\"post-training/messages\",\n", + " source={\n", + " \"type\": \"uri\",\n", + " \"uri\": data_url,\n", " },\n", + " dataset_id=\"post_training_dataset\",\n", ")\n", "\n", + "\n", "# response = client.datasets.register(\n", "# dataset_id=\"post_training_dataset\",\n", "# provider_id=\"localfs\",\n", diff --git a/docs/source/references/evals_reference/index.md b/docs/source/references/evals_reference/index.md index 2b3d1cff5..0294d83ea 100644 --- a/docs/source/references/evals_reference/index.md +++ b/docs/source/references/evals_reference/index.md @@ -114,18 +114,12 @@ pprint(response) simpleqa_dataset_id = "huggingface::simpleqa" _ = client.datasets.register( + purpose="eval/messages-answer", + source={ + "type": "uri", + "uri": "huggingface://datasets/llamastack/simpleqa?split=train", + }, dataset_id=simpleqa_dataset_id, - provider_id="huggingface", - url={"uri": "https://huggingface.co/datasets/llamastack/simpleqa"}, - metadata={ - "path": "llamastack/simpleqa", - "split": "train", - }, - dataset_schema={ - "input_query": {"type": "string"}, - "expected_answer": {"type": "string"}, - "chat_completion_input": {"type": "chat_completion_input"}, - }, ) eval_rows = client.datasets.iterrows(