diff --git a/docs/_static/llama-stack-spec.html b/docs/_static/llama-stack-spec.html
index 748839691..210a84b03 100644
--- a/docs/_static/llama-stack-spec.html
+++ b/docs/_static/llama-stack-spec.html
@@ -9429,7 +9429,7 @@
},
"source": {
"$ref": "#/components/schemas/DataSource",
- "description": "The data source of the dataset. Examples: - { \"type\": \"uri\", \"uri\": \"https://mywebsite.com/mydata.jsonl\" } - { \"type\": \"uri\", \"uri\": \"lsfs://mydata.jsonl\" } - { \"type\": \"uri\", \"uri\": \"data:csv;base64,{base64_content}\" } - { \"type\": \"uri\", \"uri\": \"huggingface://llamastack/simpleqa?split=train\" } - { \"type\": \"rows\", \"rows\": [ { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, world!\"}, {\"role\": \"assistant\", \"content\": \"Hello, world!\"}, ] } ] }"
+ "description": "The data source of the dataset. Ensure that the data source schema is compatible with the purpose of the dataset. Examples: - { \"type\": \"uri\", \"uri\": \"https://mywebsite.com/mydata.jsonl\" } - { \"type\": \"uri\", \"uri\": \"lsfs://mydata.jsonl\" } - { \"type\": \"uri\", \"uri\": \"data:csv;base64,{base64_content}\" } - { \"type\": \"uri\", \"uri\": \"huggingface://llamastack/simpleqa?split=train\" } - { \"type\": \"rows\", \"rows\": [ { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, world!\"}, {\"role\": \"assistant\", \"content\": \"Hello, world!\"} ] } ] }"
},
"metadata": {
"type": "object",
diff --git a/docs/_static/llama-stack-spec.yaml b/docs/_static/llama-stack-spec.yaml
index b607a0b7f..a1eb07444 100644
--- a/docs/_static/llama-stack-spec.yaml
+++ b/docs/_static/llama-stack-spec.yaml
@@ -6395,12 +6395,14 @@ components:
source:
$ref: '#/components/schemas/DataSource'
description: >-
- The data source of the dataset. Examples: - { "type": "uri", "uri": "https://mywebsite.com/mydata.jsonl"
- } - { "type": "uri", "uri": "lsfs://mydata.jsonl" } - { "type": "uri",
- "uri": "data:csv;base64,{base64_content}" } - { "type": "uri", "uri":
- "huggingface://llamastack/simpleqa?split=train" } - { "type": "rows",
- "rows": [ { "messages": [ {"role": "user", "content": "Hello, world!"},
- {"role": "assistant", "content": "Hello, world!"}, ] } ] }
+ The data source of the dataset. Ensure that the data source schema is
+ compatible with the purpose of the dataset. Examples: - { "type": "uri",
+ "uri": "https://mywebsite.com/mydata.jsonl" } - { "type": "uri", "uri":
+ "lsfs://mydata.jsonl" } - { "type": "uri", "uri": "data:csv;base64,{base64_content}"
+ } - { "type": "uri", "uri": "huggingface://llamastack/simpleqa?split=train"
+ } - { "type": "rows", "rows": [ { "messages": [ {"role": "user", "content":
+ "Hello, world!"}, {"role": "assistant", "content": "Hello, world!"} ]
+ } ] }
metadata:
type: object
additionalProperties:
diff --git a/llama_stack/apis/datasets/datasets.py b/llama_stack/apis/datasets/datasets.py
index 1dd29ad8e..d033d0b70 100644
--- a/llama_stack/apis/datasets/datasets.py
+++ b/llama_stack/apis/datasets/datasets.py
@@ -163,7 +163,7 @@ class Datasets(Protocol):
],
"answer": "John Doe"
}
- :param source: The data source of the dataset. Examples:
+ :param source: The data source of the dataset. Ensure that the data source schema is compatible with the purpose of the dataset. Examples:
- {
"type": "uri",
"uri": "https://mywebsite.com/mydata.jsonl"