Add initial datastore code

This commit is contained in:
Ubuntu 2025-03-14 14:45:00 +00:00 committed by raspawar
parent d667a7109f
commit 0a2af0e2f8
9 changed files with 293 additions and 9 deletions

View file

@@ -16,6 +16,8 @@ distribution_spec:
- inline::meta-reference
datasetio:
- inline::localfs
datasets:
- remote::nvidia
scoring:
- inline::basic
- inline::llm-as-judge

View file

@@ -7,6 +7,7 @@
from pathlib import Path
from llama_stack.distribution.datatypes import ModelInput, Provider, ShieldInput, ToolGroupInput
from llama_stack.providers.remote.datasets.nvidia import NvidiaDatasetConfig
from llama_stack.providers.remote.inference.nvidia import NVIDIAConfig
from llama_stack.providers.remote.inference.nvidia.models import MODEL_ENTRIES
from llama_stack.providers.remote.post_training.nvidia import NvidiaPostTrainingConfig
@@ -24,6 +25,7 @@ def get_distribution_template() -> DistributionTemplate:
"telemetry": ["inline::meta-reference"],
"eval": ["inline::meta-reference"],
"datasetio": ["inline::localfs"],
"datasets": ["remote::nvidia"],
"scoring": ["inline::basic"],
"tool_runtime": ["inline::rag-runtime"],
}
@@ -39,6 +41,12 @@ def get_distribution_template() -> DistributionTemplate:
provider_type="remote::nvidia",
config=NvidiaPostTrainingConfig.sample_run_config(),
)
datasets_provider = Provider(
provider_id="nvidia",
provider_type="remote::nvidia",
config=NvidiaDatasetConfig.sample_run_config(),
)
safety_provider = Provider(
provider_id="nvidia",
provider_type="remote::nvidia",
@@ -76,6 +84,8 @@ def get_distribution_template() -> DistributionTemplate:
"run.yaml": RunConfigSettings(
provider_overrides={
"inference": [inference_provider],
"post_training": [post_training_provider],
"datasets": [datasets_provider],
},
default_models=default_models,
default_tool_groups=default_tool_groups,

View file

@@ -58,11 +58,11 @@ providers:
datasetio:
- provider_id: localfs
provider_type: inline::localfs
config:
kvstore:
type: sqlite
namespace: null
db_path: ${env.SQLITE_STORE_DIR:~/.llama/distributions/nvidia}/localfs_datasetio.db
config: {}
datasets:
- provider_id: nvidia
provider_type: remote::nvidia
config: {}
scoring:
- provider_id: basic
provider_type: inline::basic