mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-12-05 10:23:44 +00:00
feat: refactor llama-stack-api structure
Move llama_stack_api.apis... to the top level of llama_stack_api. Merge the provider datatypes and the existing apis.datatypes into a common llama_stack_api.datatypes. Update all usages of these packages throughout LLS. Signed-off-by: Charlie Doern <cdoern@redhat.com>
This commit is contained in:
parent
d6b915ce0a
commit
b7480e9c88
296 changed files with 906 additions and 1109 deletions
|
|
@ -58,8 +58,8 @@ import json
|
|||
from unittest.mock import AsyncMock, MagicMock
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.batches import BatchObject
|
||||
from llama_stack_api.apis.common.errors import ConflictError, ResourceNotFoundError
|
||||
from llama_stack_api.batches import BatchObject
|
||||
from llama_stack_api.common.errors import ConflictError, ResourceNotFoundError
|
||||
|
||||
|
||||
class TestReferenceBatchesImpl:
|
||||
|
|
|
|||
|
|
@ -43,7 +43,7 @@ Key Behaviors Tested:
|
|||
import asyncio
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.common.errors import ConflictError
|
||||
from llama_stack_api.common.errors import ConflictError
|
||||
|
||||
|
||||
class TestReferenceBatchesIdempotency:
|
||||
|
|
|
|||
|
|
@ -8,8 +8,8 @@ from unittest.mock import patch
|
|||
|
||||
import pytest
|
||||
from botocore.exceptions import ClientError
|
||||
from llama_stack_api.apis.common.errors import ResourceNotFoundError
|
||||
from llama_stack_api.apis.files import OpenAIFilePurpose
|
||||
from llama_stack_api.common.errors import ResourceNotFoundError
|
||||
from llama_stack_api.files import OpenAIFilePurpose
|
||||
|
||||
|
||||
class TestS3FilesImpl:
|
||||
|
|
@ -227,7 +227,7 @@ class TestS3FilesImpl:
|
|||
|
||||
mock_now.return_value = 0
|
||||
|
||||
from llama_stack_api.apis.files import ExpiresAfter
|
||||
from llama_stack_api.files import ExpiresAfter
|
||||
|
||||
sample_text_file.filename = "test_expired_file"
|
||||
uploaded = await s3_provider.openai_upload_file(
|
||||
|
|
@ -259,7 +259,7 @@ class TestS3FilesImpl:
|
|||
|
||||
async def test_unsupported_expires_after_anchor(self, s3_provider, sample_text_file):
|
||||
"""Unsupported anchor value should raise ValueError."""
|
||||
from llama_stack_api.apis.files import ExpiresAfter
|
||||
from llama_stack_api.files import ExpiresAfter
|
||||
|
||||
sample_text_file.filename = "test_unsupported_expires_after_anchor"
|
||||
|
||||
|
|
@ -272,7 +272,7 @@ class TestS3FilesImpl:
|
|||
|
||||
async def test_nonint_expires_after_seconds(self, s3_provider, sample_text_file):
|
||||
"""Non-integer seconds in expires_after should raise ValueError."""
|
||||
from llama_stack_api.apis.files import ExpiresAfter
|
||||
from llama_stack_api.files import ExpiresAfter
|
||||
|
||||
sample_text_file.filename = "test_nonint_expires_after_seconds"
|
||||
|
||||
|
|
@ -285,7 +285,7 @@ class TestS3FilesImpl:
|
|||
|
||||
async def test_expires_after_seconds_out_of_bounds(self, s3_provider, sample_text_file):
|
||||
"""Seconds outside allowed range should raise ValueError."""
|
||||
from llama_stack_api.apis.files import ExpiresAfter
|
||||
from llama_stack_api.files import ExpiresAfter
|
||||
|
||||
with pytest.raises(ValueError, match="greater than or equal to 3600"):
|
||||
await s3_provider.openai_upload_file(
|
||||
|
|
|
|||
|
|
@ -7,8 +7,8 @@
|
|||
from unittest.mock import patch
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.common.errors import ResourceNotFoundError
|
||||
from llama_stack_api.apis.files import OpenAIFilePurpose
|
||||
from llama_stack_api.common.errors import ResourceNotFoundError
|
||||
from llama_stack_api.files import OpenAIFilePurpose
|
||||
|
||||
from llama_stack.core.datatypes import User
|
||||
from llama_stack.providers.remote.files.s3.files import S3FilesImpl
|
||||
|
|
|
|||
|
|
@ -8,7 +8,7 @@ from types import SimpleNamespace
|
|||
from unittest.mock import AsyncMock, MagicMock
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.inference import OpenAIChatCompletionRequestWithExtraBody
|
||||
from llama_stack_api.inference import OpenAIChatCompletionRequestWithExtraBody
|
||||
from openai import AuthenticationError
|
||||
|
||||
from llama_stack.providers.remote.inference.bedrock.bedrock import BedrockInferenceAdapter
|
||||
|
|
|
|||
|
|
@ -9,7 +9,8 @@ import time
|
|||
from unittest.mock import AsyncMock, MagicMock, PropertyMock, patch
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.inference import (
|
||||
from llama_stack_api.datatypes import HealthStatus
|
||||
from llama_stack_api.inference import (
|
||||
OpenAIAssistantMessageParam,
|
||||
OpenAIChatCompletion,
|
||||
OpenAIChatCompletionRequestWithExtraBody,
|
||||
|
|
@ -19,8 +20,7 @@ from llama_stack_api.apis.inference import (
|
|||
OpenAICompletionRequestWithExtraBody,
|
||||
ToolChoice,
|
||||
)
|
||||
from llama_stack_api.apis.models import Model
|
||||
from llama_stack_api.providers.datatypes import HealthStatus
|
||||
from llama_stack_api.models import Model
|
||||
|
||||
from llama_stack.core.routers.inference import InferenceRouter
|
||||
from llama_stack.core.routing_tables.models import ModelsRoutingTable
|
||||
|
|
|
|||
|
|
@ -7,7 +7,7 @@
|
|||
from unittest.mock import AsyncMock
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.tools import ToolDef
|
||||
from llama_stack_api.tools import ToolDef
|
||||
|
||||
from llama_stack.providers.inline.agents.meta_reference.responses.streaming import (
|
||||
convert_tooldef_to_chat_tool,
|
||||
|
|
|
|||
|
|
@ -8,8 +8,8 @@ import os
|
|||
from unittest.mock import patch
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.datasets import Dataset, DatasetPurpose, URIDataSource
|
||||
from llama_stack_api.apis.resource import ResourceType
|
||||
from llama_stack_api.datasets import Dataset, DatasetPurpose, URIDataSource
|
||||
from llama_stack_api.resource import ResourceType
|
||||
|
||||
from llama_stack.providers.remote.datasetio.nvidia.config import NvidiaDatasetIOConfig
|
||||
from llama_stack.providers.remote.datasetio.nvidia.datasetio import NvidiaDatasetIOAdapter
|
||||
|
|
|
|||
|
|
@ -8,11 +8,11 @@ import os
|
|||
from unittest.mock import MagicMock, patch
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.benchmarks import Benchmark
|
||||
from llama_stack_api.apis.common.job_types import Job, JobStatus
|
||||
from llama_stack_api.apis.eval.eval import BenchmarkConfig, EvaluateResponse, ModelCandidate, SamplingParams
|
||||
from llama_stack_api.apis.inference.inference import TopPSamplingStrategy
|
||||
from llama_stack_api.apis.resource import ResourceType
|
||||
from llama_stack_api.benchmarks import Benchmark
|
||||
from llama_stack_api.common.job_types import Job, JobStatus
|
||||
from llama_stack_api.eval import BenchmarkConfig, EvaluateResponse, ModelCandidate, SamplingParams
|
||||
from llama_stack_api.inference import TopPSamplingStrategy
|
||||
from llama_stack_api.resource import ResourceType
|
||||
|
||||
from llama_stack.models.llama.sku_types import CoreModelId
|
||||
from llama_stack.providers.remote.eval.nvidia.config import NVIDIAEvalConfig
|
||||
|
|
|
|||
|
|
@ -9,7 +9,7 @@ import warnings
|
|||
from unittest.mock import patch
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.post_training.post_training import (
|
||||
from llama_stack_api.post_training import (
|
||||
DataConfig,
|
||||
DatasetFormat,
|
||||
EfficiencyConfig,
|
||||
|
|
|
|||
|
|
@ -8,7 +8,7 @@ from unittest.mock import AsyncMock, MagicMock, patch
|
|||
|
||||
import aiohttp
|
||||
import pytest
|
||||
from llama_stack_api.apis.models import ModelType
|
||||
from llama_stack_api.models import ModelType
|
||||
|
||||
from llama_stack.providers.remote.inference.nvidia.config import NVIDIAConfig
|
||||
from llama_stack.providers.remote.inference.nvidia.nvidia import NVIDIAInferenceAdapter
|
||||
|
|
|
|||
|
|
@ -9,13 +9,13 @@ from typing import Any
|
|||
from unittest.mock import AsyncMock, MagicMock, patch
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.inference import (
|
||||
from llama_stack_api.inference import (
|
||||
OpenAIAssistantMessageParam,
|
||||
OpenAIUserMessageParam,
|
||||
)
|
||||
from llama_stack_api.apis.resource import ResourceType
|
||||
from llama_stack_api.apis.safety import RunShieldResponse, ViolationLevel
|
||||
from llama_stack_api.apis.shields import Shield
|
||||
from llama_stack_api.resource import ResourceType
|
||||
from llama_stack_api.safety import RunShieldResponse, ViolationLevel
|
||||
from llama_stack_api.shields import Shield
|
||||
|
||||
from llama_stack.providers.remote.safety.nvidia.config import NVIDIASafetyConfig
|
||||
from llama_stack.providers.remote.safety.nvidia.nvidia import NVIDIASafetyAdapter
|
||||
|
|
|
|||
|
|
@ -9,7 +9,7 @@ import warnings
|
|||
from unittest.mock import patch
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.post_training.post_training import (
|
||||
from llama_stack_api.post_training import (
|
||||
DataConfig,
|
||||
DatasetFormat,
|
||||
LoraFinetuningConfig,
|
||||
|
|
|
|||
|
|
@ -7,7 +7,7 @@
|
|||
from types import SimpleNamespace
|
||||
from unittest.mock import AsyncMock, PropertyMock, patch
|
||||
|
||||
from llama_stack_api.apis.inference import OpenAIChatCompletionRequestWithExtraBody
|
||||
from llama_stack_api.inference import OpenAIChatCompletionRequestWithExtraBody
|
||||
|
||||
from llama_stack.providers.remote.inference.bedrock.bedrock import BedrockInferenceAdapter
|
||||
from llama_stack.providers.remote.inference.bedrock.config import BedrockConfig
|
||||
|
|
|
|||
|
|
@ -10,8 +10,8 @@ from typing import Any
|
|||
from unittest.mock import AsyncMock, MagicMock, Mock, PropertyMock, patch
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.inference import Model, OpenAIChatCompletionRequestWithExtraBody, OpenAIUserMessageParam
|
||||
from llama_stack_api.apis.models import ModelType
|
||||
from llama_stack_api.inference import Model, OpenAIChatCompletionRequestWithExtraBody, OpenAIUserMessageParam
|
||||
from llama_stack_api.models import ModelType
|
||||
from pydantic import BaseModel, Field
|
||||
|
||||
from llama_stack.core.request_headers import request_provider_data_context
|
||||
|
|
|
|||
|
|
@ -4,7 +4,7 @@
|
|||
# This source code is licensed under the terms described in the LICENSE file in
|
||||
# the root directory of this source tree.
|
||||
|
||||
from llama_stack_api.apis.inference import (
|
||||
from llama_stack_api.inference import (
|
||||
OpenAIAssistantMessageParam,
|
||||
OpenAIUserMessageParam,
|
||||
)
|
||||
|
|
|
|||
|
|
@ -7,8 +7,8 @@
|
|||
from unittest.mock import AsyncMock, MagicMock, patch
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.common.content_types import URL, TextContentItem
|
||||
from llama_stack_api.apis.tools import RAGDocument
|
||||
from llama_stack_api.common.content_types import URL, TextContentItem
|
||||
from llama_stack_api.rag_tool import RAGDocument
|
||||
|
||||
from llama_stack.providers.utils.memory.vector_store import content_from_data_and_mime_type, content_from_doc
|
||||
|
||||
|
|
|
|||
|
|
@ -34,7 +34,7 @@
|
|||
#
|
||||
|
||||
import pytest
|
||||
from llama_stack_api.apis.models import Model
|
||||
from llama_stack_api.models import Model
|
||||
|
||||
from llama_stack.providers.utils.inference.model_registry import ModelRegistryHelper, ProviderModelEntry
|
||||
|
||||
|
|
|
|||
|
|
@ -9,8 +9,8 @@ from unittest.mock import AsyncMock, MagicMock, patch
|
|||
|
||||
import numpy as np
|
||||
import pytest
|
||||
from llama_stack_api.apis.vector_io import Chunk, ChunkMetadata, QueryChunksResponse
|
||||
from llama_stack_api.apis.vector_stores import VectorStore
|
||||
from llama_stack_api.vector_io import Chunk, ChunkMetadata, QueryChunksResponse
|
||||
from llama_stack_api.vector_stores import VectorStore
|
||||
|
||||
from llama_stack.core.storage.datatypes import KVStoreReference, SqliteKVStoreConfig
|
||||
from llama_stack.providers.inline.vector_io.faiss.config import FaissVectorIOConfig
|
||||
|
|
|
|||
|
|
@ -9,10 +9,10 @@ from unittest.mock import MagicMock, patch
|
|||
|
||||
import numpy as np
|
||||
import pytest
|
||||
from llama_stack_api.apis.files import Files
|
||||
from llama_stack_api.apis.vector_io import Chunk, QueryChunksResponse
|
||||
from llama_stack_api.apis.vector_stores import VectorStore
|
||||
from llama_stack_api.providers.datatypes import HealthStatus
|
||||
from llama_stack_api.datatypes import HealthStatus
|
||||
from llama_stack_api.files import Files
|
||||
from llama_stack_api.vector_io import Chunk, QueryChunksResponse
|
||||
from llama_stack_api.vector_stores import VectorStore
|
||||
|
||||
from llama_stack.providers.inline.vector_io.faiss.config import FaissVectorIOConfig
|
||||
from llama_stack.providers.inline.vector_io.faiss.faiss import (
|
||||
|
|
|
|||
|
|
@ -8,7 +8,7 @@ import asyncio
|
|||
|
||||
import numpy as np
|
||||
import pytest
|
||||
from llama_stack_api.apis.vector_io import Chunk, QueryChunksResponse
|
||||
from llama_stack_api.vector_io import Chunk, QueryChunksResponse
|
||||
|
||||
from llama_stack.providers.inline.vector_io.sqlite_vec.sqlite_vec import (
|
||||
SQLiteVecIndex,
|
||||
|
|
|
|||
|
|
@ -10,8 +10,8 @@ from unittest.mock import AsyncMock, patch
|
|||
|
||||
import numpy as np
|
||||
import pytest
|
||||
from llama_stack_api.apis.common.errors import VectorStoreNotFoundError
|
||||
from llama_stack_api.apis.vector_io import (
|
||||
from llama_stack_api.common.errors import VectorStoreNotFoundError
|
||||
from llama_stack_api.vector_io import (
|
||||
Chunk,
|
||||
OpenAICreateVectorStoreFileBatchRequestWithExtraBody,
|
||||
OpenAICreateVectorStoreRequestWithExtraBody,
|
||||
|
|
@ -19,7 +19,7 @@ from llama_stack_api.apis.vector_io import (
|
|||
VectorStoreChunkingStrategyAuto,
|
||||
VectorStoreFileObject,
|
||||
)
|
||||
from llama_stack_api.apis.vector_stores import VectorStore
|
||||
from llama_stack_api.vector_stores import VectorStore
|
||||
|
||||
from llama_stack.providers.inline.vector_io.sqlite_vec.sqlite_vec import VECTOR_DBS_PREFIX
|
||||
|
||||
|
|
@ -222,7 +222,7 @@ async def test_insert_chunks_missing_db_raises(vector_io_adapter):
|
|||
|
||||
async def test_insert_chunks_with_missing_document_id(vector_io_adapter):
|
||||
"""Ensure no KeyError when document_id is missing or in different places."""
|
||||
from llama_stack_api.apis.vector_io import Chunk, ChunkMetadata
|
||||
from llama_stack_api.vector_io import Chunk, ChunkMetadata
|
||||
|
||||
fake_index = AsyncMock()
|
||||
vector_io_adapter.cache["db1"] = fake_index
|
||||
|
|
@ -255,7 +255,7 @@ async def test_insert_chunks_with_missing_document_id(vector_io_adapter):
|
|||
|
||||
async def test_document_id_with_invalid_type_raises_error():
|
||||
"""Ensure TypeError is raised when document_id is not a string."""
|
||||
from llama_stack_api.apis.vector_io import Chunk
|
||||
from llama_stack_api.vector_io import Chunk
|
||||
|
||||
# Integer document_id should raise TypeError
|
||||
from llama_stack.providers.utils.vector_io.vector_utils import generate_chunk_id
|
||||
|
|
|
|||
|
|
@ -4,7 +4,7 @@
|
|||
# This source code is licensed under the terms described in the LICENSE file in
|
||||
# the root directory of this source tree.
|
||||
|
||||
from llama_stack_api.apis.vector_io import Chunk, ChunkMetadata
|
||||
from llama_stack_api.vector_io import Chunk, ChunkMetadata
|
||||
|
||||
from llama_stack.providers.utils.vector_io.vector_utils import generate_chunk_id
|
||||
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue