Temporary Commit at 1/6/2025, 8:13:09 PM

Summary:
### THIS DIFF

### PLAN

### CONTEXT

### DESIGN

Test Plan:
# Test Setup

**Type check and verify that the build compiles**

**Unit Tests**

**E2E Tests**

// Screenshots and videos
| Before | After |
|--|--|
| … | … |

# Monitoring Plan
Sixian Yi 2025-01-06 20:13:10 -08:00
parent b719743be9
commit bf610adf9b
25 changed files with 305 additions and 3 deletions

.github/.watchman-cookie-sxyi-mbp-77593-68 (vendored, executable, 0 changes)
.github/.watchman-cookie-sxyi-mbp-77593-69 (vendored, executable, 0 changes)
.github/.watchman-cookie-sxyi-mbp-77593-70 (vendored, executable, 0 changes)


@@ -0,0 +1,112 @@
import os
import re
import signal
import subprocess
import time

import yaml

from typing import List
from pathlib import Path

from llama_stack.apis import inference
from llama_stack.distribution.datatypes import Provider

import pytest

# Inference provider and the required environment arg for running integration tests
INFERENCE_PROVIDER_ENV_KEY = {
    "ollama": None,
    "fireworks": "FIREWORKS_API_KEY",
    "together": "TOGETHER_API_KEY",
}

TEST_MODELS = {
    "text": "meta-llama/Llama-3.1-8B-Instruct",
    "vision": "meta-llama/Llama-3.2-11B-Vision-Instruct",
}

# Model category and the keywords of the corresponding functionality tests
CATEGORY_FUNCTIONALITY_TESTS = {
    "text": ["streaming", "tool_calling", "structured_output"],
    "vision": [
        "streaming",
    ],
}


class TestConfig:
    class ModelTest:
        model_type: str
        model_name: str
        test_path: str
        providers: List[str]
        apis: List[str]
        capabilities: List[str]

    model_tests: List[ModelTest]


def generate_pytest_args(category, provider, test_keywords, env_key):
    test_path = (
        "./llama_stack/providers/tests/inference/test_{model_type}_inference.py".format(
            model_type=category
        )
    )
    pytest_args = [
        test_path,
        "-v",
        # "-s",
        "-k",
        "{provider} and ({test_keywords})".format(
            provider=provider, test_keywords=" or ".join(test_keywords)
        ),
        "--inference-model={model_name}".format(model_name=TEST_MODELS[category]),
    ]
    if env_key is not None:
        pytest_args.extend(
            [
                "--env",
                "{key_name}={key_value}".format(
                    key_name=env_key, key_value=os.getenv(env_key)
                ),
            ]
        )
    return pytest_args


def main():
    test_result = []
    path = Path(__file__).parent / "ci_test_config.yml"
    with open(path, "r") as f:
        data = yaml.load(f, Loader=yaml.SafeLoader)
    inference = data["inference"]
    model_tests = inference["model_tests"]

    # for model_category, test_keywords in CATEGORY_FUNCTIONALITY_TESTS.items():
    #     for provider, env_key in INFERENCE_PROVIDER_ENV_KEY.items():
    #         if provider == "ollama":
    #             ollama_model_alias = (
    #                 "llama3.1:8b-instruct-fp16"
    #                 if model_category == "text"
    #                 else "llama3.2-vision:11b-instruct-fp16"
    #             )
    #             proc = subprocess.Popen(["ollama", "run", ollama_model_alias])
    #             retcode = pytest.main(
    #                 generate_pytest_args(
    #                     model_category, provider, test_keywords, env_key
    #                 )
    #             )
    #             proc = subprocess.Popen(["ollama", "stop", ollama_model_alias])
    #         else:
    #             retcode = pytest.main(
    #                 generate_pytest_args(
    #                     model_category, provider, test_keywords, env_key
    #                 )
    #             )


if __name__ == "__main__":
    main()
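As a quick illustration (not part of the diff) of what `generate_pytest_args` composes, here is the argument list it would return for the text category against the fireworks provider; the `FIREWORKS_API_KEY` value is a placeholder pulled from the environment:

```python
# Illustrative only: the argument list generate_pytest_args builds for the
# "text" category on the "fireworks" provider, assuming FIREWORKS_API_KEY=abc123
# is set in the environment.
args = generate_pytest_args(
    "text", "fireworks", ["streaming", "tool_calling"], "FIREWORKS_API_KEY"
)
# args ==
# [
#     "./llama_stack/providers/tests/inference/test_text_inference.py",
#     "-v",
#     "-k", "fireworks and (streaming or tool_calling)",
#     "--inference-model=meta-llama/Llama-3.1-8B-Instruct",
#     "--env", "FIREWORKS_API_KEY=abc123",
# ]
```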


@@ -0,0 +1,22 @@
inference_providers:
  - ollama
  - fireworks
  - together
  - tgi
  - vllm

test_models:
  text: meta-llama/Llama-3.1-8B-Instruct
  vision: meta-llama/Llama-3.2-11B-Vision-Instruct

inference/test_vision_inference.py:
  - test_vision_chat_completion_streaming
  - test_vision_chat_completion_non_streaming

inference/test_text_inference.py:
  - test_structured_output
  - test_chat_completion_streaming
  - test_chat_completion_non_streaming
  - test_chat_completion_with_tool_calling
  - test_chat_completion_with_tool_calling_streaming


@@ -7,7 +7,8 @@
import os
from pathlib import Path
from typing import Any, Dict, List, Optional
import yaml
import json
import pytest
from dotenv import load_dotenv
from pydantic import BaseModel

@@ -73,6 +74,10 @@ def pytest_addoption(parser):
    parser.addoption(
        "--env", action="append", help="Set environment variables, e.g. --env KEY=value"
    )
    parser.addoption(
        "--config", action="append", help="Set the test config file, e.g. --config ci_test_config.yml"
    )


def make_provider_id(providers: Dict[str, str]) -> str:

@@ -148,6 +153,62 @@ def pytest_itemcollected(item):
        item.name = f"{item.name}[{marks}]"
# def pytest_ignore_collect(path, config):
#     # print("SIXIAN ignore", path)
#     # if config.getoption("--config") is None:
#     #     return False
#     manifest_path = Path(__file__).parent / "manifest.json"
#     files = json.loads(manifest_path.read_text(encoding="utf-8"))["files"]
#     file_path = set((Path(__file__).parent / f["path"]) for f in files)
#     # print("SIXIAN ", path.__class__.__name__)
#     # print("SIXIAN files", file_path)
#     if Path(path) not in file_path:
#         # print("SIXIAN ignoring", path, file_path)
#         return True
#     return False


def pytest_collection_modifyitems(config, items):
    manifest_path = Path(__file__).parent / "manifest.json"
    manifest = json.loads(manifest_path.read_text(encoding="utf-8"))
    mapping = dict()
    for f in manifest["files"]:
        mapping[f["basepath"]] = f["functions"]

    ret_items = []
    deselected = []
    print("SIXIAN test_file", items)
    for item in items:
        test_file = item.fspath.basename
        # print("SIXIAN test_file", test_file, "mapping", mapping)
        if test_file in mapping.keys():
            print("SIXIAN appending", item)
            ret_items.append(item)
        else:
            deselected.append(item)
    print("SIXIAN ret_items", ret_items)
    # Keep only items from files listed in the manifest and report the rest as deselected
    items[:] = ret_items
    config.hook.pytest_deselected(items=deselected)


# class ManifestDirectory(pytest.Directory):
#     def collect(self):
#         manifest_path = self.path / "manifest.json"
#         manifest = json.loads(manifest_path.read_text(encoding="utf-8"))
#         ihook = self.ihook
#         for file in manifest["files"]:
#             yield from ihook.pytest_collect_file(
#                 file_path=self.path / file, parent=self
#             )


# def pytest_collect_directory(path, parent):
#     if config.getoption("--env") is None:
#         return None
#     if path.joinpath("manifest.json").is_file():
#         return ManifestDirectory.from_parent(parent=parent, path=path)
#     return None


pytest_plugins = [
    "llama_stack.providers.tests.inference.fixtures",
    "llama_stack.providers.tests.safety.fixtures",


@@ -16,8 +16,6 @@ from llama_models.llama3.api.datatypes import (
    ToolPromptFormat,
)
from pydantic import BaseModel, ValidationError
from llama_stack.apis.inference import (
    ChatCompletionResponse,
    ChatCompletionResponseEventType,

@@ -33,6 +31,9 @@ from llama_stack.apis.inference import (
    UserMessage,
)
from llama_stack.apis.models import Model
from pydantic import BaseModel, ValidationError

from .utils import group_chunks


@@ -0,0 +1,21 @@
{
    "files": [
        {
            "basepath": "test_text_inference.py",
            "functions": [
                "test_structured_output",
                "test_chat_completion_streaming",
                "test_chat_completion_non_streaming",
                "test_chat_completion_with_tool_calling",
                "test_chat_completion_with_tool_calling_streaming"
            ]
        },
        {
            "basepath": "test_vision_inference.py",
            "functions": [
                "test_vision_chat_completion_streaming",
                "test_vision_chat_completion_non_streaming"
            ]
        }
    ]
}


@@ -0,0 +1,49 @@
inference:
  providers:
    - id: ollama
    - id: together
      env_param: TOGETHER_API_KEY
    - id: fireworks
      env_param: FIREWORKS_API_KEY
    - id: tgi
    - id: vllm
  apis:
    - chat_completion
    - embeddings
  capabilities:
    - streaming
    - tool_calling
    - structured_output
  model_tests:
    - model_type: vision
      model_name: meta-llama/Llama-3.2-11B-Vision-Instruct
      test_path: /llama_stack/providers/tests/inference/test_vision_inference.py
      test_api:
        - chat_completion
      test_capabilities:
        - streaming
    - model_type: text
      model_name: meta-llama/Llama-3.1-8B-Instruct
      test_path: /llama_stack/providers/tests/inference/test_text_inference.py
      test_api:
        - chat_completion
      test_capabilities:
        - streaming
        - tool_calling
        - structured_output
    - model_type: embedding
      model_name: sentence-transformers/all-MiniLM-L6-v2
      test_path: /llama_stack/providers/tests/inference/test_embeddings.py
      test_api:
        - embedding
      test_capabilities: ~

memory:
  providers:
    - faiss
    - weaviate
    - pgvector
    - chroma
  test_path:
    - /llama_stack/providers/tests/memory/test_memory.py
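To connect this config back to the runner script above, each `model_tests` entry can be expanded into a pytest command line. The sketch below is not part of the diff: the `-k` expression built from `test_capabilities` and the `lstrip("/")` handling of `test_path` are assumptions about how the entries would be consumed.

```python
import yaml

# Minimal sketch: turn each model_tests entry from ci_test_config.yml into a
# pytest command line. Assumes the script is run from the directory containing
# ci_test_config.yml.
with open("ci_test_config.yml") as f:
    config = yaml.safe_load(f)

for test in config["inference"]["model_tests"]:
    capabilities = test.get("test_capabilities") or []
    args = [
        test["test_path"].lstrip("/"),
        "-v",
        "--inference-model=" + test["model_name"],
    ]
    if capabilities:
        args += ["-k", " or ".join(capabilities)]
    print("pytest " + " ".join(args))
```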


@@ -0,0 +1,36 @@
import os
import subprocess

import yaml

TEST_CONFIG_YAML = "test-config.yaml"
OUTPUT_FILE = "run_tests.sh"


def get_data(yaml_file_name):
    with open(yaml_file_name, "r") as f:
        data = yaml.safe_load(f)
    return data


def main():
    test_config_yaml_path = os.path.join(os.path.dirname(__file__), TEST_CONFIG_YAML)
    data = get_data(test_config_yaml_path)

    output_file_path = os.path.join(os.path.dirname(__file__), OUTPUT_FILE)
    with open(output_file_path, "w") as f:
        print("Started writing to {}".format(OUTPUT_FILE))
        for provider in data["providers"].split(" "):
            for model in data["inference_models"]:
                inference_model, test_file = data["inference_models"][model].split(",")
                f.write(
                    'pytest -v -s -k "{}" --inference-model="{}" ./llama_stack/providers/tests/inference/{}\n'.format(
                        provider, inference_model, test_file[1:]
                    )
                )
        print("Finished writing to {}".format(OUTPUT_FILE))

    subprocess.run(["chmod", "+x", output_file_path])
    subprocess.run(["bash", output_file_path])


if __name__ == "__main__":
    main()
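The test-config.yaml this script reads is not included in the diff. Based on how main() parses it (`providers` split on spaces, each `inference_models` value split on a comma, with the leading space stripped by `test_file[1:]`), the expected shape would be roughly the following; all concrete values here are illustrative assumptions:

```python
# Hypothetical content of test-config.yaml implied by the parsing in main();
# not part of the committed change.
example_config = {
    "providers": "fireworks together",
    "inference_models": {
        "text": "meta-llama/Llama-3.1-8B-Instruct, test_text_inference.py",
        "vision": "meta-llama/Llama-3.2-11B-Vision-Instruct, test_vision_inference.py",
    },
}

# One resulting line of run_tests.sh would then look like:
# pytest -v -s -k "fireworks" --inference-model="meta-llama/Llama-3.1-8B-Instruct" ./llama_stack/providers/tests/inference/test_text_inference.py
```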
