diff --git a/llama_stack/providers/tests/README.md b/llama_stack/providers/tests/README.md index 0fe191d07..6a4bc1d05 100644 --- a/llama_stack/providers/tests/README.md +++ b/llama_stack/providers/tests/README.md @@ -28,21 +28,21 @@ We have the following orthogonal parametrizations (pytest "marks") for inference If you want to run a test with the llama_8b model with fireworks, you can use: ```bash -pytest -s -v llama_stack/providers/tests/inference/test_inference.py \ +pytest -s -v llama_stack/providers/tests/inference/test_text_inference.py \ -m "fireworks and llama_8b" \ --env FIREWORKS_API_KEY=<...> ``` You can make it more complex to run both llama_8b and llama_3b on Fireworks, but only llama_3b with Ollama: ```bash -pytest -s -v llama_stack/providers/tests/inference/test_inference.py \ +pytest -s -v llama_stack/providers/tests/inference/test_text_inference.py \ -m "fireworks or (ollama and llama_3b)" \ --env FIREWORKS_API_KEY=<...> ``` Finally, you can override the model completely by doing: ```bash -pytest -s -v llama_stack/providers/tests/inference/test_inference.py \ +pytest -s -v llama_stack/providers/tests/inference/test_text_inference.py \ -m fireworks \ --inference-model "Llama3.1-70B-Instruct" \ --env FIREWORKS_API_KEY=<...> diff --git a/llama_stack/providers/tests/inference/test_inference.py b/llama_stack/providers/tests/inference/test_text_inference.py similarity index 99% rename from llama_stack/providers/tests/inference/test_inference.py rename to llama_stack/providers/tests/inference/test_text_inference.py index 342117536..7de0f7ec2 100644 --- a/llama_stack/providers/tests/inference/test_inference.py +++ b/llama_stack/providers/tests/inference/test_text_inference.py @@ -19,7 +19,7 @@ from .utils import group_chunks # How to run this test: # -# pytest -v -s llama_stack/providers/tests/inference/test_inference.py +# pytest -v -s llama_stack/providers/tests/inference/test_text_inference.py # -m "(fireworks or ollama) and llama_3b" # --env FIREWORKS_API_KEY=