diff --git a/llama_stack/templates/tgi/report.md b/llama_stack/templates/tgi/report.md index cc69923de..1f76ff692 100644 --- a/llama_stack/templates/tgi/report.md +++ b/llama_stack/templates/tgi/report.md @@ -21,25 +21,24 @@ ## Inference: | Model | API | Capability | Test | Status | |:----- |:-----|:-----|:-----|:-----| -| Text | /chat_completion | streaming | test_text_chat_completion_streaming | ✅ | -| Vision | /chat_completion | streaming | test_image_chat_completion_streaming | ⏭️ | -| Vision | /chat_completion | non_streaming | test_image_chat_completion_non_streaming | ⏭️ | -| Text | /chat_completion | non_streaming | test_text_chat_completion_non_streaming | ✅ | -| Text | /chat_completion | tool_calling | test_text_chat_completion_with_tool_calling_and_streaming | ✅ | -| Text | /chat_completion | tool_calling | test_text_chat_completion_with_tool_calling_and_non_streaming | ✅ | -| Text | /completion | streaming | test_text_completion_streaming | ✅ | -| Text | /completion | non_streaming | test_text_completion_non_streaming | ✅ | -| Text | /completion | structured_output | test_text_completion_structured_output | ✅ | +| Llama-3.1-8B-Instruct | /chat_completion | streaming | test_text_chat_completion_streaming | ✅ | +| Llama-3.2-11B-Vision-Instruct | /chat_completion | streaming | test_image_chat_completion_streaming | ❌ | +| Llama-3.2-11B-Vision-Instruct | /chat_completion | non_streaming | test_image_chat_completion_non_streaming | ❌ | +| Llama-3.1-8B-Instruct | /chat_completion | non_streaming | test_text_chat_completion_non_streaming | ✅ | +| Llama-3.1-8B-Instruct | /chat_completion | tool_calling | test_text_chat_completion_with_tool_calling_and_streaming | ✅ | +| Llama-3.1-8B-Instruct | /chat_completion | tool_calling | test_text_chat_completion_with_tool_calling_and_non_streaming | ✅ | +| Llama-3.1-8B-Instruct | /completion | streaming | test_text_completion_streaming | ✅ | +| Llama-3.1-8B-Instruct | /completion | non_streaming | test_text_completion_non_streaming | ✅ | +| Llama-3.1-8B-Instruct | /completion | structured_output | test_text_completion_structured_output | ✅ | -## Memory: +## Vector_io: | API | Capability | Test | Status | |:-----|:-----|:-----|:-----| -| /insert, /query | inline | test_memory_bank_insert_inline_and_query | ✅ | -| /insert, /query | url | test_memory_bank_insert_from_url_and_query | ✅ | +| /retrieve | | test_vector_db_retrieve | ✅ | ## Agents: | API | Capability | Test | Status | |:-----|:-----|:-----|:-----| -| create_agent_turn | rag | test_rag_agent | ✅ | -| create_agent_turn | custom_tool | test_custom_tool | ❌ | -| create_agent_turn | code_execution | test_code_execution | ✅ | +| /create_agent_turn | rag | test_rag_agent | ✅ | +| /create_agent_turn | custom_tool | test_custom_tool | ✅ | +| /create_agent_turn | code_execution | test_code_interpreter_for_attachments | ✅ |