Mirror of https://github.com/meta-llama/llama-stack.git (synced 2025-07-23 21:04:29 +00:00)
fix: OAI compat endpoint for meta reference inference provider (#1962)
Test plan: python tests/verifications/generate_report.py --providers fireworks,together,llama_meta_ref,openai
Co-authored-by: Eric Huang <erichuang@fb.com>
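For convenience, a minimal Python sketch of the same verification run as in the test plan above. The script path, flag, and provider names come from the test plan; the subprocess wrapper and the assumption that the stack servers are already running are illustrative only.

    # Sketch only: drives the report generator exactly as in the test plan.
    # Assumes it is run from the repository root with the configured
    # providers (including the meta-reference server) reachable.
    import subprocess
    import sys

    providers = ["fireworks", "together", "llama_meta_ref", "openai"]
    subprocess.run(
        [
            sys.executable,
            "tests/verifications/generate_report.py",
            "--providers",
            ",".join(providers),
        ],
        check=True,
    )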
This commit is contained in:
parent 8bd6665775
commit 2976b5d992
8 changed files with 1184 additions and 44 deletions
tests/verifications/conf/meta_reference.yaml (new file, +8)
@@ -0,0 +1,8 @@
+# LLAMA_STACK_PORT=5002 llama stack run meta-reference-gpu --env INFERENCE_MODEL=meta-llama/Llama-4-Scout-17B-16E-Instruct --env INFERENCE_CHECKPOINT_DIR=<path_to_ckpt>
+base_url: http://localhost:5002/v1/openai/v1
+api_key_var: foo
+models:
+- meta-llama/Llama-4-Scout-17B-16E-Instruct
+model_display_names:
+  meta-llama/Llama-4-Scout-17B-16E-Instruct: Llama-4-Scout-Instruct
+test_exclusions: {}
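For context, a minimal Python sketch of the kind of request this config points the verification suite at: an OpenAI-compatible chat completion against the meta-reference server. The base_url and model are taken from meta_reference.yaml above; the use of the openai client, the prompt, and the way api_key_var is resolved from the environment are assumptions for illustration.

    # Sketch only: exercises the OpenAI-compatible endpoint exposed by the
    # meta-reference stack, using values from meta_reference.yaml above.
    import os

    from openai import OpenAI

    client = OpenAI(
        base_url="http://localhost:5002/v1/openai/v1",
        # api_key_var is "foo" in the config; reading the key from an
        # environment variable of that name is an assumption here, and the
        # fallback value is only a placeholder.
        api_key=os.environ.get("foo", "not-needed"),
    )

    response = client.chat.completions.create(
        model="meta-llama/Llama-4-Scout-17B-16E-Instruct",
        messages=[{"role": "user", "content": "Say hello in one sentence."}],
    )
    print(response.choices[0].message.content)

Presumably, the model_display_names mapping only affects how the model is labeled in the generated report and does not change the request itself.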