Mirror of https://github.com/meta-llama/llama-stack.git (synced 2025-12-03 18:00:36 +00:00)
# What does this PR do?

- update Cerebras to use OpenAIMixin
- enable openai completions tests
- enable openai chat completions tests
- disable tests with n > 1
- add recording for --setup cerebras --subdirs inference --pattern openai

## Test Plan

`./scripts/integration-tests.sh --stack-config server:ci-tests --setup cerebras --subdirs inference --pattern openai`

```
tests/integration/inference/test_openai_completion.py::test_openai_completion_non_streaming[txt=cerebras/llama-3.3-70b-inference:completion:sanity]
instantiating llama_stack_client
Port 8321 is already in use, assuming server is already running...
llama_stack_client instantiated in 0.053s
PASSED [ 2%]
tests/integration/inference/test_openai_completion.py::test_openai_completion_non_streaming_suffix[txt=cerebras/llama-3.3-70b-inference:completion:suffix] SKIPPED (Suffix is not supported for the model: cerebras/llama-3.3-70b.) [ 4%]
tests/integration/inference/test_openai_completion.py::test_openai_completion_streaming[txt=cerebras/llama-3.3-70b-inference:completion:sanity] PASSED [ 6%]
tests/integration/inference/test_openai_completion.py::test_openai_completion_prompt_logprobs[txt=cerebras/llama-3.3-70b-1] SKIPPED (Model cerebras/llama-3.3-70b hosted by remote::cerebras doesn't support vllm extra_body parameters.) [ 8%]
tests/integration/inference/test_openai_completion.py::test_openai_completion_guided_choice[txt=cerebras/llama-3.3-70b] SKIPPED (Model cerebras/llama-3.3-70b hosted by remote::cerebras doesn't support vllm extra_body parameters.)
[ 10%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[openai_client-txt=cerebras/llama-3.3-70b-inference:chat_completion:non_streaming_01] PASSED [ 12%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[openai_client-txt=cerebras/llama-3.3-70b-inference:chat_completion:streaming_01] PASSED [ 14%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[openai_client-txt=cerebras/llama-3.3-70b-inference:chat_completion:streaming_01] SKIPPED (Model cerebras/llama-3.3-70b hosted by remote::cere...) [ 17%] tests/integration/inference/test_openai_completion.py::test_inference_store[openai_client-txt=cerebras/llama-3.3-70b-True] PASSED [ 19%] tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=cerebras/llama-3.3-70b-True] PASSED [ 21%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming_with_file[txt=cerebras/llama-3.3-70b] SKIPPED (Model cerebras/llama-3.3-70b hosted by remote::cerebras doesn't support chat completion calls wit...) 
[ 23%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_single_string[openai_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 25%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_multiple_strings[openai_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 27%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_encoding_format_float[openai_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 29%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_dimensions[openai_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 31%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_user_parameter[openai_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 34%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_empty_list_error[openai_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 36%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_invalid_model_error[openai_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 38%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_different_inputs_different_outputs[openai_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 40%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_encoding_format_base64[openai_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 42%] 
tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_base64_batch_processing[openai_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 44%] tests/integration/inference/test_openai_completion.py::test_openai_completion_prompt_logprobs[txt=cerebras/llama-3.3-70b-0] SKIPPED (Model cerebras/llama-3.3-70b hosted by remote::cerebras doesn't support vllm extra_body parameters.) [ 46%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[openai_client-txt=cerebras/llama-3.3-70b-inference:chat_completion:non_streaming_02] PASSED [ 48%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[openai_client-txt=cerebras/llama-3.3-70b-inference:chat_completion:streaming_02] PASSED [ 51%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[openai_client-txt=cerebras/llama-3.3-70b-inference:chat_completion:streaming_02] SKIPPED (Model cerebras/llama-3.3-70b hosted by remote::cere...) 
[ 53%] tests/integration/inference/test_openai_completion.py::test_inference_store[openai_client-txt=cerebras/llama-3.3-70b-False] PASSED [ 55%] tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=cerebras/llama-3.3-70b-False] PASSED [ 57%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_single_string[llama_stack_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 59%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_multiple_strings[llama_stack_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 61%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_encoding_format_float[llama_stack_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 63%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_dimensions[llama_stack_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 65%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_user_parameter[llama_stack_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 68%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_empty_list_error[llama_stack_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 70%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_invalid_model_error[llama_stack_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 72%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_different_inputs_different_outputs[llama_stack_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED 
(embedding_model_id empty - skipping test) [ 74%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_encoding_format_base64[llama_stack_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 76%] tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_base64_batch_processing[llama_stack_client-cerebras/llama-3.3-70b-None-None-None-384] SKIPPED (embedding_model_id empty - skipping test) [ 78%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[client_with_models-txt=cerebras/llama-3.3-70b-inference:chat_completion:non_streaming_01] PASSED [ 80%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[client_with_models-txt=cerebras/llama-3.3-70b-inference:chat_completion:streaming_01] PASSED [ 82%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[client_with_models-txt=cerebras/llama-3.3-70b-inference:chat_completion:streaming_01] SKIPPED (Model cerebras/llama-3.3-70b hosted by remote:...) 
[ 85%] tests/integration/inference/test_openai_completion.py::test_inference_store[client_with_models-txt=cerebras/llama-3.3-70b-True] PASSED [ 87%] tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=cerebras/llama-3.3-70b-True] PASSED [ 89%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[client_with_models-txt=cerebras/llama-3.3-70b-inference:chat_completion:non_streaming_02] PASSED [ 91%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[client_with_models-txt=cerebras/llama-3.3-70b-inference:chat_completion:streaming_02] PASSED [ 93%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[client_with_models-txt=cerebras/llama-3.3-70b-inference:chat_completion:streaming_02] SKIPPED (Model cerebras/llama-3.3-70b hosted by remote:...) [ 95%] tests/integration/inference/test_openai_completion.py::test_inference_store[client_with_models-txt=cerebras/llama-3.3-70b-False] PASSED [ 97%] tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=cerebras/llama-3.3-70b-False] PASSED [100%] =================================================================================================================== slowest 10 durations ==================================================================================================================== 0.37s call tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[openai_client-txt=cerebras/llama-3.3-70b-inference:chat_completion:non_streaming_01] 0.34s call tests/integration/inference/test_openai_completion.py::test_inference_store[openai_client-txt=cerebras/llama-3.3-70b-False] 0.18s call tests/integration/inference/test_openai_completion.py::test_inference_store[client_with_models-txt=cerebras/llama-3.3-70b-True] 0.17s setup 
tests/integration/inference/test_openai_completion.py::test_openai_completion_non_streaming[txt=cerebras/llama-3.3-70b-inference:completion:sanity] 0.15s call tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=cerebras/llama-3.3-70b-True] 0.13s call tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=cerebras/llama-3.3-70b-True] 0.12s call tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=cerebras/llama-3.3-70b-False] 0.12s call tests/integration/inference/test_openai_completion.py::test_inference_store[openai_client-txt=cerebras/llama-3.3-70b-True] 0.12s call tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=cerebras/llama-3.3-70b-False] 0.08s call tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[client_with_models-txt=cerebras/llama-3.3-70b-inference:chat_completion:streaming_02] ================================================================================================================== short test summary info ================================================================================================================== SKIPPED [1] tests/integration/inference/test_openai_completion.py:75: Suffix is not supported for the model: cerebras/llama-3.3-70b. SKIPPED [3] tests/integration/inference/test_openai_completion.py:123: Model cerebras/llama-3.3-70b hosted by remote::cerebras doesn't support vllm extra_body parameters. SKIPPED [4] tests/integration/inference/test_openai_completion.py:103: Model cerebras/llama-3.3-70b hosted by remote::cerebras doesn't support n param. SKIPPED [1] tests/integration/inference/test_openai_completion.py:129: Model cerebras/llama-3.3-70b hosted by remote::cerebras doesn't support chat completion calls with base64 encoded files. 
SKIPPED [2] tests/integration/inference/test_openai_embeddings.py:90: embedding_model_id empty - skipping test SKIPPED [2] tests/integration/inference/test_openai_embeddings.py:112: embedding_model_id empty - skipping test SKIPPED [2] tests/integration/inference/test_openai_embeddings.py:136: embedding_model_id empty - skipping test SKIPPED [2] tests/integration/inference/test_openai_embeddings.py:154: embedding_model_id empty - skipping test SKIPPED [2] tests/integration/inference/test_openai_embeddings.py:175: embedding_model_id empty - skipping test SKIPPED [2] tests/integration/inference/test_openai_embeddings.py:195: embedding_model_id empty - skipping test SKIPPED [2] tests/integration/inference/test_openai_embeddings.py:206: embedding_model_id empty - skipping test SKIPPED [2] tests/integration/inference/test_openai_embeddings.py:217: embedding_model_id empty - skipping test SKIPPED [2] tests/integration/inference/test_openai_embeddings.py:244: embedding_model_id empty - skipping test SKIPPED [2] tests/integration/inference/test_openai_embeddings.py:278: embedding_model_id empty - skipping test ================================================================================================= 18 passed, 29 skipped, 50 deselected, 4 warnings in 3.02s ================================================================================================= ``` |
||
|---|---|---|
| .. | ||
| 0b3f2e4754ff.json | ||
| 0b27fd737699.json | ||
| 00ba04f74a96.json | ||
| 0c1f45455d3b.json | ||
| 0d3290adae1d.json | ||
| 0e8f2b001dd9.json | ||
| 0fda25b9241c.json | ||
| 0ff78129bb3a.json | ||
| 1adfaa0e062e.json | ||
| 1b92be674e2a.json | ||
| 1b8394f90636.json | ||
| 1b45391880c6.json | ||
| 1e11c2b20ff8.json | ||
| 1f48f4b2ae33.json | ||
| 2afe3b38ca01.json | ||
| 2b2ad549510d.json | ||
| 2d187a11704c.json | ||
| 3a81146f2afa.json | ||
| 3c0bf9ba81b2.json | ||
| 3c3f13cb7794.json | ||
| 3ca695048bee.json | ||
| 3cdb5cab6ce6.json | ||
| 3dff18060ebc.json | ||
| 3ef0f9aab128.json | ||
| 4a3a4447b16b.json | ||
| 4ca6152a0eb8.json | ||
| 4d4440c8641b.json | ||
| 4de6877d86fa.json | ||
| 5db0c44c83a4.json | ||
| 5f5d16afadb4.json | ||
| 5fa0e98f3d84.json | ||
| 6c4e2e207e8a.json | ||
| 6cb0285a7638.json | ||
| 6cc063bbd7d3.json | ||
| 6d35c91287e2.json | ||
| 6d937e5e9233.json | ||
| 6f96090aa955.json | ||
| 6fbea1abca7c.json | ||
| 6fe1d4fedf12.json | ||
| 7b25b702ea18.json | ||
| 7b4815aba6c5.json | ||
| 7bcb0f86c91b.json | ||
| 07c5fa34d9ca.json | ||
| 7e6806cba34a.json | ||
| 7ef63231b9f8.json | ||
| 7f53b458dad9.json | ||
| 8bba71367e87.json | ||
| 9b9e8cf39b15.json | ||
| 9b812cbcb88d.json | ||
| 9c4bc9c3e7ac.json | ||
| 9c007f300365.json | ||
| 9c28ec9ac338.json | ||
| 9c140a29ae09.json | ||
| 9e7a83d3d596.json | ||
| 9e651e5fcfe2.json | ||
| 9f3d749cc1c8.json | ||
| 9fadf5a3d68f.json | ||
| 10eea8c15ddc.json | ||
| 011f70e24ce4.json | ||
| 35db283fef1d.json | ||
| 40f524d1934a.json | ||
| 41e27b9b5d09.json | ||
| 43e106de6736.json | ||
| 44a1d9de0602.json | ||
| 44fb9cf5875f.json | ||
| 48d2fb183a2a.json | ||
| 50a8dc5b8ece.json | ||
| 56ac6a7c6df0.json | ||
| 57b67d1b1a36.json | ||
| 61be36ad8ccd.json | ||
| 62aa454ea5f9.json | ||
| 70adef2c30c4.json | ||
| 72c1126ff2f9.json | ||
| 72e075bf28e8.json | ||
| 75d0dd9d0fa3.json | ||
| 76b89a84cd6f.json | ||
| 80e4404d8987.json | ||
| 80f09f27dd61.json | ||
| 81a91f79c51d.json | ||
| 83c2ffb72daa.json | ||
| 84cab42e1f5c.json | ||
| 89b141855b81.json | ||
| 90fec951fdb9.json | ||
| 94d11daee205.json | ||
| 97d3812bfccb.json | ||
| 97e259c0d3e5.json | ||
| 121a72d1c4cf.json | ||
| 173ecb3aab28.json | ||
| 177ba8517262.json | ||
| 198ef7208389.json | ||
| 211b1562d4e6.json | ||
| 249b7f0ddde6.json | ||
| 325a72db5755.json | ||
| 382c2f22274c.json | ||
| 390f0c7dac96.json | ||
| 432a346b2ed8.json | ||
| 441e2832387f.json | ||
| 477f8946bf7d.json | ||
| 511eb1b92e34.json | ||
| 545d86510a80.json | ||
| 0547d0909f24.json | ||
| 554de3cd986f.json | ||
| 563b994bb7d1.json | ||
| 565b1072cb9d.json | ||
| 802f60021837.json | ||
| 830a1fe14938.json | ||
| 836f51dfb3c5.json | ||
| 840fbb380b73.json | ||
| 894fdacb1cfa.json | ||
| 2983cc1d79f0.json | ||
| 3877ecf1bc62.json | ||
| 4014dd44c15f.json | ||
| 6730dcde0b73.json | ||
| 6857b19d3f0a.json | ||
| 6906a6e71988.json | ||
| 7354ec181984.json | ||
| 12913f20f6ac.json | ||
| 17030e75309f.json | ||
| 17253d7cc667.json | ||
| 23506e73bb9e.json | ||
| 28648cf8d421.json | ||
| 29585e055e6f.json | ||
| 31407e035752.json | ||
| 50340cd4d253.json | ||
| 67198cbad48f.json | ||
| 85594a69d74a.json | ||
| 140187e305dc.json | ||
| 174458ad71b2.json | ||
| 178016edef0e.json | ||
| 197228e26971.json | ||
| 561746e1c8de.json | ||
| 0648374e43e7.json | ||
| 731824c54461.json | ||
| 875323ed9913.json | ||
| 4096743baf8e.json | ||
| 04172112ffbb.json | ||
| 4597743bcd2a.json | ||
| 8295382a8e7c.json | ||
| 8752115f8d0c.json | ||
| 27463384d1a3.json | ||
| 4420515208a8.json | ||
| 5370751803dc.json | ||
| 6412295819a1.json | ||
| 417020320684.json | ||
| a0c4df33879f.json | ||
| a1c5bf09ea53.json | ||
| a4c8d19bb1eb.json | ||
| a59d0d7c1485.json | ||
| a98eecadddc8.json | ||
| a410d4840402.json | ||
| a5187d9d5057.json | ||
| a6810c23eda8.json | ||
| a97477559b10.json | ||
| aacf9abc51d4.json | ||
| ae1c22f18ecc.json | ||
| ae6835cfe70e.json | ||
| af6ca03dcbc3.json | ||
| afb33182f365.json | ||
| b4cda53cd04f.json | ||
| b5e3ed420986.json | ||
| b9f6e724ae06.json | ||
| b14ff438ca99.json | ||
| b44cc7a7afc8.json | ||
| b91f1fb4aedb.json | ||
| b459f403a5ae.json | ||
| b612debbd3bf.json | ||
| b24590574a85.json | ||
| bbd0637dce16.json | ||
| bce560cbf1c6.json | ||
| bd356b27a085.json | ||
| bf79a89cc37f.json | ||
| c9cba6f3ee38.json | ||
| c31a86ea6c58.json | ||
| c2199d6064db.json | ||
| c7582fa7c2c4.json | ||
| c791119e6359.json | ||
| c9667519ad7c.json | ||
| cb3df2a1dc22.json | ||
| cd094caaf1c0.json | ||
| cf55f983d1ff.json | ||
| d0ac68cbde69.json | ||
| d3e27b7234e2.json | ||
| d4c86ac355fb.json | ||
| d4f56d7d1996.json | ||
| d64ffaa0de6f.json | ||
| d86d4fc1eaca.json | ||
| d85689907fec.json | ||
| da531c71e64f.json | ||
| dac7a32e5db9.json | ||
| dbc41d2417e1.json | ||
| dc8120cf0774.json | ||
| dd9e7d5913e9.json | ||
| dd226d71f844.json | ||
| decfd950646c.json | ||
| e0a6dce1d94b.json | ||
| e2c9b07709fe.json | ||
| e08e01e5652a.json | ||
| e9c8a0e4f0e0.json | ||
| e08848bfcd28.json | ||
| e509387fc329.json | ||
| e29300494763.json | ||
| e96152610712.json | ||
| ecae140151d1.json | ||
| ecf6f0c51485.json | ||
| ed9e9b34008d.json | ||
| eee6a163b837.json | ||
| eee47930e3ae.json | ||
| eefb4206a4a9.json | ||
| ef59cbff54d0.json | ||
| ef757a75ed08.json | ||
| f0bbea34c5cc.json | ||
| f1ea938b0b0d.json | ||
| f3c3afbd9b7e.json | ||
| f6d655e91ac3.json | ||
| f70f30f54211.json | ||
| f80b99430f7e.json | ||
| f477c2fe1332.json | ||
| f518ea4fde7d.json | ||
| f1592dee71e5.json | ||
| f6857bcea729.json | ||
| fb785db7fafd.json | ||
| fcdef245da95.json | ||
| fe140befeba4.json | ||
| ff7db0102b28.json | ||
| ff3271401fb4.json | ||
| ffd7b58fded8.json | ||
| models-4a3a4447b16b-3057338f.json | ||
| models-bd032f995f2a-af43cc69.json | ||