mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-05 20:27:35 +00:00
feat: update Cerebras inference provider to support dynamic model listing
- update Cerebras to use OpenAIMixin
- enable openai completions tests
- enable openai chat completions tests
- disable tests with n > 1
- add recording for --setup cerebras --subdirs inference --pattern openai

test with: `./scripts/integration-tests.sh --stack-config server:ci-tests --setup cerebras --subdirs inference --pattern openai`
This commit is contained in:
parent
521865c388
commit
1f7e87c647
16 changed files with 3369 additions and 14 deletions
|
@@ -108,6 +108,13 @@ SETUP_DEFINITIONS: dict[str, Setup] = {
|
|||
"embedding_model": "together/togethercomputer/m2-bert-80M-32k-retrieval",
|
||||
},
|
||||
),
|
||||
"cerebras": Setup(
|
||||
name="cerebras",
|
||||
description="Cerebras models",
|
||||
defaults={
|
||||
"text_model": "cerebras/llama-3.3-70b",
|
||||
},
|
||||
),
|
||||
}
|
||||
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue