mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-04 04:04:14 +00:00
# What does this PR do? recorded for: ./scripts/integration-tests.sh --stack-config server:ci-tests --suite base --setup fireworks --subdirs inference --pattern openai ## Test Plan ./scripts/integration-tests.sh --stack-config server:ci-tests --suite base --setup fireworks --subdirs inference --pattern openai
31 lines
802 B
JSON
31 lines
802 B
JSON
{
|
|
"request": {
|
|
"method": "POST",
|
|
"url": "https://api.fireworks.ai/inference/v1/v1/embeddings",
|
|
"headers": {},
|
|
"body": {
|
|
"model": "accounts/fireworks/models/qwen3-embedding-8b",
|
|
"input": [],
|
|
"encoding_format": "float"
|
|
},
|
|
"endpoint": "/v1/embeddings",
|
|
"model": "accounts/fireworks/models/qwen3-embedding-8b"
|
|
},
|
|
"response": {
|
|
"body": {
|
|
"__type__": "openai.types.create_embedding_response.CreateEmbeddingResponse",
|
|
"__data__": {
|
|
"data": [],
|
|
"model": "accounts/fireworks/models/qwen3-embedding-8b",
|
|
"object": "list",
|
|
"usage": {
|
|
"prompt_tokens": 0,
|
|
"total_tokens": 0,
|
|
"completion_tokens": 0
|
|
},
|
|
"perf_metrics": null
|
|
}
|
|
},
|
|
"is_streaming": false
|
|
}
|
|
}
|