llama-stack-mirror/tests/integration/common/recordings/62312134a706e1315ae2fc9a3e56cc13492eb4bc5b276181d8e1a95d156686b6.json
Eric Huang 0424e33172 test
# What does this PR do?


## Test Plan
2025-10-08 13:46:46 -07:00

60 lines
1.9 KiB
JSON

{
"test_id": null,
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "Test trace openai with temperature 1"
}
],
"max_tokens": 100,
"stream": false,
"temperature": 0.7,
"extra_body": {}
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.chat.chat_completion.ChatCompletion",
"__data__": {
"id": "rec-62312134a706",
"choices": [
{
"finish_reason": "length",
"index": 0,
"logprobs": null,
"message": {
"content": "You want to test a model's behavior on the \"openai\" task using a temperature of 1.\n\nThe \"openai\" task is not a standard benchmark, so I'll assume you're referring to a task that tests the model's ability to reason and generate text in a way similar to OpenAI's language models. Here's an example code snippet that uses a popular library for testing language models, `transformers`, to test a model with a temperature of 1:\n\n```python\n",
"refusal": null,
"role": "assistant",
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": null
}
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 100,
"prompt_tokens": 33,
"total_tokens": 133,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}