llama-stack-mirror/tests/integration/recordings/responses/e2c9b07709fe.json

{
  "request": {
    "method": "POST",
    "url": "http://localhost:11434/v1/v1/chat/completions",
    "headers": {},
    "body": {
      "model": "llama3.2:3b-instruct-fp16",
      "messages": [
        {
          "role": "user",
          "content": "Test trace openai with temperature 1"
        }
      ],
      "max_tokens": 100,
      "stream": false,
      "temperature": 0.7
    },
    "endpoint": "/v1/chat/completions",
    "model": "llama3.2:3b-instruct-fp16"
  },
  "response": {
    "body": {
      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
      "__data__": {
        "id": "chatcmpl-494",
        "choices": [
          {
            "finish_reason": "length",
            "index": 0,
            "logprobs": null,
            "message": {
              "content": "To test the OpenAI API with a temperature of 1, you can use the following Python code:\n\n```python\nimport requests\n\ndef generate_text(model_name, prompt, temperature=1):\n    # Set the API endpoint and parameters\n    url = \"https://api.openai.com/v1/models/\" + model_name + \"/generate\"\n    params = {\n        \"prompt\": prompt,\n        \"temperature\": temperature\n    }\n\n    # Send a GET request to the API\n    response =",
              "refusal": null,
              "role": "assistant",
              "annotations": null,
              "audio": null,
              "function_call": null,
              "tool_calls": null
            }
          }
        ],
        "created": 1754510067,
        "model": "llama3.2:3b-instruct-fp16",
        "object": "chat.completion",
        "service_tier": null,
        "system_fingerprint": "fp_ollama",
        "usage": {
          "completion_tokens": 100,
          "prompt_tokens": 33,
          "total_tokens": 133,
          "completion_tokens_details": null,
          "prompt_tokens_details": null
        }
      }
    },
    "is_streaming": false
  }
}