# Copyright (c) Meta Platforms, Inc. and affiliates. # All rights reserved. # # This source code is licensed under the terms described in the LICENSE file in # the root directory of this source tree. from typing import Optional from llama_models.schema_utils import json_schema_type from pydantic import BaseModel, Field @json_schema_type class VLLMInferenceAdapterConfig(BaseModel): url: Optional[str] = Field( default=None, description="The URL for the vLLM model serving endpoint", ) max_tokens: int = Field( default=4096, description="Maximum number of tokens to generate.", ) api_token: Optional[str] = Field( default="fake", description="The API token", )