mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-03 19:57:35 +00:00
21 lines
590 B
Python
21 lines
590 B
Python
# Copyright (c) Meta Platforms, Inc. and affiliates.
|
|
# All rights reserved.
|
|
#
|
|
# This source code is licensed under the terms described in the LICENSE file in
|
|
# the root directory of this source tree.
|
|
|
|
from typing import Optional
|
|
|
|
from pydantic import BaseModel
|
|
from strong_typing.schema import json_schema_type
|
|
|
|
from llama_toolchain.inference.api import QuantizationConfig
|
|
|
|
|
|
@json_schema_type
class MetaReferenceImplConfig(BaseModel):
    # Pydantic model, registered via `json_schema_type`, that declares the
    # settings below. `model` and `max_seq_len` carry no default and must be
    # supplied by the caller; the remaining fields are optional.

    # Required string naming the model.
    # NOTE(review): the accepted format (name vs. path) is not visible here.
    model: str

    # Optional quantization settings; None when not provided.
    quantization: Optional[QuantizationConfig] = None

    # Optional integer seed; None when not provided.
    # NOTE(review): presumably forwarded to torch's RNG -- confirm at the
    # point of use.
    torch_seed: Optional[int] = None

    # Required integer sequence-length limit.
    # NOTE(review): units (presumably tokens) are not established in this file.
    max_seq_len: int

    # Integer batch-size limit; defaults to 1.
    max_batch_size: int = 1
|