chore: introduce write queue for response_store

# What does this PR do?


## Test Plan
This commit is contained in:
Eric Huang 2025-09-19 16:02:02 -07:00
parent d3600b92d1
commit 7660ba844f
4 changed files with 128 additions and 7 deletions

View file

@@ -433,6 +433,12 @@ class InferenceStoreConfig(BaseModel):
num_writers: int = Field(default=4, description="Number of concurrent background writers")
# Settings model for the responses store: the SQL store configuration plus
# the two write-queue knobs described on the fields below.
class ResponsesStoreConfig(BaseModel):
    # Required field: no default is supplied, so it must be provided.
    sql_store_config: SqlStoreConfig
    # Upper bound on queued writes (defaults to 10000).
    max_write_queue_size: int = Field(
        default=10000,
        description="Max queued writes for responses store",
    )
    # Number of concurrent background writers (defaults to 4).
    num_writers: int = Field(
        default=4,
        description="Number of concurrent background writers",
    )
class StackRunConfig(BaseModel):
version: int = LLAMA_STACK_RUN_CONFIG_VERSION