models routing work

This commit is contained in:
Xi Yan 2024-09-19 08:48:10 -07:00
parent f3ff3a3001
commit 9bdd4e3dd9
3 changed files with 20 additions and 3 deletions

View file

@@ -90,7 +90,7 @@ async def run_main(host: str, port: int, stream: bool):
cprint(f"User>{message.content}", "green")
iterator = client.chat_completion(
ChatCompletionRequest(
-model="Meta-Llama3.1-8B-Instruct",
+model="ollama-1",
messages=[message],
stream=stream,
)