mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-04 12:07:34 +00:00
rename ModelInference to Inference
This commit is contained in:
parent
245461620d
commit
67f0510edd
18 changed files with 468 additions and 1636 deletions
|
@ -10,12 +10,12 @@ from .api import (
|
|||
ChatCompletionResponseStreamChunk,
|
||||
CompletionRequest,
|
||||
InstructModel,
|
||||
ModelInference,
|
||||
Inference,
|
||||
UserMessage,
|
||||
)
|
||||
|
||||
|
||||
class ModelInferenceClient(ModelInference):
|
||||
class InferenceClient(Inference):
|
||||
def __init__(self, base_url: str):
|
||||
self.base_url = base_url
|
||||
|
||||
|
@ -48,7 +48,7 @@ class ModelInferenceClient(ModelInference):
|
|||
|
||||
|
||||
async def run_main(host: str, port: int):
|
||||
client = ModelInferenceClient(f"http://{host}:{port}")
|
||||
client = InferenceClient(f"http://{host}:{port}")
|
||||
|
||||
message = UserMessage(content="hello world, help me out here")
|
||||
req = ChatCompletionRequest(
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue