mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-08-03 17:29:01 +00:00
text inference
This commit is contained in:
parent
16cfe1014e
commit
2fe4acd64d
1 changed file with 24 additions and 5 deletions
|
@@ -7,13 +7,32 @@
|
||||||
|
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
|
from llama_models.llama3.api.datatypes import (
|
||||||
|
SamplingParams,
|
||||||
|
StopReason,
|
||||||
|
ToolCall,
|
||||||
|
ToolDefinition,
|
||||||
|
ToolParamDefinition,
|
||||||
|
ToolPromptFormat,
|
||||||
|
)
|
||||||
|
|
||||||
from pydantic import BaseModel, ValidationError
|
from pydantic import BaseModel, ValidationError
|
||||||
|
|
||||||
from llama_models.llama3.api.datatypes import * # noqa: F403
|
from llama_stack.apis.inference import (
|
||||||
from llama_stack.apis.inference import * # noqa: F403
|
ChatCompletionResponse,
|
||||||
|
ChatCompletionResponseEventType,
|
||||||
from llama_stack.distribution.datatypes import * # noqa: F403
|
ChatCompletionResponseStreamChunk,
|
||||||
|
CompletionResponse,
|
||||||
|
CompletionResponseStreamChunk,
|
||||||
|
JsonSchemaResponseFormat,
|
||||||
|
LogProbConfig,
|
||||||
|
SystemMessage,
|
||||||
|
ToolCallDelta,
|
||||||
|
ToolCallParseStatus,
|
||||||
|
ToolChoice,
|
||||||
|
UserMessage,
|
||||||
|
)
|
||||||
|
from llama_stack.apis.models import Model
|
||||||
from .utils import group_chunks
|
from .utils import group_chunks
|
||||||
|
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue