forked from phoenix-oss/llama-stack-mirror
refactor: move generation.py to llama3
This commit is contained in:
parent
02066591b8
commit
816fdf289a
2 changed files with 3 additions and 3 deletions
|
@ -18,8 +18,9 @@ from llama_stack.providers.utils.inference.prompt_adapter import (
|
|||
CompletionRequestWithRawContent,
|
||||
)
|
||||
|
||||
from .common import model_checkpoint_dir
|
||||
from .config import MetaReferenceInferenceConfig
|
||||
from .generation import Llama, model_checkpoint_dir
|
||||
from .llama3.generation import Llama3
|
||||
from .parallel_utils import ModelParallelProcessGroup
|
||||
|
||||
|
||||
|
@ -42,7 +43,7 @@ def init_model_cb(
|
|||
model_id: str,
|
||||
llama_model: Model,
|
||||
):
|
||||
llama = Llama.build(config, model_id, llama_model)
|
||||
llama = Llama3.build(config, model_id, llama_model)
|
||||
return ModelRunner(llama)
|
||||
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue