precommit

This commit is contained in:
Xi Yan 2024-11-08 17:58:58 -08:00
parent 1ebf6447c5
commit ba82021d4b
11 changed files with 19 additions and 14 deletions

View file

@@ -21,13 +21,13 @@ from llama_models.llama3.api.args import ModelArgs
from llama_models.llama3.reference_impl.model import Transformer, TransformerBlock
from llama_models.sku_list import resolve_model
from llama_stack.apis.inference import QuantizationType
from termcolor import cprint
from torch import nn, Tensor
from torchao.quantization.GPTQ import Int8DynActInt4WeightLinear
from llama_stack.apis.inference import QuantizationType
from ..config import MetaReferenceQuantizedInferenceConfig