llama-stack-mirror/llama_toolchain/inference
2024-07-22 23:14:31 -07:00
..
api Initial commit - yes! 2024-07-22 23:14:31 -07:00
quantization Initial commit - yes! 2024-07-22 23:14:31 -07:00
__init__.py Initial commit - yes! 2024-07-22 23:14:31 -07:00
api_instance.py Initial commit - yes! 2024-07-22 23:14:31 -07:00
client.py Initial commit - yes! 2024-07-22 23:14:31 -07:00
event_logger.py Initial commit - yes! 2024-07-22 23:14:31 -07:00
generation.py Initial commit - yes! 2024-07-22 23:14:31 -07:00
inference.py Initial commit - yes! 2024-07-22 23:14:31 -07:00
model_parallel.py Initial commit - yes! 2024-07-22 23:14:31 -07:00
parallel_utils.py Initial commit - yes! 2024-07-22 23:14:31 -07:00
server.py Initial commit - yes! 2024-07-22 23:14:31 -07:00