Revert "Added support for Triton chat completion using trtlllm generate endpo…"

This commit is contained in:
Ishaan Jaff 2024-05-29 13:42:49 -07:00 committed by GitHub
parent e8c1e87ac9
commit 99e506525c
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
2 changed files with 4 additions and 165 deletions

View file

@@ -2254,26 +2254,6 @@ def completion(
return generator
response = generator
elif custom_llm_provider == "triton":
api_base = (
litellm.api_base or api_base
)
model_response = triton_chat_completions.completion(
api_base=api_base,
timeout=timeout,
model=model,
messages=messages,
model_response=model_response,
optional_params=optional_params,
logging_obj=logging,
)
## RESPONSE OBJECT
response = model_response
return response
elif custom_llm_provider == "cloudflare":
api_key = (
api_key