mirror of
https://github.com/BerriAI/litellm.git
synced 2025-04-24 18:24:20 +00:00
remove cuda from petals
This commit is contained in:
parent
102fd83ea6
commit
b81f8d2ddd
2 changed files with 2 additions and 3 deletions
|
@@ -39,7 +39,6 @@ def completion(
|
|||
|
||||
tokenizer = AutoTokenizer.from_pretrained(model, use_fast=False, add_bos_token=False)
|
||||
model_obj = AutoDistributedModelForCausalLM.from_pretrained(model)
|
||||
-model_obj = model_obj.cuda()
|
||||
|
||||
prompt = ""
|
||||
for message in messages:
|
||||
|
@@ -64,7 +63,7 @@ def completion(
|
|||
)
|
||||
|
||||
## COMPLETION CALL
|
||||
-inputs = tokenizer(prompt, return_tensors="pt")["input_ids"].cuda()
|
||||
+inputs = tokenizer(prompt, return_tensors="pt")["input_ids"]
|
||||
|
||||
# optional params: max_new_tokens=1,temperature=0.9, top_p=0.6
|
||||
outputs = model_obj.generate(inputs, **optional_params)
|
||||
|
|
|
@@ -1,6 +1,6 @@
|
|||
[tool.poetry]
|
||||
name = "litellm"
|
||||
-version = "0.1.714"
|
||||
+version = "0.1.715"
|
||||
description = "Library to easily interface with LLM API providers"
|
||||
authors = ["BerriAI"]
|
||||
license = "MIT License"
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue