update custom prompt template function

This commit is contained in:
Krrish Dholakia 2023-09-06 13:14:33 -07:00
parent 8440791e04
commit 0ace48d719
4 changed files with 29 additions and 43 deletions

View file

@ -3,27 +3,22 @@ def default_pt(messages):
# Llama2 prompt template # Llama2 prompt template
def llama_2_chat_pt(messages): def llama_2_chat_pt(messages):
prompt = "<s>" prompt = custom_prompt(
for message in messages: role_dict={
if message["role"] == "system": "system": {
prompt += "[INST] <<SYS>>" + message["content"] "pre_message": "[INST] <<SYS>>\n",
elif message["role"] == "assistant": "post_message": "\n<</SYS>>\n [/INST]\n"
prompt += message["content"] + "</s><s>[INST]" },
elif message["role"] == "user": "user": { # follow this format https://github.com/facebookresearch/llama/blob/77062717054710e352a99add63d160274ce670c6/llama/generation.py#L348
prompt += message["content"] + "[/INST]" "pre_message": "[INST] ",
return prompt "post_message": " [/INST]\n"
},
# TogetherAI Llama2 prompt template "assistant": {
def togetherai_llama_2_chat_pt(messages): "post_message": "\n" # follows this - https://replicate.com/blog/how-to-prompt-llama
prompt = "[INST]\n" }
for message in messages: },
if message["role"] == "system": messages=messages
prompt += message["content"] )
elif message["role"] == "assistant":
prompt += message["content"]
elif message["role"] == "user":
prompt += message["content"]
prompt += "\n[\INST]\n\n"
return prompt return prompt
# Falcon prompt template - from https://github.com/lm-sys/FastChat/blob/main/fastchat/conversation.py#L110 # Falcon prompt template - from https://github.com/lm-sys/FastChat/blob/main/fastchat/conversation.py#L110
@ -84,15 +79,15 @@ def phind_codellama_pt(messages):
return prompt return prompt
# Custom prompt template # Custom prompt template
def custom_prompt(role_dict: dict, pre_message_sep: str, post_message_sep: str, messages: list): def custom_prompt(role_dict: dict, messages: list, initial_prompt_value: str="", final_prompt_value: str=""):
prompt = "" prompt = initial_prompt_value
for message in messages: for message in messages:
if message["role"] == "system": role = message["role"]
prompt += f"{role_dict['system']}{pre_message_sep}" + message["content"] + post_message_sep pre_message_str = role_dict[role]["pre_message"] if role in role_dict and "pre_message" in role_dict[role] else ""
elif message["role"] == "user": post_message_str = role_dict[role]["post_message"] if role in role_dict and "post_message" in role_dict[role] else ""
prompt += f"{role_dict['user']}{pre_message_sep}" + message["content"] + post_message_sep prompt += pre_message_str + message["content"] + post_message_str
elif message["role"] == "assistant":
prompt += f"{role_dict['assistant']}{pre_message_sep}" + message["content"] + post_message_sep prompt += final_prompt_value
return prompt return prompt
def prompt_factory(model: str, messages: list): def prompt_factory(model: str, messages: list):
@ -100,30 +95,21 @@ def prompt_factory(model: str, messages: list):
if "meta-llama/Llama-2" in model: if "meta-llama/Llama-2" in model:
if "chat" in model: if "chat" in model:
return llama_2_chat_pt(messages=messages) return llama_2_chat_pt(messages=messages)
else:
return default_pt(messages=messages)
elif "tiiuae/falcon" in model: # Note: for the instruct models, it's best to use a User: .., Assistant:.. approach in your prompt template. elif "tiiuae/falcon" in model: # Note: for the instruct models, it's best to use a User: .., Assistant:.. approach in your prompt template.
if model == "tiiuae/falcon-180B-chat": if model == "tiiuae/falcon-180B-chat":
return falcon_chat_pt(messages=messages) return falcon_chat_pt(messages=messages)
elif "instruct" in model: elif "instruct" in model:
return falcon_instruct_pt(messages=messages) return falcon_instruct_pt(messages=messages)
else:
return default_pt(messages=messages)
elif "mosaicml/mpt" in model: elif "mosaicml/mpt" in model:
if "chat" in model: if "chat" in model:
return mpt_chat_pt(messages=messages) return mpt_chat_pt(messages=messages)
else:
return default_pt(messages=messages)
elif "codellama/codellama" in model: elif "codellama/codellama" in model:
if "instruct" in model: if "instruct" in model:
return llama_2_chat_pt(messages=messages) # https://huggingface.co/blog/codellama#conversational-instructions return llama_2_chat_pt(messages=messages) # https://huggingface.co/blog/codellama#conversational-instructions
else:
return default_pt(messages=messages)
elif "wizardlm/wizardcoder" in model: elif "wizardlm/wizardcoder" in model:
return wizardcoder_pt(messages=messages) return wizardcoder_pt(messages=messages)
elif "phind/phind-codellama" in model: elif "phind/phind-codellama" in model:
return phind_codellama_pt(messages=messages) return phind_codellama_pt(messages=messages)
elif "togethercomputer/llama-2" in model and "instruct" in model: elif "togethercomputer/llama-2" in model and ("instruct" in model or "chat" in model):
return togetherai_llama_2_chat_pt(messages=messages) return llama_2_chat_pt(messages=messages)
else: return default_pt(messages=messages) # default that covers Bloom, T-5, any non-chat tuned model (e.g. base Llama2)
return default_pt(messages=messages)

View file

@ -435,7 +435,7 @@ def test_completion_together_ai():
except Exception as e: except Exception as e:
pytest.fail(f"Error occurred: {e}") pytest.fail(f"Error occurred: {e}")
test_completion_together_ai()
# def test_customprompt_together_ai(): # def test_customprompt_together_ai():
# try: # try:
# litellm.register_prompt_template( # litellm.register_prompt_template(

View file

@ -1,6 +1,6 @@
[tool.poetry] [tool.poetry]
name = "litellm" name = "litellm"
version = "0.1.544" version = "0.1.545"
description = "Library to easily interface with LLM API providers" description = "Library to easily interface with LLM API providers"
authors = ["BerriAI"] authors = ["BerriAI"]
license = "MIT License" license = "MIT License"