test - making mistral embedding request on proxy

This commit is contained in:
Ishaan Jaff 2024-06-12 15:10:20 -07:00
parent 7eeef7ec1f
commit cb386fda20
4 changed files with 12 additions and 5 deletions

View file

@@ -202,6 +202,7 @@ jobs:
-e REDIS_PORT=$REDIS_PORT \ -e REDIS_PORT=$REDIS_PORT \
-e AZURE_FRANCE_API_KEY=$AZURE_FRANCE_API_KEY \ -e AZURE_FRANCE_API_KEY=$AZURE_FRANCE_API_KEY \
-e AZURE_EUROPE_API_KEY=$AZURE_EUROPE_API_KEY \ -e AZURE_EUROPE_API_KEY=$AZURE_EUROPE_API_KEY \
-e MISTRAL_API_KEY=$MISTRAL_API_KEY \
-e AWS_ACCESS_KEY_ID=$AWS_ACCESS_KEY_ID \ -e AWS_ACCESS_KEY_ID=$AWS_ACCESS_KEY_ID \
-e AWS_SECRET_ACCESS_KEY=$AWS_SECRET_ACCESS_KEY \ -e AWS_SECRET_ACCESS_KEY=$AWS_SECRET_ACCESS_KEY \
-e AWS_REGION_NAME=$AWS_REGION_NAME \ -e AWS_REGION_NAME=$AWS_REGION_NAME \

View file

@@ -14,10 +14,9 @@ model_list:
litellm_params: litellm_params:
model: openai/* model: openai/*
api_key: os.environ/OPENAI_API_KEY api_key: os.environ/OPENAI_API_KEY
- model_name: my-triton-model - model_name: mistral-embed
litellm_params: litellm_params:
model: triton/any" model: mistral/mistral-embed
api_base: https://exampleopenaiendpoint-production.up.railway.app/triton/embeddings
general_settings: general_settings:
master_key: sk-1234 master_key: sk-1234

View file

@@ -85,6 +85,9 @@ model_list:
litellm_params: litellm_params:
model: openai/* model: openai/*
api_key: os.environ/OPENAI_API_KEY api_key: os.environ/OPENAI_API_KEY
- model_name: mistral-embed
litellm_params:
model: mistral/mistral-embed
- model_name: gpt-instruct # [PROD TEST] - tests if `/health` automatically infers this to be a text completion model - model_name: gpt-instruct # [PROD TEST] - tests if `/health` automatically infers this to be a text completion model
litellm_params: litellm_params:
model: text-completion-openai/gpt-3.5-turbo-instruct model: text-completion-openai/gpt-3.5-turbo-instruct

View file

@@ -22,6 +22,7 @@ async def generate_key(
"text-embedding-ada-002", "text-embedding-ada-002",
"dall-e-2", "dall-e-2",
"fake-openai-endpoint-2", "fake-openai-endpoint-2",
"mistral-embed",
], ],
): ):
url = "http://0.0.0.0:4000/key/generate" url = "http://0.0.0.0:4000/key/generate"
@@ -197,14 +198,14 @@ async def completion(session, key):
return response return response
async def embeddings(session, key): async def embeddings(session, key, model="text-embedding-ada-002"):
url = "http://0.0.0.0:4000/embeddings" url = "http://0.0.0.0:4000/embeddings"
headers = { headers = {
"Authorization": f"Bearer {key}", "Authorization": f"Bearer {key}",
"Content-Type": "application/json", "Content-Type": "application/json",
} }
data = { data = {
"model": "text-embedding-ada-002", "model": model,
"input": ["hello world"], "input": ["hello world"],
} }
@@ -408,6 +409,9 @@ async def test_embeddings():
key_2 = key_gen["key"] key_2 = key_gen["key"]
await embeddings(session=session, key=key_2) await embeddings(session=session, key=key_2)
# embedding request with non OpenAI model
await embeddings(session=session, key=key, model="mistral-embed")
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_image_generation(): async def test_image_generation():