forked from phoenix/litellm-mirror
LiteLLM Minor Fixes & Improvements (10/24/2024) (#6421)
* fix(utils.py): support passing dynamic api base to validate_environment
  Returns True if just api base is required and api base is passed
* fix(litellm_pre_call_utils.py): feature flag sending client headers to llm api
  Fixes https://github.com/BerriAI/litellm/issues/6410
* fix(anthropic/chat/transformation.py): return correct error message
* fix(http_handler.py): add error response text in places where we expect it
* fix(factory.py): handle base case of no non-system messages to bedrock
  Fixes https://github.com/BerriAI/litellm/issues/6411
* feat(cohere/embed): Support cohere image embeddings
  Closes https://github.com/BerriAI/litellm/issues/6413
* fix(__init__.py): fix linting error
* docs(supported_embedding.md): add image embedding example to docs
* feat(cohere/embed): use cohere embedding returned usage for cost calc
* build(model_prices_and_context_window.json): add embed-english-v3.0 details (image cost + 'supports_image_input' flag)
* fix(cohere_transformation.py): fix linting error
* test(test_proxy_server.py): cleanup test
* test: cleanup test
* fix: fix linting errors
This commit is contained in:
parent
38708a355a
commit
c03e5da41f
23 changed files with 417 additions and 150 deletions
|
@ -3364,54 +3364,56 @@
|
|||
"litellm_provider": "cohere",
|
||||
"mode": "rerank"
|
||||
},
|
||||
"embed-english-v3.0": {
|
||||
"max_tokens": 512,
|
||||
"max_input_tokens": 512,
|
||||
"input_cost_per_token": 0.00000010,
|
||||
"output_cost_per_token": 0.00000,
|
||||
"litellm_provider": "cohere",
|
||||
"mode": "embedding"
|
||||
},
|
||||
"embed-english-light-v3.0": {
|
||||
"max_tokens": 512,
|
||||
"max_input_tokens": 512,
|
||||
"max_tokens": 1024,
|
||||
"max_input_tokens": 1024,
|
||||
"input_cost_per_token": 0.00000010,
|
||||
"output_cost_per_token": 0.00000,
|
||||
"litellm_provider": "cohere",
|
||||
"mode": "embedding"
|
||||
},
|
||||
"embed-multilingual-v3.0": {
|
||||
"max_tokens": 512,
|
||||
"max_input_tokens": 512,
|
||||
"max_tokens": 1024,
|
||||
"max_input_tokens": 1024,
|
||||
"input_cost_per_token": 0.00000010,
|
||||
"output_cost_per_token": 0.00000,
|
||||
"litellm_provider": "cohere",
|
||||
"mode": "embedding"
|
||||
},
|
||||
"embed-english-v2.0": {
|
||||
"max_tokens": 512,
|
||||
"max_input_tokens": 512,
|
||||
"max_tokens": 4096,
|
||||
"max_input_tokens": 4096,
|
||||
"input_cost_per_token": 0.00000010,
|
||||
"output_cost_per_token": 0.00000,
|
||||
"litellm_provider": "cohere",
|
||||
"mode": "embedding"
|
||||
},
|
||||
"embed-english-light-v2.0": {
|
||||
"max_tokens": 512,
|
||||
"max_input_tokens": 512,
|
||||
"max_tokens": 1024,
|
||||
"max_input_tokens": 1024,
|
||||
"input_cost_per_token": 0.00000010,
|
||||
"output_cost_per_token": 0.00000,
|
||||
"litellm_provider": "cohere",
|
||||
"mode": "embedding"
|
||||
},
|
||||
"embed-multilingual-v2.0": {
|
||||
"max_tokens": 256,
|
||||
"max_input_tokens": 256,
|
||||
"max_tokens": 768,
|
||||
"max_input_tokens": 768,
|
||||
"input_cost_per_token": 0.00000010,
|
||||
"output_cost_per_token": 0.00000,
|
||||
"litellm_provider": "cohere",
|
||||
"mode": "embedding"
|
||||
},
|
||||
"embed-english-v3.0": {
|
||||
"max_tokens": 1024,
|
||||
"max_input_tokens": 1024,
|
||||
"input_cost_per_token": 0.00000010,
|
||||
"input_cost_per_image": 0.0001,
|
||||
"output_cost_per_token": 0.00000,
|
||||
"litellm_provider": "cohere",
|
||||
"mode": "embedding",
|
||||
"supports_image_input": true
|
||||
},
|
||||
"replicate/meta/llama-2-13b": {
|
||||
"max_tokens": 4096,
|
||||
"max_input_tokens": 4096,
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue