diff --git a/litellm/main.py b/litellm/main.py
index 9ee8beaef..b788c717c 100644
--- a/litellm/main.py
+++ b/litellm/main.py
@@ -45,10 +45,12 @@ def completion(
     temperature=1, top_p=1, n=1, stream=False, stop=None, max_tokens=float('inf'),
     presence_penalty=0, frequency_penalty=0, logit_bias={}, user="", deployment_id=None,
     # Optional liteLLM function params
-    *, return_async=False, api_key=None, force_timeout=600, logger_fn=None, verbose=False, custom_llm_provider=None, custom_api_base=None
+    *, return_async=False, api_key=None, force_timeout=600, logger_fn=None, verbose=False, azure=False, custom_llm_provider=None, custom_api_base=None
   ):
   try:
     global new_response
+    if azure: # this flag is deprecated, remove once notebooks are also updated.
+      custom_llm_provider="azure"
     args = locals()
     model_response = deepcopy(new_response) # deep copy the default response format so we can mutate it and it's thread-safe. 
     # check if user passed in any of the OpenAI optional params