| """ | |
| Translate from OpenAI's `/v1/chat/completions` to VLLM's `/v1/chat/completions` | |
| """ | |

from typing import List, Optional, Tuple

from litellm.secret_managers.main import get_secret_bool, get_secret_str
from litellm.types.router import LiteLLM_Params

from ...openai.chat.gpt_transformation import OpenAIGPTConfig


class LiteLLMProxyChatConfig(OpenAIGPTConfig):
    def get_supported_openai_params(self, model: str) -> List:
        # Everything the base OpenAI config supports, plus params the proxy
        # forwards upstream.
        params_list = super().get_supported_openai_params(model)
        params_list.append("thinking")
        params_list.append("reasoning_effort")
        return params_list
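
    # Illustrative (the model name is a placeholder): the returned list is the
    # base OpenAI param set plus the two params appended above.
    #
    #   LiteLLMProxyChatConfig().get_supported_openai_params("gpt-4")
    #   # -> [..., "thinking", "reasoning_effort"]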

    def _map_openai_params(
        self,
        non_default_params: dict,
        optional_params: dict,
        model: str,
        drop_params: bool,
    ) -> dict:
        supported_openai_params = self.get_supported_openai_params(model)
        for param, value in non_default_params.items():
            if param == "thinking":
                # "thinking" is not a first-class OpenAI param, so tuck it into
                # `extra_body` for the proxy to forward upstream.
                optional_params.setdefault("extra_body", {})["thinking"] = value
            elif param in supported_openai_params:
                optional_params[param] = value
        return optional_params
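
    # Usage sketch (values are illustrative, the model name is a placeholder):
    #
    #   cfg = LiteLLMProxyChatConfig()
    #   cfg._map_openai_params(
    #       non_default_params={"thinking": {"type": "enabled", "budget_tokens": 1024}},
    #       optional_params={},
    #       model="litellm_proxy/claude-3-7-sonnet",
    #       drop_params=False,
    #   )
    #   # -> {"extra_body": {"thinking": {"type": "enabled", "budget_tokens": 1024}}}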

    def _get_openai_compatible_provider_info(
        self, api_base: Optional[str], api_key: Optional[str]
    ) -> Tuple[Optional[str], Optional[str]]:
        # Explicit arguments win; otherwise fall back to the env vars.
        api_base = api_base or get_secret_str("LITELLM_PROXY_API_BASE")  # type: ignore
        dynamic_api_key = api_key or get_secret_str("LITELLM_PROXY_API_KEY")
        return api_base, dynamic_api_key
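
    # e.g. with LITELLM_PROXY_API_BASE=http://localhost:4000 exported and no
    # explicit arguments, this resolves to ("http://localhost:4000", <env key or None>).
    # (The URL is a placeholder; 4000 is only the proxy's common default port.)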

    def get_models(
        self, api_key: Optional[str] = None, api_base: Optional[str] = None
    ) -> List[str]:
        api_base, api_key = self._get_openai_compatible_provider_info(api_base, api_key)
        if api_base is None:
            raise ValueError(
                "api_base not set for LiteLLM Proxy route. Set in env via `LITELLM_PROXY_API_BASE`"
            )
        models = super().get_models(api_key=api_key, api_base=api_base)
        # Namespace each model id so callers route back through this provider.
        return [f"litellm_proxy/{model}" for model in models]

    @staticmethod
    def get_api_key(api_key: Optional[str] = None) -> Optional[str]:
        return api_key or get_secret_str("LITELLM_PROXY_API_KEY")


def _should_use_litellm_proxy_by_default(
    litellm_params: Optional[LiteLLM_Params] = None,
) -> bool:
    """
    Returns True if the LiteLLM proxy should be used by default for a given request.

    Issue: https://github.com/BerriAI/litellm/issues/10559

    Use case:
    - When using Google ADK, users want a flag to dynamically choose whether the
      request is sent to the LiteLLM proxy.
    - Allow the model name to be passed in its original format and still use the
      proxy: "gemini/gemini-1.5-pro", "openai/gpt-4", "mistral/llama-2-70b-chat", etc.

    See the illustrative precedence check after this function.
    """
    import litellm

    if get_secret_bool("USE_LITELLM_PROXY") is True:
        return True
    if litellm_params and litellm_params.use_litellm_proxy is True:
        return True
    if litellm.use_litellm_proxy is True:
        return True
    return False
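
# Illustrative precedence check: any one of the three flags checked above is
# enough to route through the proxy (env var, per-request params, global flag).
#
#   import os
#   os.environ["USE_LITELLM_PROXY"] = "True"
#   _should_use_litellm_proxy_by_default()  # -> True
#
#   litellm.use_litellm_proxy = True
#   _should_use_litellm_proxy_by_default()  # -> True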


def litellm_proxy_get_custom_llm_provider_info(
    model: str, api_base: Optional[str] = None, api_key: Optional[str] = None
) -> Tuple[str, str, Optional[str], Optional[str]]:
    """
    Force use of the LiteLLM proxy for all models.

    Issue: https://github.com/BerriAI/litellm/issues/10559

    Expected behavior:
    - custom_llm_provider will be 'litellm_proxy'
    - api_base = api_base OR LITELLM_PROXY_API_BASE
    - api_key = api_key OR LITELLM_PROXY_API_KEY

    Use case:
    - When using Google ADK, users want a flag to dynamically choose whether the
      request is sent to the LiteLLM proxy.
    - Allow the model name to be passed in its original format and still use the
      proxy: "gemini/gemini-1.5-pro", "openai/gpt-4", "mistral/llama-2-70b-chat", etc.

    Returns (model, custom_llm_provider, dynamic_api_key, api_base).
    """
    import litellm

    custom_llm_provider = "litellm_proxy"
    # Strip the provider prefix if the caller already namespaced the model.
    if model.startswith("litellm_proxy/"):
        model = model.split("/", 1)[1]
    (
        api_base,
        api_key,
    ) = litellm.LiteLLMProxyChatConfig()._get_openai_compatible_provider_info(
        api_base=api_base, api_key=api_key
    )
    return model, custom_llm_provider, api_key, api_base
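

if __name__ == "__main__":
    # Minimal smoke sketch (assumes LITELLM_PROXY_API_BASE is exported and, if the
    # proxy requires auth, LITELLM_PROXY_API_KEY too; the model name is a placeholder).
    model, provider, key, base = litellm_proxy_get_custom_llm_provider_info(
        model="litellm_proxy/gemini/gemini-1.5-pro"
    )
    print(model, provider, base)  # -> gemini/gemini-1.5-pro litellm_proxy <api_base>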