Fix custom pricing - separate provider info from model info #7990

Merged · 8 commits · Jan 26, 2025
7 changes: 4 additions & 3 deletions litellm/cost_calculator.py
@@ -560,6 +560,10 @@
         base_model=base_model,
     )
 
+    verbose_logger.debug(
+        f"completion_response _select_model_name_for_cost_calc: {model}"
+    )
+
     if completion_response is not None and (
         isinstance(completion_response, BaseModel)
         or isinstance(completion_response, dict)
Check failure — Code scanning / CodeQL

Clear-text logging of sensitive information (High): this expression logs sensitive data (secret) as clear text.

Copilot Autofix AI 20 days ago

To fix the problem, avoid logging the sensitive value directly: either drop the log statement or log a sanitized version of the model variable. The least invasive fix, which preserves existing behavior, is to sanitize model before logging it, using a small helper that masks any sensitive portion of the string.

Suggested changeset 1: litellm/cost_calculator.py

Autofix patch — run the following command in your local git repository to apply it:
cat << 'EOF' | git apply
diff --git a/litellm/cost_calculator.py b/litellm/cost_calculator.py
--- a/litellm/cost_calculator.py
+++ b/litellm/cost_calculator.py
@@ -72,2 +72,8 @@
 
+def sanitize_model(model: Optional[str]) -> Optional[str]:
+    if model is None:
+        return None
+    # Add logic to sanitize the model string, e.g., mask sensitive parts
+    # For simplicity, let's mask any part that looks like an API key
+    return model.replace("os.environ/", "****")
 
@@ -562,4 +568,5 @@
 
+        sanitized_model = sanitize_model(model)
         verbose_logger.debug(
-            f"completion_response _select_model_name_for_cost_calc: {model}"
+            f"completion_response _select_model_name_for_cost_calc: {sanitized_model}"
         )
EOF
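
For reference, the suggested helper only masks the os.environ/ prefix; everything else in the model string passes through unchanged. A standalone sanity check of that behavior (hypothetical snippet mirroring the patch, not part of the PR):

def sanitize_model(model):
    # Mirror of the suggested helper: mask the secret-reference prefix.
    if model is None:
        return None
    return model.replace("os.environ/", "****")

print(sanitize_model("os.environ/AZURE_API_KEY"))  # ****AZURE_API_KEY
print(sanitize_model("gpt-4o"))                    # gpt-4o (unchanged)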
@@ -598,9 +602,6 @@
             cache_read_input_tokens = prompt_tokens_details.get("cached_tokens", 0)
 
         total_time = getattr(completion_response, "_response_ms", 0)
-        verbose_logger.debug(
-            f"completion_response response ms: {getattr(completion_response, '_response_ms', None)} "
-        )
 
         hidden_params = getattr(completion_response, "_hidden_params", None)
         if hidden_params is not None:
1 change: 1 addition & 0 deletions litellm/litellm_core_utils/litellm_logging.py
@@ -847,6 +847,7 @@ def _response_cost_calculator(
             response_cost = litellm.response_cost_calculator(
                 **response_cost_calculator_kwargs
             )
+            verbose_logger.debug(f"response_cost: {response_cost}")
             return response_cost
         except Exception as e:  # error calculating cost
             debug_info = StandardLoggingModelCostFailureDebugInformation(
10 changes: 4 additions & 6 deletions litellm/llms/base_llm/base_utils.py
@@ -4,17 +4,15 @@
 from openai.lib import _parsing, _pydantic
 from pydantic import BaseModel
 
-from litellm.types.utils import ModelInfoBase
+from litellm.types.utils import ProviderSpecificModelInfo
 
 
 class BaseLLMModelInfo(ABC):
-    @abstractmethod
-    def get_model_info(
+    def get_provider_info(
         self,
         model: str,
-        existing_model_info: Optional[ModelInfoBase] = None,
-    ) -> Optional[ModelInfoBase]:
-        pass
+    ) -> Optional[ProviderSpecificModelInfo]:
+        return None
 
     @abstractmethod
     def get_models(self) -> List[str]:
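
Note that get_provider_info is no longer abstract: the base class now ships a None default, so providers with no capability flags to report can simply drop their override (as Topaz does below), while providers like Fireworks override it to return flags only. A self-contained sketch of the new contract, using stand-in classes rather than the real litellm imports:

from abc import ABC, abstractmethod
from typing import Dict, List, Optional

ProviderFlags = Dict[str, bool]  # stand-in for ProviderSpecificModelInfo

class ModelInfoSketch(ABC):
    def get_provider_info(self, model: str) -> Optional[ProviderFlags]:
        # Default: no provider-specific capability flags.
        return None

    @abstractmethod
    def get_models(self) -> List[str]: ...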
22 changes: 3 additions & 19 deletions litellm/llms/fireworks_ai/chat/transformation.py
@@ -3,7 +3,7 @@
 import litellm
 from litellm.secret_managers.main import get_secret_str
 from litellm.types.llms.openai import AllMessageValues, ChatCompletionImageObject
-from litellm.types.utils import ModelInfoBase, ProviderSpecificModelInfo
+from litellm.types.utils import ProviderSpecificModelInfo
 
 from ...openai.chat.gpt_transformation import OpenAIGPTConfig
 
@@ -159,30 +159,14 @@ def _transform_messages_helper(
         )
         return messages
 
-    def get_model_info(
-        self, model: str, existing_model_info: Optional[ModelInfoBase] = None
-    ) -> ModelInfoBase:
+    def get_provider_info(self, model: str) -> ProviderSpecificModelInfo:
         provider_specific_model_info = ProviderSpecificModelInfo(
             supports_function_calling=True,
             supports_prompt_caching=True,  # https://docs.fireworks.ai/guides/prompt-caching
             supports_pdf_input=True,  # via document inlining
             supports_vision=True,  # via document inlining
         )
-        if existing_model_info is not None:
-            return ModelInfoBase(
-                **{**existing_model_info, **provider_specific_model_info}
-            )
-        return ModelInfoBase(
-            key=model,
-            litellm_provider="fireworks_ai",
-            mode="chat",
-            input_cost_per_token=0.0,
-            output_cost_per_token=0.0,
-            max_tokens=None,
-            max_input_tokens=None,
-            max_output_tokens=None,
-            **provider_specific_model_info,
-        )
+        return provider_specific_model_info
 
     def transform_request(
         self,
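
The payoff is visible here: the old get_model_info fabricated a full ModelInfoBase with input_cost_per_token=0.0 and output_cost_per_token=0.0 whenever no existing info was passed in, which could silently zero out user-configured custom pricing. After this change the provider contributes capability flags only, and pricing stays wherever the user (or the cost map) defined it. A rough sketch of how the two layers might be combined at lookup time — hypothetical names, not litellm's actual merge code:

from typing import Any, Dict, Optional

def build_model_info(
    pricing: Dict[str, Any],                   # from the cost map or custom pricing
    provider_flags: Optional[Dict[str, Any]],  # from get_provider_info()
) -> Dict[str, Any]:
    # Start from the capability flags, then overlay pricing last so that
    # user-supplied costs are never clobbered by provider defaults.
    merged: Dict[str, Any] = dict(provider_flags or {})
    merged.update(pricing)
    return merged

info = build_model_info(
    {"input_cost_per_token": 2e-06, "output_cost_per_token": 8e-06},
    {"supports_function_calling": True, "supports_vision": True},
)
print(info["input_cost_per_token"])  # 2e-06 -- custom pricing survives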
19 changes: 1 addition & 18 deletions litellm/llms/openai/chat/gpt_transformation.py
@@ -11,7 +11,7 @@
 from litellm.llms.base_llm.chat.transformation import BaseConfig, BaseLLMException
 from litellm.secret_managers.main import get_secret_str
 from litellm.types.llms.openai import AllMessageValues
-from litellm.types.utils import ModelInfoBase, ModelResponse
+from litellm.types.utils import ModelResponse
 
 from ..common_utils import OpenAIError
 
@@ -255,23 +255,6 @@ def get_models(
         models = response.json()["data"]
         return [model["id"] for model in models]
 
-    def get_model_info(
-        self, model: str, existing_model_info: Optional[ModelInfoBase] = None
-    ) -> ModelInfoBase:
-
-        if existing_model_info is not None:
-            return existing_model_info
-        return ModelInfoBase(
-            key=model,
-            litellm_provider="openai",
-            mode="chat",
-            input_cost_per_token=0.0,
-            output_cost_per_token=0.0,
-            max_tokens=None,
-            max_input_tokens=None,
-            max_output_tokens=None,
-        )
-
     @staticmethod
     def get_api_key(api_key: Optional[str] = None) -> Optional[str]:
         return (
6 changes: 0 additions & 6 deletions litellm/llms/topaz/common_utils.py
@@ -1,7 +1,6 @@
 from typing import List, Optional
 
 from litellm.secret_managers.main import get_secret_str
-from litellm.types.utils import ModelInfoBase
 
 from ..base_llm.base_utils import BaseLLMModelInfo
 from ..base_llm.chat.transformation import BaseLLMException
@@ -12,11 +11,6 @@ class TopazException(BaseLLMException):
 
 
 class TopazModelInfo(BaseLLMModelInfo):
-    def get_model_info(
-        self, model: str, existing_model_info: Optional[ModelInfoBase] = None
-    ) -> Optional[ModelInfoBase]:
-        return existing_model_info
-
     def get_models(self) -> List[str]:
         return [
             "topaz/Standard V2",
1 change: 0 additions & 1 deletion litellm/proxy/_experimental/out/404.html

This file was deleted.

1 change: 0 additions & 1 deletion litellm/proxy/_experimental/out/model_hub.html

This file was deleted.
