fix: Issue where CodeAct agent was trying to log cost on local LLM and throwing Undefined Model exception out of litellm #1666

Merged
Changes from 3 commits
19 changes: 13 additions & 6 deletions agenthub/codeact_agent/codeact_agent.py
@@ -18,7 +18,7 @@
     IPythonRunCellObservation,
     NullObservation,
 )
-from opendevin.llm.llm import LLM, completion_cost
+from opendevin.llm.llm import LLM
 from opendevin.runtime.plugins import (
     JupyterRequirement,
     PluginRequirement,
@@ -228,11 +228,9 @@ def step(self, state: State) -> Action:
             ],
             temperature=0.0,
         )
-        cur_cost = completion_cost(completion_response=response)
-        self.cost_accumulator += cur_cost
-        logger.info(
-            f'Cost: {cur_cost:.2f} USD | Accumulated Cost: {self.cost_accumulator:.2f} USD'
-        )
+
+        self.logCost(response)
+
         action_str: str = parse_response(response)
         state.num_of_chars += sum(
             len(message['content']) for message in self.messages
@@ -265,3 +263,12 @@ def step(self, state: State) -> Action:

     def search_memory(self, query: str) -> List[str]:
         raise NotImplementedError('Implement this abstract method')
+
+    def logCost(self, response):
+        cur_cost = self.llm.completion_cost(response)
+        self.cost_accumulator += cur_cost
+        logger.info(
+            'Cost: %.2f USD | Accumulated Cost: %.2f USD',
+            cur_cost,
+            self.cost_accumulator,
+        )
bartshappee marked this conversation as resolved.
26 changes: 24 additions & 2 deletions opendevin/llm/llm.py
@@ -2,7 +2,7 @@

 import litellm
 from litellm import completion as litellm_completion
-from litellm import completion_cost
+from litellm import completion_cost as litellm_completion_cost
 from litellm.exceptions import (
     APIConnectionError,
     RateLimitError,
@@ -20,7 +20,7 @@
 from opendevin.core.logger import opendevin_logger as logger
 from opendevin.core.schema import ConfigType

-__all__ = ['LLM', 'completion_cost']
+__all__ = ['LLM']

 DEFAULT_API_KEY = config.get(ConfigType.LLM_API_KEY)
 DEFAULT_BASE_URL = config.get(ConfigType.LLM_BASE_URL)
@@ -178,6 +178,28 @@ def get_token_count(self, messages):
         """
         return litellm.token_counter(model=self.model_name, messages=messages)

+    def completion_cost(self, response):
+        """
+        Calculate the cost of a completion response based on the model. Local models are treated as free.
+
+        Args:
+            response (list): A response from a model invocation.
+
+        Returns:
+            number: The cost of the response.
+        """
+        if (
+            'localhost' not in self.base_url
+            and '127.0.0.1' not in self.base_url
+            and '0.0.0.0' not in self.base_url
+        ):
+            try:
+                cost = litellm_completion_cost(completion_response=response)
+                return cost
+            except Exception:
+                logger.warning('Cost calculation not supported for this model.')
Contributor:
We should simply ignore the exception if 'Model not in model_prices_and_context_window.json' in str(e), since we are running local models and don't need to worry about the cost itself; otherwise there would be huge warnings.
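For illustration, a minimal sketch of what that filter could look like; the helper name is invented here, and the exception message string is the one quoted above rather than a verified litellm constant:

from litellm import completion_cost as litellm_completion_cost

def safe_completion_cost(response, logger):
    # Sketch of the suggested filter: stay silent only for the "unknown model"
    # pricing-lookup failure, keep warning about anything else.
    try:
        return litellm_completion_cost(completion_response=response)
    except Exception as e:
        if 'Model not in model_prices_and_context_window.json' in str(e):
            return 0.0
        logger.warning('Cost calculation not supported for this model.')
        return 0.0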

Contributor Author:
I've reached out to the LiteLLM team on how to handle this correctly. The whole point of this code is to not log a warning when running local models, only when running remote models that are unknown from a pricing perspective.

Contributor (@SmartManoj), May 10, 2024:
Got it. Then, for the time being, we should use a config or environment variable (like MISC) to decide whether to raise this exception; otherwise the user may miss the warning, and it also avoids flooding the log with warnings.
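A rough sketch of that idea follows; the environment variable name and helper function are purely illustrative, not an existing OpenDevin config key:

import os

from litellm import completion_cost as litellm_completion_cost

# Hypothetical toggle: when set, cost-calculation failures are raised instead of logged.
RAISE_COST_ERRORS = os.environ.get('OPENDEVIN_RAISE_COST_ERRORS', 'false').lower() == 'true'

def completion_cost_with_toggle(response, logger):
    try:
        return litellm_completion_cost(completion_response=response)
    except Exception:
        if RAISE_COST_ERRORS:
            raise  # surface litellm's error when the user explicitly asks for it
        logger.warning('Cost calculation not supported for this model.')
        return 0.0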

Contributor Author:
The code change that broke local models is already going to introduce one log line per step; this just puts a warning before that line, so it doesn't drastically impact logging.

+        return 0.0
+
     def __str__(self):
         if self.api_version:
             return f'LLM(model={self.model_name}, api_version={self.api_version}, base_url={self.base_url})'
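As a quick sanity check on the new behaviour, a pytest-style sketch; it deliberately bypasses the LLM constructor (whose signature is not shown in this diff) and only exercises the base_url guard added above:

from opendevin.llm.llm import LLM

def test_local_model_cost_is_zero():
    # Skip __init__ on purpose: completion_cost only needs base_url on this path.
    llm = LLM.__new__(LLM)
    llm.base_url = 'http://localhost:11434'  # hypothetical local server URL
    # For a localhost base_url the guard short-circuits before litellm's pricing
    # lookup, so no Undefined Model exception can be raised and the cost is 0.0.
    assert llm.completion_cost(response={}) == 0.0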