Bläddra i källkod

fix: add llm `drop_params` parameter to LLMConfig (#2471)

* feat: add drop_params to LLMConfig

* Update opendevin/llm/llm.py

Fix use of unknown method.

Co-authored-by: மனோஜ்குமார் பழனிச்சாமி <smartmanoj42857@gmail.com>

---------

Co-authored-by: மனோஜ்குமார் பழனிச்சாமி <smartmanoj42857@gmail.com>
tobitege 1 år sedan
förälder
incheckning
d50a8447ad

+ 2 - 1
docs/modules/usage/llms/llms.md

@@ -15,13 +15,14 @@ OpenDevin will issue many prompts to the LLM you configure. Most of these LLMs c
 The `LLM_MODEL` environment variable controls which model is used in programmatic interactions.
 The `LLM_MODEL` environment variable controls which model is used in programmatic interactions.
 But when using the OpenDevin UI, you'll need to choose your model in the settings window.
 But when using the OpenDevin UI, you'll need to choose your model in the settings window.
 
 
-The following environment variables might be necessary for some LLMs:
+The following environment variables might be necessary for some LLMs/providers:
 
 
 - `LLM_API_KEY`
 - `LLM_API_KEY`
 - `LLM_BASE_URL`
 - `LLM_BASE_URL`
 - `LLM_EMBEDDING_MODEL`
 - `LLM_EMBEDDING_MODEL`
 - `LLM_EMBEDDING_DEPLOYMENT_NAME`
 - `LLM_EMBEDDING_DEPLOYMENT_NAME`
 - `LLM_API_VERSION`
 - `LLM_API_VERSION`
+- `LLM_DROP_PARAMS`
 
 
 We have a few guides for running OpenDevin with specific model providers:
 We have a few guides for running OpenDevin with specific model providers:
 
 

+ 2 - 0
opendevin/core/config.py

@@ -49,6 +49,7 @@ class LLMConfig:
        input_cost_per_token: The cost per input token. This will be available in logs for the user to check.
        input_cost_per_token: The cost per input token. This will be available in logs for the user to check.
        output_cost_per_token: The cost per output token. This will be available in logs for the user to check.
        output_cost_per_token: The cost per output token. This will be available in logs for the user to check.
         ollama_base_url: The base URL for the OLLAMA API.
         ollama_base_url: The base URL for the OLLAMA API.
+        drop_params: Drop any unmapped (unsupported) params without causing an exception.
     """
     """
 
 
     model: str = 'gpt-4o'
     model: str = 'gpt-4o'
@@ -75,6 +76,7 @@ class LLMConfig:
     input_cost_per_token: float | None = None
     input_cost_per_token: float | None = None
     output_cost_per_token: float | None = None
     output_cost_per_token: float | None = None
     ollama_base_url: str | None = None
     ollama_base_url: str | None = None
+    drop_params: bool | None = None
 
 
     def defaults_to_dict(self) -> dict:
     def defaults_to_dict(self) -> dict:
         """Serialize fields to a dict for the frontend, including type hints, defaults, and whether it's optional."""
         """Serialize fields to a dict for the frontend, including type hints, defaults, and whether it's optional."""

+ 1 - 0
opendevin/core/schema/config.py

@@ -4,6 +4,7 @@ from enum import Enum
 class ConfigType(str, Enum):
 class ConfigType(str, Enum):
     # For frontend
     # For frontend
     LLM_CUSTOM_LLM_PROVIDER = 'LLM_CUSTOM_LLM_PROVIDER'
     LLM_CUSTOM_LLM_PROVIDER = 'LLM_CUSTOM_LLM_PROVIDER'
+    LLM_DROP_PARAMS = 'LLM_DROP_PARAMS'
     LLM_MAX_INPUT_TOKENS = 'LLM_MAX_INPUT_TOKENS'
     LLM_MAX_INPUT_TOKENS = 'LLM_MAX_INPUT_TOKENS'
     LLM_MAX_OUTPUT_TOKENS = 'LLM_MAX_OUTPUT_TOKENS'
     LLM_MAX_OUTPUT_TOKENS = 'LLM_MAX_OUTPUT_TOKENS'
     LLM_TOP_P = 'LLM_TOP_P'
     LLM_TOP_P = 'LLM_TOP_P'

+ 8 - 4
opendevin/llm/llm.py

@@ -52,7 +52,6 @@ class LLM:
         Args:
         Args:
             config: The LLM configuration
             config: The LLM configuration
         """
         """
-
         self.config = copy.deepcopy(config)
         self.config = copy.deepcopy(config)
         self.metrics = metrics if metrics is not None else Metrics()
         self.metrics = metrics if metrics is not None else Metrics()
         self.cost_metric_supported = True
         self.cost_metric_supported = True
@@ -60,10 +59,12 @@ class LLM:
         # litellm actually uses base Exception here for unknown model
         # litellm actually uses base Exception here for unknown model
         self.model_info = None
         self.model_info = None
         try:
         try:
-            if not config.model.startswith('openrouter'):
-                self.model_info = litellm.get_model_info(config.model.split(':')[0])
+            if self.config.model.startswith('openrouter'):
+                self.model_info = litellm.get_model_info(self.config.model)
             else:
             else:
-                self.model_info = litellm.get_model_info(config.model)
+                self.model_info = litellm.get_model_info(
+                    self.config.model.split(':')[0]
+                )
         # noinspection PyBroadException
         # noinspection PyBroadException
         except Exception:
         except Exception:
             logger.warning(f'Could not get model info for {config.model}')
             logger.warning(f'Could not get model info for {config.model}')
@@ -91,6 +92,9 @@ class LLM:
                 # Max output tokens for gpt3.5, so this is a safe fallback for any potentially viable model
                 # Max output tokens for gpt3.5, so this is a safe fallback for any potentially viable model
                 self.config.max_output_tokens = 1024
                 self.config.max_output_tokens = 1024
 
 
+        if self.config.drop_params:
+            litellm.drop_params = self.config.drop_params
+
         self._completion = partial(
         self._completion = partial(
             litellm_completion,
             litellm_completion,
             model=self.config.model,
             model=self.config.model,