| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429 |
- import argparse
- import os
- import pathlib
- import platform
- from dataclasses import is_dataclass
- from types import UnionType
- from typing import Any, MutableMapping, get_args, get_origin
- from uuid import uuid4
- import toml
- from dotenv import load_dotenv
- from openhands.core import logger
- from openhands.core.config.agent_config import AgentConfig
- from openhands.core.config.app_config import AppConfig
- from openhands.core.config.config_utils import (
- OH_DEFAULT_AGENT,
- OH_MAX_ITERATIONS,
- )
- from openhands.core.config.llm_config import LLMConfig
- from openhands.core.config.sandbox_config import SandboxConfig
- from openhands.core.config.security_config import SecurityConfig
- from openhands.storage import get_file_store
- from openhands.storage.files import FileStore
# Name of the file-store entry that get_or_create_jwt_secret() reads and writes.
JWT_SECRET = '.jwt_secret'
# Executed at import time, before any config is loaded.
# NOTE(review): python-dotenv's load_dotenv() is expected to read a .env file
# into os.environ - confirm the override behavior against its documentation.
load_dotenv()
- def load_from_env(cfg: AppConfig, env_or_toml_dict: dict | MutableMapping[str, str]):
- """Reads the env-style vars and sets config attributes based on env vars or a config.toml dict.
- Compatibility with vars like LLM_BASE_URL, AGENT_MEMORY_ENABLED, SANDBOX_TIMEOUT and others.
- Args:
- cfg: The AppConfig object to set attributes on.
- env_or_toml_dict: The environment variables or a config.toml dict.
- """
- def get_optional_type(union_type: UnionType) -> Any:
- """Returns the non-None type from a Union."""
- types = get_args(union_type)
- return next((t for t in types if t is not type(None)), None)
- # helper function to set attributes based on env vars
- def set_attr_from_env(sub_config: Any, prefix=''):
- """Set attributes of a config dataclass based on environment variables."""
- for field_name, field_type in sub_config.__annotations__.items():
- # compute the expected env var name from the prefix and field name
- # e.g. LLM_BASE_URL
- env_var_name = (prefix + field_name).upper()
- if is_dataclass(field_type):
- # nested dataclass
- nested_sub_config = getattr(sub_config, field_name)
- set_attr_from_env(nested_sub_config, prefix=field_name + '_')
- elif env_var_name in env_or_toml_dict:
- # convert the env var to the correct type and set it
- value = env_or_toml_dict[env_var_name]
- # skip empty config values (fall back to default)
- if not value:
- continue
- try:
- # if it's an optional type, get the non-None type
- if get_origin(field_type) is UnionType:
- field_type = get_optional_type(field_type)
- # Attempt to cast the env var to type hinted in the dataclass
- if field_type is bool:
- cast_value = str(value).lower() in ['true', '1']
- else:
- cast_value = field_type(value)
- setattr(sub_config, field_name, cast_value)
- except (ValueError, TypeError):
- logger.openhands_logger.error(
- f'Error setting env var {env_var_name}={value}: check that the value is of the right type'
- )
- # Start processing from the root of the config object
- set_attr_from_env(cfg)
- # load default LLM config from env
- default_llm_config = cfg.get_llm_config()
- set_attr_from_env(default_llm_config, 'LLM_')
- # load default agent config from env
- default_agent_config = cfg.get_agent_config()
- set_attr_from_env(default_agent_config, 'AGENT_')
def load_from_toml(cfg: AppConfig, toml_file: str = 'config.toml'):
    """Load the config from the toml file. Supports both styles of config vars.

    A missing file is ignored silently. A file that cannot be parsed, or values
    that raise TypeError/KeyError while being applied, are reported with a
    warning and not applied.

    Without a [core] table the file is treated as old-style (flat, env-like
    keys) and handed to load_from_env(). Otherwise:
      - [agent] becomes the default agent config, and each nested table
        [agent.<name>] is registered under <name>.
      - [llm] becomes the default LLM config, and each nested table
        [llm.<name>] is registered under <name>.
      - [security] replaces cfg.security.
      - sandbox_* keys found in [core] are migrated onto cfg.sandbox; a
        [sandbox] table then replaces the sandbox config.
      - every remaining [core] key that is an attribute of cfg is set on it.
    Anything else is reported as an unknown key.

    Args:
        cfg: The AppConfig object to update attributes of.
        toml_file: The path to the toml file. Defaults to 'config.toml'.
    """
    # try to read the config.toml file into the config object
    try:
        with open(toml_file, 'r', encoding='utf-8') as toml_contents:
            toml_config = toml.load(toml_contents)
    except FileNotFoundError:
        return
    except toml.TomlDecodeError as e:
        logger.openhands_logger.warning(
            f'Cannot parse config from toml, toml values have not been applied.\nError: {e}',
            exc_info=False,
        )
        return

    # if core is not in the toml, try to use the old-style toml
    if 'core' not in toml_config:
        # re-use the env loader to set the config from env-style vars
        load_from_env(cfg, toml_config)
        return

    core_config = toml_config['core']

    # load llm configs and agent configs
    for key, value in toml_config.items():
        if not isinstance(value, dict):
            # only tables are meaningful at the top level of a new-style file
            logger.openhands_logger.warning(f'Unknown key in {toml_file}: "{key}"')
            continue

        try:
            section = key.lower()
            if section == 'agent':
                logger.openhands_logger.debug(
                    'Attempt to load default agent config from config toml'
                )
                # nested tables are named agent configs, not fields of the default one
                non_dict_fields = {
                    k: v for k, v in value.items() if not isinstance(v, dict)
                }
                agent_config = AgentConfig(**non_dict_fields)
                cfg.set_agent_config(agent_config, 'agent')
                for nested_key, nested_value in value.items():
                    if isinstance(nested_value, dict):
                        logger.openhands_logger.debug(
                            f'Attempt to load group {nested_key} from config toml as agent config'
                        )
                        agent_config = AgentConfig(**nested_value)
                        cfg.set_agent_config(agent_config, nested_key)
            elif section == 'llm':
                logger.openhands_logger.debug(
                    'Attempt to load default LLM config from config toml'
                )
                llm_config = LLMConfig.from_dict(value)
                cfg.set_llm_config(llm_config, 'llm')
                for nested_key, nested_value in value.items():
                    if isinstance(nested_value, dict):
                        logger.openhands_logger.debug(
                            f'Attempt to load group {nested_key} from config toml as llm config'
                        )
                        llm_config = LLMConfig.from_dict(nested_value)
                        cfg.set_llm_config(llm_config, nested_key)
            elif section == 'security':
                logger.openhands_logger.debug(
                    'Attempt to load security config from config toml'
                )
                security_config = SecurityConfig.from_dict(value)
                cfg.security = security_config
            elif not key.startswith('sandbox') and section != 'core':
                # [sandbox] and [core] are handled after this loop
                logger.openhands_logger.warning(
                    f'Unknown key in {toml_file}: "{key}"'
                )
        except (TypeError, KeyError) as e:
            logger.openhands_logger.warning(
                f'Cannot parse config from toml, toml values have not been applied.\n Error: {e}',
                exc_info=False,
            )

    try:
        # set sandbox config from the toml file
        sandbox_config = cfg.sandbox

        # migrate old sandbox configs from [core] section to sandbox config
        keys_to_migrate = [key for key in core_config if key.startswith('sandbox_')]
        for key in keys_to_migrate:
            new_key = key.replace('sandbox_', '')
            if new_key in sandbox_config.__annotations__:
                # read the key in sandbox and remove it from core
                setattr(sandbox_config, new_key, core_config.pop(key))
            else:
                logger.openhands_logger.warning(f'Unknown sandbox config: {key}')

        # the new style values override the old style values
        # NOTE(review): a [sandbox] table builds a fresh SandboxConfig, so values
        # migrated from [core] above are dropped wholesale rather than merged.
        if 'sandbox' in toml_config:
            sandbox_config = SandboxConfig(**toml_config['sandbox'])

        # update the config object with the new values
        cfg.sandbox = sandbox_config
        for key, value in core_config.items():
            if hasattr(cfg, key):
                setattr(cfg, key, value)
            else:
                logger.openhands_logger.warning(f'Unknown core config key: {key}')
    except (TypeError, KeyError) as e:
        logger.openhands_logger.warning(
            f'Cannot parse config from toml, toml values have not been applied.\nError: {e}',
            exc_info=False,
        )
def get_or_create_jwt_secret(file_store: FileStore) -> str:
    """Return the JWT secret kept in the file store, creating it on first use.

    Args:
        file_store: Store that is read from and, when it has no JWT_SECRET
            entry yet (FileNotFoundError on read), written to.

    Returns:
        The stored secret, or a new uuid4 hex string that was just written to
        the store under JWT_SECRET.
    """
    try:
        return file_store.read(JWT_SECRET)
    except FileNotFoundError:
        # nothing stored yet: generate a secret and persist it for later calls
        generated = uuid4().hex
        file_store.write(JWT_SECRET, generated)
        return generated
def finalize_config(cfg: AppConfig):
    """More tweaks to the config after it's been loaded.

    Mutates ``cfg`` in place:
      - makes workspace_base absolute and uses it as workspace_mount_path when
        no mount path is set;
      - applies workspace_mount_rewrite ("<old>:<new>") to the workspace base
        (or the current directory when there is no base) to derive the mount
        path; a value without both parts is ignored with a warning;
      - for every LLM config, makes log_completions_folder absolute and
        defaults embedding_base_url to base_url;
      - warns when host network mode is enabled on macOS;
      - creates cache_dir if it is set;
      - fills in jwt_secret from the file store when it is empty.

    Args:
        cfg: The AppConfig object to finalize.
    """
    if cfg.workspace_base is not None:
        cfg.workspace_base = os.path.abspath(cfg.workspace_base)

    if cfg.workspace_mount_path is None:
        cfg.workspace_mount_path = cfg.workspace_base

    if cfg.workspace_mount_rewrite:
        base = cfg.workspace_base or os.getcwd()
        parts = cfg.workspace_mount_rewrite.split(':')
        if len(parts) < 2 or not parts[0]:
            # without a ':' there is no replacement part, and an empty left
            # side would make str.replace insert the new text between every
            # character of the path
            logger.openhands_logger.warning(
                f'Ignoring workspace_mount_rewrite "{cfg.workspace_mount_rewrite}": expected "<old>:<new>"'
            )
        else:
            cfg.workspace_mount_path = base.replace(parts[0], parts[1])

    # make sure log_completions_folder is an absolute path
    for llm in cfg.llms.values():
        llm.log_completions_folder = os.path.abspath(llm.log_completions_folder)
        if llm.embedding_base_url is None:
            llm.embedding_base_url = llm.base_url

    if cfg.sandbox.use_host_network and platform.system() == 'Darwin':
        logger.openhands_logger.warning(
            'Please upgrade to Docker Desktop 4.29.0 or later to use host network mode on macOS. '
            'See https://github.com/docker/roadmap/issues/238#issuecomment-2044688144 for more information.'
        )

    # make sure cache dir exists
    if cfg.cache_dir:
        pathlib.Path(cfg.cache_dir).mkdir(parents=True, exist_ok=True)

    if not cfg.jwt_secret:
        cfg.jwt_secret = get_or_create_jwt_secret(
            get_file_store(cfg.file_store, cfg.file_store_path)
        )
# Utility function for loading a named [llm.<group>] section, e.g. the value of the --llm-config command line argument
def get_llm_config_arg(
    llm_config_arg: str, toml_file: str = 'config.toml'
) -> LLMConfig | None:
    """Get a group of llm settings from the config file.

    A group in config.toml can look like this:

    ```
    [llm.gpt-3.5-for-eval]
    model = 'gpt-3.5-turbo'
    api_key = '...'
    temperature = 0.5
    num_retries = 8
    ...
    ```

    The user-defined group name, like "gpt-3.5-for-eval", is the argument to this function. The function builds an LLMConfig object
    from the settings of this group in the config file and returns it; it does not modify any AppConfig.

    Note that the group must be under "llm" group, or in other words, the group name must start with "llm.".
    Surrounding brackets and a leading "llm." in the argument are stripped, so "[llm.foo]", "llm.foo" and "foo" are equivalent.

    Args:
        llm_config_arg: The group of llm settings to get from the config.toml file.
        toml_file: Path to the configuration file to read from. Defaults to 'config.toml'.

    Returns:
        LLMConfig: The LLMConfig object with the settings from the config file, or None when the file is
        missing or unparsable, or when it has no table with that name under [llm].
    """
    # keep only the name, just in case
    llm_config_arg = llm_config_arg.strip('[]')

    # truncate the prefix, just in case
    llm_config_arg = llm_config_arg.removeprefix('llm.')

    logger.openhands_logger.debug(f'Loading llm config from {llm_config_arg}')

    # load the toml file
    try:
        with open(toml_file, 'r', encoding='utf-8') as toml_contents:
            toml_config = toml.load(toml_contents)
    except FileNotFoundError as e:
        logger.openhands_logger.error(f'Config file not found: {e}')
        return None
    except toml.TomlDecodeError as e:
        logger.openhands_logger.error(
            f'Cannot parse llm group from {llm_config_arg}. Exception: {e}'
        )
        return None

    # update the llm config with the specified section; both [llm] and the
    # group must be tables - a scalar key such as llm.model is not a group
    llm_section = toml_config.get('llm')
    if isinstance(llm_section, dict):
        group = llm_section.get(llm_config_arg)
        if isinstance(group, dict):
            return LLMConfig.from_dict(group)

    logger.openhands_logger.debug(f'Loading from toml failed for {llm_config_arg}')
    return None
# Command line arguments
def get_parser() -> argparse.ArgumentParser:
    """Build the parser for the command line arguments.

    Returns:
        An ArgumentParser with all supported options registered in the order
        in which they are listed below.
    """
    # one entry per option: (option strings, keyword arguments for add_argument)
    option_table = (
        (
            ('--config-file',),
            {
                'type': str,
                'default': 'config.toml',
                'help': 'Path to the config file (default: config.toml in the current directory)',
            },
        ),
        (
            ('-d', '--directory'),
            {'type': str, 'help': 'The working directory for the agent'},
        ),
        (
            ('-t', '--task'),
            {
                'type': str,
                'default': '',
                'help': 'The task for the agent to perform',
            },
        ),
        (
            ('-f', '--file'),
            {
                'type': str,
                'help': 'Path to a file containing the task. Overrides -t if both are provided.',
            },
        ),
        (
            ('-c', '--agent-cls'),
            {
                'default': OH_DEFAULT_AGENT,
                'type': str,
                'help': 'Name of the default agent to use',
            },
        ),
        (
            ('-i', '--max-iterations'),
            {
                'default': OH_MAX_ITERATIONS,
                'type': int,
                'help': 'The maximum number of iterations to run the agent',
            },
        ),
        (
            ('-b', '--max-budget-per-task'),
            {
                'type': float,
                'help': 'The maximum budget allowed per task, beyond which the agent will stop.',
            },
        ),
        # --eval configs are for evaluations only
        (
            ('--eval-output-dir',),
            {
                'default': 'evaluation/evaluation_outputs/outputs',
                'type': str,
                'help': 'The directory to save evaluation output',
            },
        ),
        (
            ('--eval-n-limit',),
            {
                'default': None,
                'type': int,
                'help': 'The number of instances to evaluate',
            },
        ),
        (
            ('--eval-num-workers',),
            {
                'default': 4,
                'type': int,
                'help': 'The number of workers to use for evaluation',
            },
        ),
        (
            ('--eval-note',),
            {
                'default': None,
                'type': str,
                'help': 'The note to add to the evaluation directory',
            },
        ),
        (
            ('-l', '--llm-config'),
            {
                'default': None,
                'type': str,
                'help': 'Replace default LLM ([llm] section in config.toml) config with the specified LLM config, e.g. "llama3" for [llm.llama3] section in config.toml',
            },
        ),
        (
            ('-n', '--name'),
            {
                'default': 'default',
                'type': str,
                'help': 'Name for the session',
            },
        ),
        (
            ('--eval-ids',),
            {
                'default': None,
                'type': str,
                'help': 'The comma-separated list (in quotes) of IDs of the instances to evaluate',
            },
        ),
        (
            ('--no-auto-continue',),
            {
                'action': 'store_true',
                'help': 'Disable automatic "continue" responses. Will read from stdin instead.',
            },
        ),
    )

    cli = argparse.ArgumentParser(description='Run an agent with a specific task')
    for option_strings, settings in option_table:
        cli.add_argument(*option_strings, **settings)
    return cli
def parse_arguments() -> argparse.Namespace:
    """Parse the command line with the parser built by get_parser().

    Uses parse_known_args, so arguments the parser does not define are
    discarded instead of being treated as an error.

    Returns:
        The namespace holding the recognized arguments.
    """
    recognized, _unrecognized = get_parser().parse_known_args()
    return recognized
def load_app_config(
    set_logging_levels: bool = True, config_file: str = 'config.toml'
) -> AppConfig:
    """Build an AppConfig from the config file and the environment variables.

    The toml file is applied first and the process environment second, then
    finalize_config() runs on the result.

    Args:
        set_logging_levels: Whether to copy the debug and disable_color settings
            onto the logger module's DEBUG and DISABLE_COLOR_PRINTING globals.
        config_file: Path to the config file. Defaults to 'config.toml' in the current directory.

    Returns:
        The loaded and finalized AppConfig.
    """
    app_config = AppConfig()

    # order matters: each step works on what the previous one left behind
    load_from_toml(app_config, config_file)
    load_from_env(app_config, os.environ)
    finalize_config(app_config)

    if not set_logging_levels:
        return app_config

    logger.DEBUG = app_config.debug
    logger.DISABLE_COLOR_PRINTING = app_config.disable_color
    return app_config
|