define dict in run_args yaml
danrgll committed Jun 13, 2024
1 parent 3b4769a commit 85c9fa5
Showing 4 changed files with 60 additions and 62 deletions.
7 changes: 6 additions & 1 deletion neps/api.py
@@ -314,7 +314,7 @@ def run(

    # Check to verify if the target directory contains history of another optimizer state
    # This check is performed only when the `searcher` is built during the run
    if not isinstance(searcher, (BaseOptimizer, str)):
    if not isinstance(searcher, (BaseOptimizer, str, dict)):
        raise ValueError(
            f"Unrecognized `searcher` of type {type(searcher)}. Not str or BaseOptimizer."
        )
@@ -417,6 +417,11 @@ def _run_args(
        config, searcher = get_searcher_data(searcher, loading_custom_searcher=True)
        searcher_info["searcher_selection"] = "user-yaml"
        searcher_info["neps_decision_tree"] = False
    elif isinstance(searcher, dict):
        config = searcher
        searcher = config.pop("name", "unnamed-custom-searcher")
        searcher_info["searcher_selection"] = "user-yaml"
        searcher_info["neps_decision_tree"] = False
    else:
        if searcher in ["default", None]:
            # NePS decides the searcher according to the pipeline space.
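With this change, the `searcher` argument of `neps.run` may also be a plain dictionary holding the optimizer configuration, in addition to a string name or a `BaseOptimizer` instance; an optional "name" key is popped off and recorded, falling back to "unnamed-custom-searcher". A minimal sketch of such a call, assuming `run_pipeline` and `pipeline_space` are defined elsewhere and using illustrative paths and keys that mirror the searcher YAML template further down (this is not code from the commit itself):

import neps

# Hedged sketch: the searcher settings are passed inline as a dict.
# "name" is optional; without it the run is recorded as "unnamed-custom-searcher".
searcher_config = {
    "name": "my-custom-bo",  # hypothetical label
    "algorithm": "bayesian_optimization",
    "acquisition_sampler": "random",
    "random_interleave_prob": 0.1,
}

neps.run(
    run_pipeline=run_pipeline,        # assumed to be defined by the user
    pipeline_space=pipeline_space,    # assumed to be defined by the user
    root_directory="results/inline_searcher_example",  # illustrative path
    max_evaluations_total=20,
    searcher=searcher_config,
)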
99 changes: 43 additions & 56 deletions neps/utils/run_args_from_yaml.py
@@ -6,6 +6,7 @@
from typing import Callable, Optional, Dict, Tuple, List, Any
import inspect
from neps.search_spaces.search_space import pipeline_space_from_yaml
from pathlib import Path

logger = logging.getLogger("neps")

@@ -189,11 +190,10 @@ def handle_special_argument_cases(settings: Dict, special_configs: Dict) -> None
    - None: The function modifies 'settings' in place.
    """
    # Load the value of each key from a dictionary specifying "path" and "name".
    process_config_key(
        settings, special_configs, [SEARCHER, RUN_PIPELINE]
    )
    # process special configs
    process_run_pipeline(RUN_PIPELINE, special_configs, settings)
    process_pipeline_space(PIPELINE_SPACE, special_configs, settings)
    process_searcher(SEARCHER, special_configs, settings)
    if special_configs[SEARCHER_KWARGS] is not None:
        configs = {}
        # Check if values of keys is not None and then add the dict to settings
@@ -209,55 +209,7 @@ def handle_special_argument_cases(settings: Dict, special_configs: Dict) -> None
    settings[PRE_LOAD_HOOKS] = load_hooks_from_config(special_configs[PRE_LOAD_HOOKS])


def process_config_key(settings: Dict, special_configs: Dict, keys: List) -> None:
    """
    Enhance 'settings' by adding keys and their corresponding values or loaded objects
    from 'special_configs'. Keys in 'special_configs' are processed to directly insert
    their values into 'settings' or to load functions/objects using 'path' and 'name'.
    Key handling varies: 'RUN_PIPELINE' requires a dictionary defining a loadable
    function, whereas other keys may accept either strings or dictionaries.

    Parameters:
    - settings (dict): Dictionary to update.
    - special_configs (dict): Contains keys and values for processing.
    - keys (list): List of keys to process in 'special_configs'.

    Raises:
    - KeyError: Missing 'path'/'name' for dictionaries.
    - TypeError: Incorrect type for key's value; RUN_PIPELINE must be a dict,
      others can be dict or string.
    """
    for key in keys:
        if special_configs.get(key) is not None:
            value = special_configs[key]
            if isinstance(value, str) and key != RUN_PIPELINE:
                # searcher can be a string
                settings[key] = value
            elif isinstance(value, dict):
                # dict that should contain 'path' and 'name' for loading value
                try:
                    func = load_and_return_object(value["path"], value["name"], key)
                    settings[key] = func
                except KeyError as e:
                    raise KeyError(
                        f"Missing key for argument {key}: {e}. Expect 'path' "
                        f"and 'name' as keys when loading '{key}' "
                        f"from 'run_args'"
                    ) from e
            else:
                if key == RUN_PIPELINE:
                    raise TypeError(
                        f"Value for {key} must be a dictionary, but got "
                        f"{type(value).__name__}."
                    )
                else:
                    raise TypeError(
                        f"Value for {key} must be a string or a dictionary, "
                        f"but got {type(value).__name__}."
                    )


def process_pipeline_space(key, special_configs, settings):
def process_pipeline_space(key: str, special_configs: Dict, settings: Dict):
    """
    Process or load the pipeline space configuration.
@@ -289,19 +241,54 @@ def process_pipeline_space(key, special_configs, settings):
            else:
                # pipeline_space stored in a python dict, not using a yaml
                processed_pipeline_space = load_and_return_object(
                    pipeline_space["path"], pipeline_space["name"], PIPELINE_SPACE)
                processed_pipeline_space = load_and_return_object(
                    pipeline_space["path"], pipeline_space["name"], key)
        elif isinstance(pipeline_space, str):
            # load yaml from path
            processed_pipeline_space = pipeline_space_from_yaml(pipeline_space)
        else:
            raise TypeError(
                f"Value for {PIPELINE_SPACE} must be a string or a dictionary, "
                f"Value for {key} must be a string or a dictionary, "
                f"but got {type(pipeline_space).__name__}."
            )
        settings[key] = processed_pipeline_space


def process_searcher(key: str, special_configs: Dict, settings: Dict):
    if special_configs.get(key) is not None:
        searcher = special_configs[key]
        if isinstance(searcher, dict):
            # determine if dict contains path_loading or the actual searcher config
            expected_keys = {"path", "name"}
            actual_keys = set(searcher.keys())
            if expected_keys == actual_keys:
                searcher = load_and_return_object(searcher["path"], searcher["name"],
                                                  key)
        elif isinstance(searcher, (str, Path)):
            pass
        else:
            raise TypeError(
                f"Value for {key} must be a string or a dictionary, "
                f"but got {type(searcher).__name__}."
            )
        settings[key] = searcher


def process_run_pipeline(key: str, special_configs: Dict, settings: Dict):
    if special_configs.get(key) is not None:
        config = special_configs[key]
        try:
            func = load_and_return_object(config["path"], config["name"], key)
            settings[key] = func
        except KeyError as e:
            raise KeyError(
                f"Missing key for argument {key}: {e}. Expect 'path' "
                f"and 'name' as keys when loading '{key}' "
                f"from 'run_args'"
            ) from e


def load_and_return_object(module_path: str, object_name: str, key: str) -> object:
"""
Dynamically loads an object from a given module file path.
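Taken together, the refactor replaces the generic `process_config_key` with dedicated helpers: `process_run_pipeline` still requires a `{path, name}` dict to import the target function, while `process_searcher` now accepts three shapes for the `searcher` entry of `run_args`. A small standalone sketch of those shapes as Python values, with hypothetical file names, for illustration only (not library code):

from pathlib import Path

# 1) exactly {"path", "name"}: the searcher object is imported via load_and_return_object
searcher_as_reference = {
    "path": "my_searchers/custom_bo.py",  # hypothetical file
    "name": "CustomBO",                   # hypothetical object name
}

# 2) any other dict: kept as-is and treated as the inline optimizer configuration
searcher_as_inline_config = {
    "algorithm": "bayesian_optimization",
    "acquisition_sampler": "random",
    "random_interleave_prob": 0.1,
}

# 3) str or Path: passed through unchanged, e.g. a built-in searcher keyword
#    or a path to a searcher YAML
searcher_as_name = "bayesian_optimization"
searcher_as_yaml_path = Path("configs/my_searcher.yaml")  # hypothetical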
@@ -1,17 +1,21 @@
run_pipeline:
  path: path/to/your/run_pipeline.py # Path to the function file
  name: example_pipeline # Function name within the file
  path: tests/test_yaml_run_args/test_declarative_usage_docs/run_pipeline.py
  name: run_pipeline_constant

pipeline_space:
  learning_rate:
    lower: 1e-5
    upper: 1e-1
    log: True # Log scale for learning rate
  epochs:
    lower: 5
    upper: 20
    is_fidelity: True
  optimizer:
    choices: [adam, sgd, adamw]
  epochs: 50
  batch_size: 64

root_directory: path/to/results # Directory for result storage
root_directory: path/to/results/custominizing_neps_optimizer # Directory for result storage
max_evaluations_total: 20 # Budget
searcher:
  algorithm: bayesian_optimization # name linked with neps keywords, more information click here..?
@@ -22,3 +26,4 @@ searcher:
  acquisition_sampler: random
  random_interleave_prob: 0.1

overwrite_working_directory: True
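The template above is meant to be consumed declaratively; judging from the test added below, it is stored as customizing_neps_optimizer.yaml in the declarative-usage-docs test folder. A hedged sketch of launching it, where the exact file location is an assumption inferred from the paths visible in this diff:

import neps

# Everything, including run_pipeline and the searcher dict, comes from the YAML.
neps.run(
    run_args="tests/test_yaml_run_args/test_declarative_usage_docs/"
             "customizing_neps_optimizer.yaml"  # assumed location
)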
@@ -9,7 +9,8 @@
@pytest.mark.parametrize("yaml_file", [
"simple_example_including_run_pipeline.yaml",
"full_configuration_template.yaml",
"defining_hooks.yaml"
"defining_hooks.yaml",
"customizing_neps_optimizer.yaml"
])
def test_run_with_yaml(yaml_file: str) -> None:
"""
