From 28b9264df7a0b144fe8412b3afa0b684f5c9b0d4 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 20 Jan 2026 04:07:39 +0000
Subject: [PATCH 1/4] Initial plan


From ea0e37f6e2d770e4c3da0b9802f829bb0887e0a3 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 20 Jan 2026 04:11:10 +0000
Subject: [PATCH 2/4] Add hierarchical search space documentation to
 Tune-User-Defined-Function.md

Co-authored-by: thinkall <3197038+thinkall@users.noreply.github.com>
---
 .../Use-Cases/Tune-User-Defined-Function.md   | 141 ++++++++++++++++++
 1 file changed, 141 insertions(+)

diff --git a/website/docs/Use-Cases/Tune-User-Defined-Function.md b/website/docs/Use-Cases/Tune-User-Defined-Function.md
index f565feef4d..1e3e30bfe0 100644
--- a/website/docs/Use-Cases/Tune-User-Defined-Function.md
+++ b/website/docs/Use-Cases/Tune-User-Defined-Function.md
@@ -181,6 +181,147 @@ config = {
 
 <!-- Please refer to [ray.tune](https://docs.ray.io/en/latest/tune/api_docs/search_space.html#overview) for a more comprehensive introduction about possible choices of the domain. -->
 
+#### Hierarchical search space
+
+A hierarchical (or conditional) search space allows you to define hyperparameters that depend on the value of other hyperparameters. This is useful when different choices for a categorical hyperparameter require different sets of hyperparameters.
+
+For example, if you're tuning a machine learning pipeline where different models require different hyperparameters, or when the choice of an optimizer determines which optimizer-specific hyperparameters are relevant.
+
+**Syntax**: To create a hierarchical search space, use `tune.choice()` with a list where some elements are dictionaries containing nested hyperparameter definitions.
+
+**Example 1: Model selection with model-specific hyperparameters**
+
+In this example, we have two model types (linear and tree-based), each with their own specific hyperparameters:
+
+```python
+from flaml import tune
+
+search_space = {
+    "model": tune.choice([
+        {
+            "model_type": "linear",
+            "learning_rate": tune.loguniform(1e-4, 1e-1),
+            "regularization": tune.uniform(0, 1),
+        },
+        {
+            "model_type": "tree",
+            "n_estimators": tune.randint(10, 100),
+            "max_depth": tune.randint(3, 10),
+        },
+    ]),
+    # Common hyperparameters for all models
+    "batch_size": tune.choice([32, 64, 128]),
+}
+
+def evaluate_config(config):
+    model_config = config["model"]
+    if model_config["model_type"] == "linear":
+        # Use learning_rate and regularization
+        score = train_linear_model(
+            lr=model_config["learning_rate"],
+            reg=model_config["regularization"],
+            batch_size=config["batch_size"]
+        )
+    else:  # tree
+        # Use n_estimators and max_depth
+        score = train_tree_model(
+            n_est=model_config["n_estimators"],
+            depth=model_config["max_depth"],
+            batch_size=config["batch_size"]
+        )
+    return {"score": score}
+
+# Run tuning
+analysis = tune.run(
+    evaluate_config,
+    config=search_space,
+    metric="score",
+    mode="min",
+    num_samples=20,
+)
+```
+
+**Example 2: Mixed choices with constants and nested spaces**
+
+You can also mix constant values with nested hyperparameter spaces in `tune.choice()`:
+
+```python
+search_space = {
+    "optimizer": tune.choice([
+        "sgd",  # constant value
+        {
+            "optimizer_type": "adam",
+            "beta1": tune.uniform(0.8, 0.99),
+            "beta2": tune.uniform(0.9, 0.999),
+        },
+        {
+            "optimizer_type": "rmsprop",
+            "decay": tune.loguniform(1e-3, 1e-1),
+            "momentum": tune.uniform(0, 0.99),
+        },
+    ]),
+    "learning_rate": tune.loguniform(1e-5, 1e-1),
+}
+
+def evaluate_config(config):
+    optimizer_config = config["optimizer"]
+    if optimizer_config == "sgd":
+        optimizer = create_sgd_optimizer(lr=config["learning_rate"])
+    elif optimizer_config["optimizer_type"] == "adam":
+        optimizer = create_adam_optimizer(
+            lr=config["learning_rate"],
+            beta1=optimizer_config["beta1"],
+            beta2=optimizer_config["beta2"],
+        )
+    else:  # rmsprop
+        optimizer = create_rmsprop_optimizer(
+            lr=config["learning_rate"],
+            decay=optimizer_config["decay"],
+            momentum=optimizer_config["momentum"],
+        )
+    return train_model(optimizer)
+```
+
+**Example 3: Nested hierarchical spaces**
+
+You can also nest dictionaries within the search space for organizing related hyperparameters:
+
+```python
+search_space = {
+    "preprocessing": {
+        "normalize": tune.choice([True, False]),
+        "feature_selection": tune.choice(["none", "pca", "lda"]),
+    },
+    "model": tune.choice([
+        {
+            "type": "neural_net",
+            "layers": tune.randint(1, 5),
+            "units_per_layer": tune.randint(32, 256),
+        },
+        {
+            "type": "ensemble",
+            "n_models": tune.randint(3, 10),
+        },
+    ]),
+}
+
+def evaluate_config(config):
+    # Access nested hyperparameters
+    normalize = config["preprocessing"]["normalize"]
+    feature_selection = config["preprocessing"]["feature_selection"]
+    model_config = config["model"]
+    
+    # Use the hyperparameters accordingly
+    score = train_with_config(normalize, feature_selection, model_config)
+    return {"score": score}
+```
+
+**Notes:**
+- When a configuration is sampled, only the selected branch of the hierarchical space will be active.
+- The evaluation function should check which choice was selected and use the corresponding nested hyperparameters.
+- Hierarchical search spaces work with all FLAML search algorithms (CFO, BlendSearch).
+- You can specify `low_cost_partial_config` for hierarchical spaces as well by providing the path to the nested parameters.
+
 #### Cost-related hyperparameters
 
 Cost-related hyperparameters are a subset of the hyperparameters which directly affect the computation cost incurred in the evaluation of any hyperparameter configuration. For example, the number of estimators (`n_estimators`) and the maximum number of leaves (`max_leaves`) are known to affect the training cost of tree-based learners. So they are cost-related hyperparameters for tree-based learners.

From 0d186e01abbebf05ca2a22227164a63eb81be6be Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 20 Jan 2026 04:13:34 +0000
Subject: [PATCH 3/4] Add clarifying comments to hierarchical search space
 examples

Co-authored-by: thinkall <3197038+thinkall@users.noreply.github.com>
---
 website/docs/Use-Cases/Tune-User-Defined-Function.md | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/website/docs/Use-Cases/Tune-User-Defined-Function.md b/website/docs/Use-Cases/Tune-User-Defined-Function.md
index 1e3e30bfe0..b82be12625 100644
--- a/website/docs/Use-Cases/Tune-User-Defined-Function.md
+++ b/website/docs/Use-Cases/Tune-User-Defined-Function.md
@@ -217,6 +217,7 @@ def evaluate_config(config):
     model_config = config["model"]
     if model_config["model_type"] == "linear":
         # Use learning_rate and regularization
+        # train_linear_model() is a placeholder for your actual training code
         score = train_linear_model(
             lr=model_config["learning_rate"],
             reg=model_config["regularization"],
@@ -224,6 +225,7 @@ def evaluate_config(config):
         )
     else:  # tree
         # Use n_estimators and max_depth
+        # train_tree_model() is a placeholder for your actual training code
         score = train_tree_model(
             n_est=model_config["n_estimators"],
             depth=model_config["max_depth"],
@@ -279,6 +281,7 @@ def evaluate_config(config):
             decay=optimizer_config["decay"],
             momentum=optimizer_config["momentum"],
         )
+    # train_model() is a placeholder for your actual training code
     return train_model(optimizer)
 ```
 
@@ -312,6 +315,7 @@ def evaluate_config(config):
     model_config = config["model"]
     
     # Use the hyperparameters accordingly
+    # train_with_config() is a placeholder for your actual training code
     score = train_with_config(normalize, feature_selection, model_config)
     return {"score": score}
 ```

From 554aea54bda0791f00530900483216801138d33f Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 20 Jan 2026 15:39:19 +0000
Subject: [PATCH 4/4] Fix formatting issues with pre-commit

Co-authored-by: thinkall <3197038+thinkall@users.noreply.github.com>
---
 .../Use-Cases/Tune-User-Defined-Function.md   | 89 +++++++++++--------
 1 file changed, 50 insertions(+), 39 deletions(-)

diff --git a/website/docs/Use-Cases/Tune-User-Defined-Function.md b/website/docs/Use-Cases/Tune-User-Defined-Function.md
index b82be12625..7a1afb364a 100644
--- a/website/docs/Use-Cases/Tune-User-Defined-Function.md
+++ b/website/docs/Use-Cases/Tune-User-Defined-Function.md
@@ -197,22 +197,25 @@ In this example, we have two model types (linear and tree-based), each with thei
 from flaml import tune
 
 search_space = {
-    "model": tune.choice([
-        {
-            "model_type": "linear",
-            "learning_rate": tune.loguniform(1e-4, 1e-1),
-            "regularization": tune.uniform(0, 1),
-        },
-        {
-            "model_type": "tree",
-            "n_estimators": tune.randint(10, 100),
-            "max_depth": tune.randint(3, 10),
-        },
-    ]),
+    "model": tune.choice(
+        [
+            {
+                "model_type": "linear",
+                "learning_rate": tune.loguniform(1e-4, 1e-1),
+                "regularization": tune.uniform(0, 1),
+            },
+            {
+                "model_type": "tree",
+                "n_estimators": tune.randint(10, 100),
+                "max_depth": tune.randint(3, 10),
+            },
+        ]
+    ),
     # Common hyperparameters for all models
     "batch_size": tune.choice([32, 64, 128]),
 }
 
+
 def evaluate_config(config):
     model_config = config["model"]
     if model_config["model_type"] == "linear":
@@ -221,7 +224,7 @@ def evaluate_config(config):
         score = train_linear_model(
             lr=model_config["learning_rate"],
             reg=model_config["regularization"],
-            batch_size=config["batch_size"]
+            batch_size=config["batch_size"],
         )
     else:  # tree
         # Use n_estimators and max_depth
@@ -229,10 +232,11 @@ def evaluate_config(config):
         score = train_tree_model(
             n_est=model_config["n_estimators"],
             depth=model_config["max_depth"],
-            batch_size=config["batch_size"]
+            batch_size=config["batch_size"],
         )
     return {"score": score}
 
+
 # Run tuning
 analysis = tune.run(
     evaluate_config,
@@ -249,22 +253,25 @@ You can also mix constant values with nested hyperparameter spaces in `tune.choi
 
 ```python
 search_space = {
-    "optimizer": tune.choice([
-        "sgd",  # constant value
-        {
-            "optimizer_type": "adam",
-            "beta1": tune.uniform(0.8, 0.99),
-            "beta2": tune.uniform(0.9, 0.999),
-        },
-        {
-            "optimizer_type": "rmsprop",
-            "decay": tune.loguniform(1e-3, 1e-1),
-            "momentum": tune.uniform(0, 0.99),
-        },
-    ]),
+    "optimizer": tune.choice(
+        [
+            "sgd",  # constant value
+            {
+                "optimizer_type": "adam",
+                "beta1": tune.uniform(0.8, 0.99),
+                "beta2": tune.uniform(0.9, 0.999),
+            },
+            {
+                "optimizer_type": "rmsprop",
+                "decay": tune.loguniform(1e-3, 1e-1),
+                "momentum": tune.uniform(0, 0.99),
+            },
+        ]
+    ),
     "learning_rate": tune.loguniform(1e-5, 1e-1),
 }
 
+
 def evaluate_config(config):
     optimizer_config = config["optimizer"]
     if optimizer_config == "sgd":
@@ -295,25 +302,28 @@ search_space = {
         "normalize": tune.choice([True, False]),
         "feature_selection": tune.choice(["none", "pca", "lda"]),
     },
-    "model": tune.choice([
-        {
-            "type": "neural_net",
-            "layers": tune.randint(1, 5),
-            "units_per_layer": tune.randint(32, 256),
-        },
-        {
-            "type": "ensemble",
-            "n_models": tune.randint(3, 10),
-        },
-    ]),
+    "model": tune.choice(
+        [
+            {
+                "type": "neural_net",
+                "layers": tune.randint(1, 5),
+                "units_per_layer": tune.randint(32, 256),
+            },
+            {
+                "type": "ensemble",
+                "n_models": tune.randint(3, 10),
+            },
+        ]
+    ),
 }
 
+
 def evaluate_config(config):
     # Access nested hyperparameters
     normalize = config["preprocessing"]["normalize"]
     feature_selection = config["preprocessing"]["feature_selection"]
     model_config = config["model"]
-    
+
     # Use the hyperparameters accordingly
     # train_with_config() is a placeholder for your actual training code
     score = train_with_config(normalize, feature_selection, model_config)
@@ -321,6 +331,7 @@ def evaluate_config(config):
 ```
 
 **Notes:**
+
 - When a configuration is sampled, only the selected branch of the hierarchical space will be active.
 - The evaluation function should check which choice was selected and use the corresponding nested hyperparameters.
 - Hierarchical search spaces work with all FLAML search algorithms (CFO, BlendSearch).