From e08be810108129db7f8b438f84c762091647775e Mon Sep 17 00:00:00 2001
From: dhalmazna <dhalmazna@seznam.cz>
Date: Mon, 16 Mar 2026 08:48:14 +0100
Subject: [PATCH 1/6] feat: implement the lookahead algorithm

---
 README.md                   |   4 +-
 ciao/algorithm/lookahead.py | 193 ++++++++++++++++++++++++++++++++++++
 2 files changed, 195 insertions(+), 2 deletions(-)
 create mode 100644 ciao/algorithm/lookahead.py

diff --git a/README.md b/README.md
index e75e36f..eb4464f 100644
--- a/README.md
+++ b/README.md
@@ -69,7 +69,7 @@ uv run python -m ciao
 - **MC-RAVE**: MCTS with Rapid Action Value Estimation
 - **MCGS (Monte Carlo Graph Search)**: Graph-based variant allowing revisiting of states
 - **MCGS-RAVE**: MCGS with RAVE enhancements
-- **Lookahead**: Greedy search with lookahead using efficient bitset operations
+- **Lookahead**: Greedy search with lookahead
 - **Potential**: Potential field-guided sequential search
 
 ### Segmentation Methods
@@ -92,7 +92,7 @@ ciao/
 │   ├── algorithm/                  # Search algorithms and data structures
 │   │   ├── mcts.py                 # Monte Carlo Tree Search
 │   │   ├── mcgs.py                 # Monte Carlo Graph Search
-│   │   ├── lookahead_bitset.py     # Greedy lookahead with bitsets
+│   │   ├── lookahead.py            # Greedy lookahead
 │   │   ├── potential.py            # Potential-based search
 │   │   ├── bitmask_graph.py        # Bitset operations for hyperpixels
 │   │   ├── nodes.py                # Node classes for tree/graph search
diff --git a/ciao/algorithm/lookahead.py b/ciao/algorithm/lookahead.py
new file mode 100644
index 0000000..7981f8f
--- /dev/null
+++ b/ciao/algorithm/lookahead.py
@@ -0,0 +1,193 @@
+"""Greedy lookahead hyperpixel building with bitmask operations.
+
+Rolling horizon strategy: Look ahead multiple steps but only commit one step at a time.
+"""
+
+import logging
+from collections import deque
+
+import numpy as np
+import torch
+
+from ciao.algorithm.bitmask_graph import (
+    add_node,
+    get_frontier,
+    iter_bits,
+    mask_to_ids,
+)
+from ciao.model.predictor import ModelPredictor
+from ciao.scoring.hyperpixel import calculate_hyperpixel_deltas
+
+
+logger = logging.getLogger(__name__)
+
+
+def build_hyperpixel_greedy_lookahead(
+    predictor: ModelPredictor,
+    input_batch: torch.Tensor,
+    segments: np.ndarray,
+    replacement_image: torch.Tensor,
+    adj_masks: tuple[int, ...],
+    target_class_idx: int,
+    seed_idx: int,
+    desired_length: int,
+    lookahead_distance: int,
+    optimization_sign: int,
+    used_mask: int,
+    batch_size: int = 64,
+) -> dict[str, object]:
+    """Build a single hyperpixel using greedy lookahead with rolling horizon.
+
+    Strategy: Look ahead up to lookahead_distance steps, evaluate all candidates,
+    but only commit the first step of the best path found.
+
+    Args:
+        predictor: Model predictor
+        input_batch: Preprocessed image
+        segments: Segmentation map
+        replacement_image: Replacement tensor [C, H, W]
+        adj_masks: Adjacency bitmasks
+        target_class_idx: Target class
+        seed_idx: Starting segment
+        desired_length: Target hyperpixel size
+        lookahead_distance: How many steps to look ahead (1=greedy, 2+=lookahead)
+        optimization_sign: +1 to maximize, -1 to minimize
+        used_mask: Globally excluded segments
+        batch_size: Batch size for evaluation
+
+    Returns:
+        Dict with segments, sign, score, final mask, and stats
+    """
+    current_mask = add_node(0, seed_idx)
+    total_evaluations = 0
+    num_steps = 0
+
+    logger.info(f"Starting greedy lookahead from seed {seed_idx}")
+
+    # Grow hyperpixel one step at a time
+    while current_mask.bit_count() < desired_length:
+        num_steps += 1
+        current_size = current_mask.bit_count()
+
+        # Generate all candidate masks via BFS up to lookahead_distance
+        candidates = _generate_lookahead_candidates(
+            current_mask=current_mask,
+            adj_masks=adj_masks,
+            used_mask=used_mask,
+            lookahead_distance=lookahead_distance,
+            desired_length=desired_length,
+        )
+
+        if not candidates:
+            logger.info(
+                f"Step {num_steps}: No candidates available, stopping at size {current_size}"
+            )
+            break
+
+        logger.debug(
+            f"Step {num_steps}: Size={current_size}/{desired_length}, evaluating {len(candidates)} candidates"
+        )
+
+        # Batch evaluate all candidates
+        candidate_masks = list(candidates.keys())
+        segment_id_lists = [mask_to_ids(mask) for mask in candidate_masks]
+        total_evaluations += len(candidate_masks)
+
+        scores_list = calculate_hyperpixel_deltas(
+            predictor=predictor,
+            input_batch=input_batch,
+            segments=segments,
+            hyperpixel_segment_ids_list=segment_id_lists,
+            replacement_image=replacement_image,
+            target_class_idx=target_class_idx,
+            batch_size=batch_size,
+        )
+
+        # Find best candidate (maximize optimization_sign * score)
+        best_idx = max(
+            range(len(scores_list)), key=lambda i: scores_list[i] * optimization_sign
+        )
+        best_mask = candidate_masks[best_idx]
+        best_score = scores_list[best_idx]
+        first_step = candidates[best_mask]
+
+        logger.debug(
+            f"Step {num_steps}: Best lookahead candidate score={best_score:.4f}, adding segment {first_step}"
+        )
+
+        # Commit only the first step
+        # (it is an open question whether we should add only the first step or the entire best_mask)
+        current_mask = add_node(current_mask, first_step)
+
+    # Re-evaluate the final built mask to get its exact score
+    # (since the last loop might have evaluated a lookahead candidate, not the exact current_mask)
+    final_segments = mask_to_ids(current_mask)
+    final_score = calculate_hyperpixel_deltas(
+        predictor=predictor,
+        input_batch=input_batch,
+        segments=segments,
+        hyperpixel_segment_ids_list=[final_segments],
+        replacement_image=replacement_image,
+        target_class_idx=target_class_idx,
+        batch_size=1,
+    )[0]
+    total_evaluations += 1
+
+    logger.info(
+        f"Built hyperpixel with {len(final_segments)} segments, final exact score={final_score:.4f}"
+    )
+
+    return {
+        "mask": current_mask,
+        "segments": final_segments,
+        "sign": optimization_sign,
+        "score": final_score,
+        "size": len(final_segments),
+        "stats": {
+            "total_evaluations": total_evaluations,
+        },
+    }
+
+
+def _generate_lookahead_candidates(
+    current_mask: int,
+    adj_masks: tuple[int, ...],
+    used_mask: int,
+    lookahead_distance: int,
+    desired_length: int,
+) -> dict[int, int]:
+    """Generate all connected supersets up to lookahead_distance steps via BFS.
+
+    Returns:
+        Dict mapping candidate_mask -> first_step_segment_id
+    """
+    candidates: dict[int, int] = {}  # mask -> first_step
+
+    # Queue stores tuples of: (current_mask, first_step_that_led_here, current_depth)
+    queue: deque[tuple[int, int | None, int]] = deque([(current_mask, None, 0)])
+    visited = {current_mask}
+
+    while queue:
+        mask, first_step, depth = queue.popleft()
+
+        # Store valid candidates (depth > 0)
+        if depth > 0 and first_step is not None and mask not in candidates:
+            # Only add if not already seen (shortest path wins)
+            candidates[mask] = first_step
+
+        # Stop expanding if we reached the lookahead limit or maximum size
+        if depth >= lookahead_distance or mask.bit_count() >= desired_length:
+            continue
+
+        frontier = get_frontier(mask, adj_masks, used_mask)
+        for seg_id in iter_bits(frontier):
+            new_mask = add_node(mask, seg_id)
+
+            if new_mask not in visited:
+                visited.add(new_mask)
+                # If at the first layer (depth 0), this seg_id is our first_step.
+                # Otherwise, pass along the first_step inherited from the parent.
+                next_first_step = seg_id if depth == 0 else first_step
+                queue.append((new_mask, next_first_step, depth + 1))
+
+    return candidates

From bf545fd2d6ec5b29d8842089991ef054dbcf7c59 Mon Sep 17 00:00:00 2001
From: dhalmazna <dhalmazna@seznam.cz>
Date: Mon, 16 Mar 2026 09:14:07 +0100
Subject: [PATCH 2/6] chore: edit the __init__.py file for the algorithm folder

---
 ciao/algorithm/__init__.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/ciao/algorithm/__init__.py b/ciao/algorithm/__init__.py
index 4552852..ad85bd9 100644
--- a/ciao/algorithm/__init__.py
+++ b/ciao/algorithm/__init__.py
@@ -10,13 +10,13 @@
     remove_node,
     sample_connected_superset,
 )
+from ciao.algorithm.lookahead import build_hyperpixel_greedy_lookahead
 from ciao.algorithm.search_helpers import evaluate_masks, is_terminal
 
 
 __all__ = [
-    # Bitmask graph utilities
     "add_node",
-    # Shared MCTS/MCGS utilities
+    "build_hyperpixel_greedy_lookahead",
     "evaluate_masks",
     "get_frontier",
     "has_node",

From f39e384467cc3c0df741187b80db71d78b791c32 Mon Sep 17 00:00:00 2001
From: dhalmazna <dhalmazna@seznam.cz>
Date: Mon, 16 Mar 2026 13:33:58 +0100
Subject: [PATCH 3/6] feat: update hyperpixel result type

---
 ciao/algorithm/lookahead.py |  4 ++--
 ciao/scoring/hyperpixel.py  | 19 ++++++++++++++++---
 2 files changed, 18 insertions(+), 5 deletions(-)

diff --git a/ciao/algorithm/lookahead.py b/ciao/algorithm/lookahead.py
index 7981f8f..3cc135c 100644
--- a/ciao/algorithm/lookahead.py
+++ b/ciao/algorithm/lookahead.py
@@ -16,7 +16,7 @@
     mask_to_ids,
 )
 from ciao.model.predictor import ModelPredictor
-from ciao.scoring.hyperpixel import calculate_hyperpixel_deltas
+from ciao.scoring.hyperpixel import HyperpixelResult, calculate_hyperpixel_deltas
 
 
 logger = logging.getLogger(__name__)
@@ -35,7 +35,7 @@ def build_hyperpixel_greedy_lookahead(
     optimization_sign: int,
     used_mask: int,
     batch_size: int = 64,
-) -> dict[str, object]:
+) -> HyperpixelResult:
     """Build a single hyperpixel using greedy lookahead with rolling horizon.
 
     Strategy: Look ahead up to lookahead_distance steps, evaluate all candidates,
diff --git a/ciao/scoring/hyperpixel.py b/ciao/scoring/hyperpixel.py
index 39c2580..105ecc8 100644
--- a/ciao/scoring/hyperpixel.py
+++ b/ciao/scoring/hyperpixel.py
@@ -1,9 +1,22 @@
+from typing import TypedDict
+
 import numpy as np
 import torch
 
 from ciao.model.predictor import ModelPredictor
 
 
+class HyperpixelResult(TypedDict):
+    """Type definition for the output of hyperpixel building algorithms."""
+
+    mask: np.ndarray
+    segments: list[int]
+    sign: int
+    score: float
+    size: int
+    stats: dict[str, object]
+
+
 def calculate_hyperpixel_deltas(
     predictor: ModelPredictor,
     input_batch: torch.Tensor,
@@ -105,11 +118,11 @@ def calculate_hyperpixel_deltas(
 
 
 def select_top_hyperpixels(
-    hyperpixels: list[dict[str, object]], max_hyperpixels: int = 10
-) -> list[dict[str, object]]:
+    hyperpixels: list[HyperpixelResult], max_hyperpixels: int = 10
+) -> list[HyperpixelResult]:
     """Select top hyperpixels by their primary algorithm-specific score."""
     return sorted(
         hyperpixels,
-        key=lambda hp: abs(hp["hyperpixel_score"]),  # type: ignore[arg-type]
+        key=lambda hp: abs(hp["score"]),
         reverse=True,
     )[:max_hyperpixels]

From 0f58aa612de5844ede8412b1eeb8a977acbd886e Mon Sep 17 00:00:00 2001
From: dhalmazna <dhalmazna@seznam.cz>
Date: Mon, 16 Mar 2026 13:43:52 +0100
Subject: [PATCH 4/6] fix: correct type definition for mask in HyperpixelResult

---
 ciao/algorithm/lookahead.py | 3 ++-
 ciao/scoring/hyperpixel.py  | 2 +-
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/ciao/algorithm/lookahead.py b/ciao/algorithm/lookahead.py
index 3cc135c..1774b34 100644
--- a/ciao/algorithm/lookahead.py
+++ b/ciao/algorithm/lookahead.py
@@ -137,7 +137,7 @@ def build_hyperpixel_greedy_lookahead(
         f"Built hyperpixel with {len(final_segments)} segments, final exact score={final_score:.4f}"
     )
 
-    return {
+    result: HyperpixelResult = {
         "mask": current_mask,
         "segments": final_segments,
         "sign": optimization_sign,
@@ -147,6 +147,7 @@ def build_hyperpixel_greedy_lookahead(
             "total_evaluations": total_evaluations,
         },
     }
+    return result
 
 
 def _generate_lookahead_candidates(
diff --git a/ciao/scoring/hyperpixel.py b/ciao/scoring/hyperpixel.py
index 105ecc8..2bcd8c2 100644
--- a/ciao/scoring/hyperpixel.py
+++ b/ciao/scoring/hyperpixel.py
@@ -9,7 +9,7 @@
 class HyperpixelResult(TypedDict):
     """Type definition for the output of hyperpixel building algorithms."""
 
-    mask: np.ndarray
+    mask: int
     segments: list[int]
     sign: int
     score: float

From 4f1e5eaf767af425b82db4f4a44a2bb0ed86a1e1 Mon Sep 17 00:00:00 2001
From: dhalmazna <dhalmazna@seznam.cz>
Date: Mon, 16 Mar 2026 16:46:37 +0100
Subject: [PATCH 5/6] feat: enhance lookahead algorithm with known final score
 optimization

---
 ciao/algorithm/lookahead.py | 40 ++++++++++++++++++++++++++-----------
 1 file changed, 28 insertions(+), 12 deletions(-)

diff --git a/ciao/algorithm/lookahead.py b/ciao/algorithm/lookahead.py
index 1774b34..5e6df09 100644
--- a/ciao/algorithm/lookahead.py
+++ b/ciao/algorithm/lookahead.py
@@ -59,6 +59,7 @@ def build_hyperpixel_greedy_lookahead(
         Dict with segments, sign, score, final mask, and stats
     """
     current_mask = add_node(0, seed_idx)
+    known_final_score: float | None = None
     total_evaluations = 0
     num_steps = 0
 
@@ -111,6 +112,15 @@ def build_hyperpixel_greedy_lookahead(
         best_score = scores_list[best_idx]
         first_step = candidates[best_mask]
 
+        # Shortcut: best candidate is full-size, so commit it whole and reuse its score
+        if best_mask.bit_count() == desired_length:
+            current_mask = best_mask
+            known_final_score = best_score
+            logger.debug(
+                f"Step {num_steps}: Lookahead reached desired length, committing entire path."
+            )
+            break
+
         logger.debug(
             f"Step {num_steps}: Best lookahead candidate score={best_score:.4f}, adding segment {first_step}"
         )
@@ -119,19 +129,25 @@ def build_hyperpixel_greedy_lookahead(
         # (it is an open question whether we should add only the first step or the entire best_mask)
         current_mask = add_node(current_mask, first_step)
 
-    # Re-evaluate the final built mask to get its exact score
-    # (since the last loop might have evaluated a lookahead candidate, not the exact current_mask)
     final_segments = mask_to_ids(current_mask)
-    final_score = calculate_hyperpixel_deltas(
-        predictor=predictor,
-        input_batch=input_batch,
-        segments=segments,
-        hyperpixel_segment_ids_list=[final_segments],
-        replacement_image=replacement_image,
-        target_class_idx=target_class_idx,
-        batch_size=1,
-    )[0]
-    total_evaluations += 1
+
+    # Reuse the score if the loop committed an already-scored full-size mask.
+    # Otherwise (dead end, or the loop never ran) no score for the exact
+    # current_mask is on hand: best_score may belong to a larger candidate.
+    if known_final_score is not None:
+        final_score = known_final_score
+    else:
+        logger.debug("Dead end reached. Re-evaluating the exact final mask.")
+        final_score = calculate_hyperpixel_deltas(
+            predictor=predictor,
+            input_batch=input_batch,
+            segments=segments,
+            hyperpixel_segment_ids_list=[final_segments],
+            replacement_image=replacement_image,
+            target_class_idx=target_class_idx,
+            batch_size=1,
+        )[0]
+        total_evaluations += 1
 
     logger.info(
         f"Built hyperpixel with {len(final_segments)} segments, final exact score={final_score:.4f}"

From 33727dd3fb9f213e3b953b92b898a7197c188a78 Mon Sep 17 00:00:00 2001
From: dhalmazna <dhalmazna@seznam.cz>
Date: Mon, 16 Mar 2026 17:05:37 +0100
Subject: [PATCH 6/6] feat: add docstring for lookahead candidate generation
 function

---
 ciao/algorithm/lookahead.py | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/ciao/algorithm/lookahead.py b/ciao/algorithm/lookahead.py
index 5e6df09..b50b29d 100644
--- a/ciao/algorithm/lookahead.py
+++ b/ciao/algorithm/lookahead.py
@@ -175,6 +175,13 @@ def _generate_lookahead_candidates(
 ) -> dict[int, int]:
     """Generate all connected supersets up to lookahead_distance steps via BFS.
 
+    Args:
+        current_mask: Bitmask of the currently built hyperpixel.
+        adj_masks: Tuple of adjacency bitmasks for each segment in the image.
+        used_mask: Bitmask of globally excluded or already used segments.
+        lookahead_distance: Maximum depth for the BFS expansion.
+        desired_length: Maximum allowed total size of the candidate mask.
+
     Returns:
         Dict mapping candidate_mask -> first_step_segment_id
     """