SkyDiscover/adaevolve

AdaEvolve

Hierarchical adaptive search: G-signal exploration intensity, UCB island allocation, and LLM meta-guidance on stagnation.

Test-time search · Apache-2.0

"""AdaEvolve Memory component — Level-3 paradigm (solution-tactics) state. One file per component (see scaffold.py). Faithful port of SkyDiscover's ``ParadigmTracker`` (search/adaevolve/paradigm/tracker.py) behind the :class:`~galapagos.components.memory.Memory` interface. Per the reference code (not the paper), stagnation is the *windowed improvement rate*: the binary window (size 10) of "did this admitted child set a new global best" is full, no active non-exhausted paradigm exists, and the rate is below 0.12 — not "G ≤ τ_M for all islands". Memory interface mapping: * ``read()`` → the active paradigm's "## BREAKTHROUGH IDEA" injection block (or ``""``), consumed by the PromptBuilder. * ``read({"spec": "tried"})`` → the formatted previously-tried ideas with SUCCESS/FAILED outcomes, fed back to the paradigm generator. * ``write(_, kind="improvement", improved=..., best_score=...)`` → one improvement-window tick (the open mirror of ``record_improvement``). * ``write(_, kind="paradigms", paradigms=[...], best_score=...)`` → install a fresh paradigm set (``set_paradigms``), archiving outgoing used paradigms with their outcome. The rotation/usage methods (:meth:`use_paradigm`, :meth:`has_active_paradigm`, :meth:`is_stagnating`) are concrete extras called by the scaffold. """ from __future__ import annotations from ...components.memory import Memory _PARADIGM_BLOCK = """## BREAKTHROUGH IDEA - IMPLEMENT THIS The search has stagnated globally. 
You MUST implement this breakthrough idea: **IDEA:** {idea} **HOW TO IMPLEMENT:** {description} **TARGET METRIC:** {what_to_optimize} **CAUTIONS:** {cautions} **APPROACH TYPE:** {approach_type} **CRITICAL:** - You MUST implement the breakthrough idea - Ensure the paradigm is actually used in your implementation (not just mentioned in comments) - Correctness is essential - your implementation must be correct and functional - Verify output format matches evaluator requirements - Make purposeful changes that implement the idea - Test your implementation logic carefully""" class AdaEvolveParadigmMemory(Memory): """``ParadigmTracker``: bounded binary improvement window, paradigm rotation with bounded uses, and an outcome-annotated history of tried ideas.""" def __init__(self, window_size: int = 10, improvement_threshold: float = 0.12, max_uses: int = 2, max_tried: int = 10, num_to_generate: int = 3): self.window_size = int(window_size) self.improvement_threshold = float(improvement_threshold) self.max_uses = int(max_uses) self.max_tried = int(max_tried) self.num_to_generate = int(num_to_generate) self.improvement_history: list[float] = [] # bounded binary window self.active_paradigms: list[dict] = [] self.usage_counts: list[int] = [] self.current_index = 0 self.tried_paradigms: list[str] = [] # bounded outcome history self.best_score_at_generation = 0.0 self.best_score_during = 0.0 # ---- Memory interface -------------------------------------------------------------------- def read(self, spec: dict | None = None) -> str: if spec and spec.get("spec") == "tried": return "\n".join(self.tried_paradigms) paradigm = self.current_paradigm() if paradigm is None: return "" return _PARADIGM_BLOCK.format( idea=paradigm.get("idea", ""), description=paradigm.get("description", ""), what_to_optimize=paradigm.get("what_to_optimize", ""), cautions=paradigm.get("cautions", ""), approach_type=paradigm.get("approach_type", ""), ) def write(self, knowledge: str, **meta) -> None: kind = 
meta.get("kind") if kind == "improvement": self.record_improvement(bool(meta.get("improved")), float(meta.get("best_score", 0.0))) elif kind == "paradigms": self.set_paradigms(list(meta.get("paradigms") or []), float(meta.get("best_score", 0.0))) # ---- ParadigmTracker port ------------------------------------------------------------------ def record_improvement(self, improved: bool, current_best_score: float) -> None: """One tick of the binary window — called once per admitted non-migrant child.""" self.improvement_history.append(1.0 if improved else 0.0) if len(self.improvement_history) > self.window_size: self.improvement_history.pop(0) if self.active_paradigms: # track the best score reached during the paradigms' tenure self.best_score_during = max(self.best_score_during, current_best_score) def get_improvement_rate(self) -> float: if not self.improvement_history: return 0.0 return sum(self.improvement_history) / len(self.improvement_history) def is_stagnating(self) -> bool: """Trigger condition: full window AND no active non-exhausted paradigm AND rate below the threshold (the reference-code divergence from the paper's G-based trigger).""" return (len(self.improvement_history) >= self.window_size and not self.has_active_paradigm() and self.get_improvement_rate() < self.improvement_threshold) def has_active_paradigm(self) -> bool: """True iff a non-exhausted paradigm exists (auto-rotates past exhausted ones).""" if not self.active_paradigms: return False if self.usage_counts[self.current_index] >= self.max_uses: self._rotate() return self.usage_counts[self.current_index] < self.max_uses def current_paradigm(self) -> dict | None: if not self.has_active_paradigm(): return None return self.active_paradigms[self.current_index] def use_paradigm(self) -> None: """Increment the current paradigm's usage, then rotate round-robin to the next non-exhausted paradigm.""" if not self.has_active_paradigm(): return self.usage_counts[self.current_index] += 1 self._rotate() def 
_rotate(self) -> None: """Round-robin past exhausted paradigms (may stay put if only the current has uses left).""" n = len(self.active_paradigms) for offset in range(1, n + 1): j = (self.current_index + offset) % n if self.usage_counts[j] < self.max_uses: self.current_index = j return def set_paradigms(self, paradigms: list[dict], current_best_score: float) -> None: """Install a fresh set; archive outgoing *used* paradigms with outcome SUCCESS iff the best score rose > 0.001 during their tenure (bounded history of ``max_tried``).""" improvement = self.best_score_during - self.best_score_at_generation for i, paradigm in enumerate(self.active_paradigms): if self.usage_counts[i] > 0: outcome = "SUCCESS" if improvement > 0.001 else "FAILED" self.tried_paradigms.append( f"{outcome}: {paradigm.get('approach_type', '?')} - {paradigm.get('idea', '?')}" f" (improvement: {improvement:+.4f})") self.tried_paradigms = self.tried_paradigms[-self.max_tried:] self.active_paradigms = list(paradigms) self.usage_counts = [0] * len(self.active_paradigms) self.current_index = 0 self.best_score_at_generation = current_best_score self.best_score_during = current_best_score def get_previously_tried_ideas(self) -> list[str]: return list(self.tried_paradigms)