feature: Condenser Interface and Defaults #5306
Merged: xingyaoww merged 109 commits into All-Hands-AI:main from csmith49:feature/condenser-refactor on Jan 7, 2025.
Commits (109 total; changes shown from 62 commits)
d35a06e
refactor: Implement condenser configuration system
openhands-agent c6bc242
Fix condenser config and event creation issues
openhands-agent d0bc171
refactor: Move condenser config to core/config and improve env var ha…
openhands-agent 8b9b52d
fixing up unit tests and type hints
10d5fc6
restoring utils file
6489787
splitting failing config unit tests
3f4af37
removing TOML-setting of condensers
39e6c3d
refactor: Implement condenser configuration system
openhands-agent 1088537
Fix condenser config and event creation issues
openhands-agent 4e63c7f
refactor: Move condenser config to core/config and improve env var ha…
openhands-agent b53f4b6
fixing up unit tests and type hints
190d6ae
restoring utils file
a07a615
splitting failing config unit tests
a550833
removing TOML-setting of condensers
14c8f1d
condenser config basemodel -> dataclass
5e05564
extending condenser output with support for metadata
1a3482c
condensation metadata utility functions
b8544ef
llm condenser metrics
3dc9245
merging
2a059c8
configuration and metrics for all condensers
fe6ed05
adding keep_first flag to reduce condenser
4343b8d
recent events condenser can keep arbitrary initial values
c0b1230
adding some evaluation scripts
4ce8594
uploading some exp data
1d97831
Add cactus plots for token usage and history length analysis
openhands-agent 52193c4
feat(evaluation): Add graph generation script
openhands-agent 2bff3bc
refactor(evaluation): Improve plot_graphs.py
openhands-agent 83070df
feat(evaluation): Add browser renderer option
openhands-agent 3b779a2
Merge branch 'main' into feature/condenser-refactor
402906f
Refactor Condenser to work directly with State objects
openhands-agent 9ecf5aa
Merge branch 'feature/condenser-refactor' of github.com:csmith49/Open…
e49e84d
Add AmortizedForgettingCondenser framework
openhands-agent b6dff1f
Implement AmortizedForgettingCondenser
openhands-agent 523dee2
Merge branch 'feature/condenser-refactor' of github.com:csmith49/Open…
8c87d70
Add keep_first parameter to AmortizedForgettingCondenser
openhands-agent 4381307
Add event tracking to AmortizedForgettingCondenser
openhands-agent f2b9d07
feat: Add LLMAttentionCondenser with NotImplementedError placeholder
openhands-agent d64edf8
Implement LLMAttentionCondenser with state maintenance and LLM config…
openhands-agent e169d8a
Merge branch 'main' into feature/condenser-refactor
14873ad
fixing forgetting condensers and tests
18b8b17
fixing condenser tests
85885b9
minor
d74b5f6
cleaning up accidental experimental files
36dff26
Merge branch 'main' into feature/condenser-refactor
csmith49 d189f73
fixes to llm attention condenser
0dee6eb
Merge branch 'feature/condenser-refactor' of github.com:csmith49/Open…
b28d319
failing unit tests added
b6f6190
unit tests passing with event id added
2558fad
unit tests passing with event id added
bfa80cb
minor condenser entrypoint refactor
940d85e
cleaning up condenser metadata management
756bedb
doc string pass
6e263b8
observation-masking condenser
1daedff
fixing llm attention
d6f9906
fixing observation masking tests
909e847
fixing eval scripts
716f665
Merge branch 'main' into feature/condenser-refactor
5e29ebc
fixing lock
c20e811
fixing prompt caching tests
a96551c
Merge branch 'main' into feature/condenser-refactor
csmith49 68d1bff
Merge branch 'main' into feature/condenser-refactor
csmith49 219994d
safe dumping of llm-based condenser config
b69cd15
asdf
5c0704f
failing test for mismatched tool calls
006a5fd
mismatched tool call tests passing
32eccc9
refactoring test
8825d03
Merge branch 'main' into feature/condenser-refactor
csmith49 8dc834f
llm attention validation and test
5ec51e1
Merge branch 'feature/condenser-refactor' of github.com:csmith49/Open…
7aa7a24
Merge branch 'main' into feature/condenser-refactor
csmith49 e3bfd63
moving condenser observations
b587499
Merge branch 'feature/condenser-refactor' of github.com:csmith49/Open…
453ce82
condensation observation -> agent condensation observation
35bb405
Merge branch 'main' into feature/condenser-refactor
csmith49 de10aeb
fix broken imports
d3c9794
Merge branch 'feature/condenser-refactor' of github.com:csmith49/Open…
1e98db6
Merge branch 'main' into feature/condenser-refactor
csmith49 b4d4680
fixing response format detection
66ae8a3
Merge branch 'feature/condenser-refactor' of github.com:csmith49/Open…
0e6cea7
Resolve merge conflicts with main branch
openhands-agent c1c7881
Fix pyproject.toml formatting
openhands-agent 06ef4cc
Update poetry.lock
openhands-agent 1bd5310
Merge branch 'main' into feature/condenser-refactor
csmith49 c26f9dc
updating docs and field constraints
185421c
fixing bad llm config in condenser tests
124c327
Merge branch 'main' into feature/condenser-refactor
csmith49 8a65f96
get metrics functionality in eval utils
13feeb1
Merge branch 'feature/condenser-refactor' of github.com:csmith49/Open…
4565b54
Merge branch 'main' into feature/condenser-refactor
csmith49 ef03f98
Merge branch 'main' into feature/condenser-refactor
csmith49 c21f254
Merge branch 'main' into feature/condenser-refactor
csmith49 0a7646d
Merge branch 'main' into feature/condenser-refactor
csmith49 2a0f843
add condensation obs to be deserialized when restoring session
enyst f2bdd07
Merge branch 'main' of github.com:All-Hands-AI/OpenHands into feature…
enyst ce5dfc1
Merge branch 'main' into feature/condenser-refactor
enyst d6acd03
poetry lock
enyst c73e422
Merge branch 'main' into feature/condenser-refactor
enyst 7171a31
Merge branch 'main' into feature/condenser-refactor
enyst f9ff522
Merge branch 'main' into feature/condenser-refactor
csmith49 cddd0e7
Merge branch 'main' into feature/condenser-refactor
csmith49 d80a68c
Merge branch 'main' into feature/condenser-refactor
csmith49 5beba03
Merge branch 'main' into feature/condenser-refactor
csmith49 c6acf01
Merge branch 'main' into feature/condenser-refactor
csmith49 1f88c06
Merge branch 'main' into feature/condenser-refactor
csmith49 cdb2c4b
Merge branch 'main' into feature/condenser-refactor
csmith49 956251f
Merge branch 'main' into feature/condenser-refactor
csmith49 47fb5e7
Merge branch 'main' into feature/condenser-refactor
csmith49 3261db3
updating lock file
01caf68
Merge branch 'main' into feature/condenser-refactor
csmith49
@@ -17,6 +17,10 @@
from openhands.controller.state.state import State
from openhands.core.config import LLMConfig
from openhands.core.config.condenser_config import (
    CondenserConfig,
    NoOpCondenserConfig,
)
from openhands.core.exceptions import (
    AgentRuntimeBuildError,
    AgentRuntimeDisconnectedError,
@@ -45,18 +49,29 @@ class EvalMetadata(BaseModel):
    dataset: str | None = None
    data_split: str | None = None
    details: dict[str, Any] | None = None
    condenser_config: CondenserConfig | None = None

    def model_dump(self, *args, **kwargs):
        dumped_dict = super().model_dump(*args, **kwargs)
        # avoid leaking sensitive information
        dumped_dict['llm_config'] = self.llm_config.to_safe_dict()
        if hasattr(self.condenser_config, 'llm_config'):
            dumped_dict['condenser_config']['llm_config'] = (
                self.condenser_config.llm_config.to_safe_dict()
            )

        return dumped_dict

    def model_dump_json(self, *args, **kwargs):
        dumped = super().model_dump_json(*args, **kwargs)
        dumped_dict = json.loads(dumped)
        # avoid leaking sensitive information
        dumped_dict['llm_config'] = self.llm_config.to_safe_dict()
        if hasattr(self.condenser_config, 'llm_config'):
            dumped_dict['condenser_config']['llm_config'] = (
                self.condenser_config.llm_config.to_safe_dict()
            )

        logger.debug(f'Dumped metadata: {dumped_dict}')
        return json.dumps(dumped_dict)
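For intuition about the hasattr guard above, a minimal sketch, assuming only the config classes visible in this PR (the API key value is a dummy for illustration):

from openhands.core.config import LLMConfig
from openhands.core.config.condenser_config import (
    LLMSummarizingCondenserConfig,
    NoOpCondenserConfig,
)

llm = LLMConfig(model='gpt-4o', api_key='not-a-real-key')  # dummy key, illustration only

# Only the LLM-backed condenser configs carry an llm_config attribute, so the
# hasattr() check above scrubs nested secrets for them and is a no-op otherwise.
for cfg in (NoOpCondenserConfig(), LLMSummarizingCondenserConfig(llm_config=llm)):
    print(type(cfg).__name__, hasattr(cfg, 'llm_config'))
# NoOpCondenserConfig False
# LLMSummarizingCondenserConfig True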
@@ -192,6 +207,7 @@ def make_metadata(
    eval_output_dir: str,
    data_split: str | None = None,
    details: dict[str, Any] | None = None,
    condenser_config: CondenserConfig | None = None,
) -> EvalMetadata:
    model_name = llm_config.model.split('/')[-1]
    model_path = model_name.replace(':', '_').replace('@', '-')
@@ -222,6 +238,9 @@
        dataset=dataset_name,
        data_split=data_split,
        details=details,
        condenser_config=condenser_config
        if condenser_config
        else NoOpCondenserConfig(),
    )
    metadata_json = metadata.model_dump_json()
    logger.info(f'Metadata: {metadata_json}')

Review comment on lines +242 to +244: I think that this probably won't pass linting, so you should make sure that you have pre-commit config installed to auto-lint before committing.
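For context, a hedged sketch of how an evaluation script might thread a condenser into its metadata. Only condenser_config and the fallback to NoOpCondenserConfig() come from this diff; the remaining keyword arguments to make_metadata and its import path are assumptions for illustration:

from openhands.core.config import LLMConfig
from openhands.core.config.condenser_config import RecentEventsCondenserConfig
from evaluation.utils.shared import make_metadata  # assumed location of the helper above

metadata = make_metadata(
    llm_config=LLMConfig(model='gpt-4o'),
    dataset_name='example-benchmark',  # hypothetical values, illustration only
    agent_class='CodeActAgent',
    max_iterations=30,
    eval_note=None,
    eval_output_dir='evaluation/outputs',
    condenser_config=RecentEventsCondenserConfig(keep_first=1, max_events=20),
)
# Omitting condenser_config falls back to NoOpCondenserConfig(), per the hunk above.
print(metadata.model_dump_json())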
@@ -0,0 +1,88 @@
from typing import Literal

from pydantic import BaseModel, Field

from openhands.core.config.llm_config import LLMConfig


class NoOpCondenserConfig(BaseModel):
    """Configuration for NoOpCondenser."""

    type: Literal['noop'] = Field('noop')


class ObservationMaskingCondenserConfig(BaseModel):
    """Configuration for ObservationMaskingCondenser."""

    type: Literal['observation_masking'] = Field('observation_masking')
    attention_window: int = Field(
        default=10,
        description='The number of most-recent events where observations will not be masked.',
    )


class RecentEventsCondenserConfig(BaseModel):
    """Configuration for RecentEventsCondenser."""

    type: Literal['recent'] = Field('recent')
    keep_first: int = Field(
        default=0,
        description='The number of initial events to condense.',
    )
    max_events: int = Field(
        default=10, description='Maximum number of events to keep.', ge=1
    )


class LLMSummarizingCondenserConfig(BaseModel):
    """Configuration for LLMCondenser."""

    type: Literal['llm'] = Field('llm')
    llm_config: LLMConfig = Field(
        ..., description='Configuration for the LLM to use for condensing.'
    )


class AmortizedForgettingCondenserConfig(BaseModel):
    """Configuration for AmortizedForgettingCondenser."""

    type: Literal['amortized'] = Field('amortized')
    max_size: int = Field(
        default=100,
        description='Maximum size of the condensed history before triggering forgetting.',
        ge=2,
    )
    keep_first: int = Field(
        default=0,
        description='Number of initial events to always keep in history.',
        ge=0,
    )


class LLMAttentionCondenserConfig(BaseModel):
    """Configuration for LLMAttentionCondenser."""

    type: Literal['llm_attention'] = Field('llm_attention')
    llm_config: LLMConfig = Field(
        ..., description='Configuration for the LLM to use for attention.'
    )
    max_size: int = Field(
        default=100,
        description='Maximum size of the condensed history before triggering forgetting.',
        ge=2,
    )
    keep_first: int = Field(
        default=0,
        description='Number of initial events to always keep in history.',
        ge=0,
    )


CondenserConfig = (
    NoOpCondenserConfig
    | ObservationMaskingCondenserConfig
    | RecentEventsCondenserConfig
    | LLMSummarizingCondenserConfig
    | AmortizedForgettingCondenserConfig
    | LLMAttentionCondenserConfig
)
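Since each variant pins a distinct type literal, the union can be validated from plain data (for example, a condenser section loaded from TOML or JSON). A minimal sketch, assuming pydantic v2's TypeAdapter rather than any helper from this PR:

from pydantic import TypeAdapter

from openhands.core.config.condenser_config import CondenserConfig

raw = {'type': 'amortized', 'max_size': 40, 'keep_first': 2}
# The 'type' literal selects the matching variant of the union.
config = TypeAdapter(CondenserConfig).validate_python(raw)
print(type(config).__name__)  # AmortizedForgettingCondenserConfig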
@@ -1,4 +1,4 @@
-from openhands.memory.condenser import MemoryCondenser
+from openhands.memory.condenser import Condenser
 from openhands.memory.memory import LongTermMemory

-__all__ = ['LongTermMemory', 'MemoryCondenser']
+__all__ = ['LongTermMemory', 'Condenser']
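Downstream code now imports the renamed interface; a small sketch, assuming the Condenser.from_config factory added elsewhere in this PR (not shown in this hunk):

from openhands.core.config.condenser_config import ObservationMaskingCondenserConfig
from openhands.memory import Condenser  # MemoryCondenser is no longer exported

# Assumed factory: maps each config variant to its condenser implementation.
condenser = Condenser.from_config(ObservationMaskingCondenserConfig(attention_window=5))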
Review comment: Could this line be moved inside state.metrics.get()? Then we wouldn't have to copy-paste it into every evaluation benchmark separately.

Reply: Not quite so directly: the condenser metrics are stored on the state, but the .get() here is on the metrics object held by the state. We can clean it up with a state.get_metrics() function though. EDIT: Never mind, that introduces a circular import between the condensers and the state that isn't easy to break. Maybe the get_metrics() should just be a function in evaluation/utils/shared.py.
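For what the thread converges on, a hedged sketch of such a helper in evaluation/utils/shared.py. The state.metrics.get() call is taken from the discussion above, and get_condensation_metadata refers to the "condensation metadata utility functions" commit in this PR; neither signature is shown in this excerpt:

from typing import Any

from openhands.controller.state.state import State
from openhands.memory.condenser import get_condensation_metadata  # assumed utility from this PR


def get_metrics(state: State) -> dict[str, Any]:
    """Combine the agent's LLM metrics with condensation metadata stored on the state."""
    metrics = state.metrics.get() if state.metrics else {}
    metrics['condenser'] = get_condensation_metadata(state)
    return metrics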