TextualAgent
TextualAgent class
Full source code
"""
Extension of the `default.py` agent that uses Textual for an interactive TUI.
For a simpler version of an interactive UI that does not require threading and more, see `interactive.py`.
"""
import logging
import os
import re
import threading
import time
import traceback
from collections.abc import Iterable
from dataclasses import dataclass, field
from pathlib import Path
from typing import Literal
from rich.spinner import Spinner
from rich.text import Text
from textual.app import App, ComposeResult, SystemCommand
from textual.binding import Binding
from textual.containers import Container, Vertical, VerticalScroll
from textual.css.query import NoMatches
from textual.events import Key
from textual.screen import Screen
from textual.widgets import Footer, Header, Input, Static, TextArea
from minisweagent.agents.default import AgentConfig, DefaultAgent, NonTerminatingException, Submitted
@dataclass
class TextualAgentConfig(AgentConfig):
    mode: Literal["confirm", "yolo"] = "confirm"
    """Mode for action execution: 'confirm' requires user confirmation, 'yolo' executes immediately."""
    whitelist_actions: list[str] = field(default_factory=list)
    """Never confirm actions that match these regular expressions."""
    confirm_exit: bool = True
    """If the agent wants to finish, do we ask for confirmation from user?"""
class _TextualAgent(DefaultAgent):
    def __init__(self, app: "TextualAgent", *args, **kwargs):
        """Connects the DefaultAgent to the TextualApp."""
        self.app = app
        super().__init__(*args, config_class=TextualAgentConfig, **kwargs)
        self._current_action_from_human = False
    def add_message(self, role: str, content: str, **kwargs):
        super().add_message(role, content, **kwargs)
        if self.app.agent_state != "UNINITIALIZED":
            self.app.call_from_thread(self.app.on_message_added)
    def query(self) -> dict:
        if self.config.mode == "human":
            human_input = self.app.input_container.request_input("Enter your command:")
            self._current_action_from_human = True
            msg = {"content": f"\n```bash\n{human_input}\n```"}
            self.add_message("assistant", msg["content"])
            return msg
        self._current_action_from_human = False
        return super().query()
    def run(self, task: str, **kwargs) -> tuple[str, str]:
        try:
            exit_status, result = super().run(task, **kwargs)
        except Exception as e:
            result = str(e)
            self.app.call_from_thread(self.app.action_quit)
            print(traceback.format_exc())
            return "ERROR", result
        else:
            self.app.call_from_thread(self.app.on_agent_finished, exit_status, result)
        self.app.call_from_thread(self.app.action_quit)
        return exit_status, result
    def execute_action(self, action: dict) -> dict:
        if self.config.mode == "human" and not self._current_action_from_human:  # threading, grrrrr
            raise NonTerminatingException("Command not executed because user switched to manual mode.")
        if (
            self.config.mode == "confirm"
            and action["action"].strip()
            and not any(re.match(r, action["action"]) for r in self.config.whitelist_actions)
        ):
            result = self.app.input_container.request_input("Press ENTER to confirm or provide rejection reason")
            if result:  # Non-empty string means rejection
                raise NonTerminatingException(f"Command not executed: {result}")
        return super().execute_action(action)
    def has_finished(self, output: dict[str, str]):
        try:
            return super().has_finished(output)
        except Submitted as e:
            if self.config.confirm_exit:
                if new_task := self.app.input_container.request_input(
                    "[bold green]Agent wants to finish.[/bold green] "
                    "[green]Type a comment to give it a new task or press enter to quit.\n"
                ).strip():
                    raise NonTerminatingException(f"The user added a new task: {new_task}")
            raise e
class AddLogEmitCallback(logging.Handler):
    def __init__(self, callback):
        """Custom log handler that forwards messages via callback."""
        super().__init__()
        self.callback = callback
    def emit(self, record: logging.LogRecord):
        self.callback(record)  # type: ignore[attr-defined]
def _messages_to_steps(messages: list[dict]) -> list[list[dict]]:
    """Group messages into "pages" as shown by the UI."""
    steps = []
    current_step = []
    for message in messages:
        current_step.append(message)
        if message["role"] == "user":
            steps.append(current_step)
            current_step = []
    if current_step:
        steps.append(current_step)
    return steps
class SmartInputContainer(Container):
    def __init__(self, app: "TextualAgent"):
        """Smart input container supporting single-line and multi-line input modes."""
        super().__init__(classes="smart-input-container")
        self._app = app
        self._multiline_mode = False
        self.can_focus = True
        self.display = False
        self.pending_prompt: str | None = None
        self._input_event = threading.Event()
        self._input_result: str | None = None
        self._header_display = Static(id="input-header-display", classes="message-header input-request-header")
        self._hint_text = Static(classes="hint-text")
        self._single_input = Input(placeholder="Type your input...")
        self._multi_input = TextArea(show_line_numbers=False, classes="multi-input")
        self._input_elements_container = Vertical(
            self._header_display,
            self._hint_text,
            self._single_input,
            self._multi_input,
            classes="message-container",
        )
    def compose(self) -> ComposeResult:
        yield self._input_elements_container
    def on_mount(self) -> None:
        """Initialize the widget state."""
        self._multi_input.display = False
        self._update_mode_display()
    def on_focus(self) -> None:
        """Called when the container gains focus."""
        if self._multiline_mode:
            self._multi_input.focus()
        else:
            self._single_input.focus()
    def request_input(self, prompt: str) -> str:
        """Request input from user. Returns input text (empty string if confirmed without reason)."""
        self._input_event.clear()
        self._input_result = None
        self.pending_prompt = prompt
        self._header_display.update(prompt)
        self._update_mode_display()
        self._app.call_from_thread(self._app.update_content)
        self._input_event.wait()
        return self._input_result or ""
    def _complete_input(self, input_text: str):
        """Internal method to complete the input process."""
        self._input_result = input_text
        self.pending_prompt = None
        self.display = False
        self._single_input.value = ""
        self._multi_input.text = ""
        self._multiline_mode = False
        self._update_mode_display()
        self._app.agent_state = "RUNNING"
        self._app.update_content()
        # Reset scroll position to bottom since input container disappearing changes layout
        # somehow scroll_to doesn't work.
        self._app._vscroll.scroll_y = 0
        self._input_event.set()
    def action_toggle_mode(self) -> None:
        """Switch from single-line to multi-line mode (one-way only)."""
        if self.pending_prompt is None or self._multiline_mode:
            return
        self._multiline_mode = True
        self._update_mode_display()
        self.on_focus()
    def _update_mode_display(self) -> None:
        """Update the display based on current mode."""
        if self._multiline_mode:
            self._multi_input.text = self._single_input.value
            self._single_input.display = False
            self._multi_input.display = True
            self._hint_text.update(
                "[reverse][bold][$accent] Ctrl+D [/][/][/] to submit, [reverse][bold][$accent] Tab [/][/][/] to switch focus with other controls"
            )
        else:
            self._hint_text.update(
                "[reverse][bold][$accent] Enter [/][/][/] to submit, [reverse][bold][$accent] Ctrl+T [/][/][/] to switch to multi-line input, [reverse][bold][$accent] Tab [/][/][/] to switch focus with other controls",
            )
            self._multi_input.display = False
            self._single_input.display = True
    def on_input_submitted(self, event: Input.Submitted) -> None:
        """Handle single-line input submission."""
        if not self._multiline_mode:
            text = event.input.value.strip()
            self._complete_input(text)
    def on_key(self, event: Key) -> None:
        """Handle key events."""
        if event.key == "ctrl+t" and not self._multiline_mode:
            event.prevent_default()
            self.action_toggle_mode()
            return
        if self._multiline_mode and event.key == "ctrl+d":
            event.prevent_default()
            self._complete_input(self._multi_input.text.strip())
            return
        if event.key == "escape":
            event.prevent_default()
            self.can_focus = False
            self._app.set_focus(None)
            return
class TextualAgent(App):
    BINDINGS = [
        Binding("right,l", "next_step", "Step++", tooltip="Show next step of the agent"),
        Binding("left,h", "previous_step", "Step--", tooltip="Show previous step of the agent"),
        Binding("0", "first_step", "Step=0", tooltip="Show first step of the agent", show=False),
        Binding("$", "last_step", "Step=-1", tooltip="Show last step of the agent", show=False),
        Binding("j,down", "scroll_down", "Scroll down", show=False),
        Binding("k,up", "scroll_up", "Scroll up", show=False),
        Binding("q,ctrl+q", "quit", "Quit", tooltip="Quit the agent"),
        Binding("y,ctrl+y", "yolo", "YOLO mode", tooltip="Switch to YOLO Mode (LM actions will execute immediately)"),
        Binding(
            "c",
            "confirm",
            "CONFIRM mode",
            tooltip="Switch to Confirm Mode (LM proposes commands and you confirm/reject them)",
        ),
        Binding("u,ctrl+u", "human", "HUMAN mode", tooltip="Switch to Human Mode (you can now type commands directly)"),
        Binding("f1,question_mark", "toggle_help_panel", "Help", tooltip="Show help"),
    ]
    def __init__(self, model, env, **kwargs):
        css_path = os.environ.get("MSWEA_MINI_STYLE_PATH", str(Path(__file__).parent.parent / "config" / "mini.tcss"))
        self.__class__.CSS = Path(css_path).read_text()
        super().__init__()
        self.agent_state = "UNINITIALIZED"
        self.agent = _TextualAgent(self, model=model, env=env, **kwargs)
        self._i_step = 0
        self.n_steps = 1
        self.input_container = SmartInputContainer(self)
        self.log_handler = AddLogEmitCallback(lambda record: self.call_from_thread(self.on_log_message_emitted, record))
        logging.getLogger().addHandler(self.log_handler)
        self._spinner = Spinner("dots")
        self.exit_status: str = "ExitStatusUnset"
        self.result: str = ""
        self._vscroll = VerticalScroll()
    def run(self, task: str, **kwargs) -> tuple[str, str]:
        threading.Thread(target=lambda: self.agent.run(task, **kwargs), daemon=True).start()
        super().run()
        return self.exit_status, self.result
    # --- Basics ---
    @property
    def config(self):
        return self.agent.config
    @property
    def i_step(self) -> int:
        """Current step index."""
        return self._i_step
    @i_step.setter
    def i_step(self, value: int) -> None:
        """Set current step index, automatically clamping to valid bounds."""
        if value != self._i_step:
            self._i_step = max(0, min(value, self.n_steps - 1))
            self._vscroll.scroll_to(y=0, animate=False)
            self.update_content()
    def compose(self) -> ComposeResult:
        yield Header()
        with Container(id="main"):
            with self._vscroll:
                with Vertical(id="content"):
                    pass
                yield self.input_container
        yield Footer()
    def on_mount(self) -> None:
        self.agent_state = "RUNNING"
        self.update_content()
        self.set_interval(1 / 8, self._update_headers)
    @property
    def messages(self) -> list[dict]:
        return self.agent.messages
    @property
    def model(self):
        return self.agent.model
    @property
    def env(self):
        return self.agent.env
    # --- Reacting to events ---
    def on_message_added(self) -> None:
        auto_follow = self.i_step == self.n_steps - 1 and self._vscroll.scroll_y <= 1
        self.n_steps = len(_messages_to_steps(self.agent.messages))
        self.update_content()
        if auto_follow:
            self.action_last_step()
    def on_log_message_emitted(self, record: logging.LogRecord) -> None:
        """Handle log messages of warning level or higher by showing them as notifications."""
        if record.levelno >= logging.WARNING:
            self.notify(f"[{record.levelname}] {record.getMessage()}", severity="warning")
    def on_unmount(self) -> None:
        """Clean up the log handler when the app shuts down."""
        if hasattr(self, "log_handler"):
            logging.getLogger().removeHandler(self.log_handler)
    def on_agent_finished(self, exit_status: str, result: str):
        self.agent_state = "STOPPED"
        self.notify(f"Agent finished with status: {exit_status}")
        self.exit_status = exit_status
        self.result = result
        self.update_content()
    # --- UI update logic ---
    def update_content(self) -> None:
        container = self.query_one("#content", Vertical)
        container.remove_children()
        items = _messages_to_steps(self.agent.messages)
        if not items:
            container.mount(Static("Waiting for agent to start..."))
            return
        for message in items[self.i_step]:
            if isinstance(message["content"], list):
                content_str = "\n".join([item["text"] for item in message["content"]])
            else:
                content_str = str(message["content"])
            message_container = Vertical(classes="message-container")
            container.mount(message_container)
            role = message["role"].replace("assistant", "mini-swe-agent")
            message_container.mount(Static(role.upper(), classes="message-header"))
            message_container.mount(Static(Text(content_str, no_wrap=False), classes="message-content"))
        if self.input_container.pending_prompt is not None:
            self.agent_state = "AWAITING_INPUT"
        self.input_container.display = self.input_container.pending_prompt is not None and self.i_step == len(items) - 1
        if self.input_container.display:
            self.input_container.on_focus()
        self._update_headers()
        self.refresh()
    def _update_headers(self) -> None:
        """Update just the title with current state and spinner if needed."""
        status_text = self.agent_state
        if self.agent_state == "RUNNING":
            spinner_frame = str(self._spinner.render(time.time())).strip()
            status_text = f"{self.agent_state} {spinner_frame}"
        self.title = f"Step {self.i_step + 1}/{self.n_steps} - {status_text} - Cost: ${self.agent.model.cost:.2f}"
        try:
            self.query_one("Header").set_class(self.agent_state == "RUNNING", "running")
        except NoMatches:  # might be called when shutting down
            pass
    # --- Other textual overrides ---
    def get_system_commands(self, screen: Screen) -> Iterable[SystemCommand]:
        # Add to palette
        yield from super().get_system_commands(screen)
        for binding in self.BINDINGS:
            description = f"{binding.description} (shortcut {' OR '.join(binding.key.split(','))})"  # type: ignore[attr-defined]
            action_method = getattr(self, f"action_{binding.action}")  # type: ignore[attr-defined]
            yield SystemCommand(description, binding.tooltip, action_method)  # type: ignore[attr-defined]
    # --- Textual bindings ---
    def action_yolo(self):
        self.agent.config.mode = "yolo"
        if self.input_container.pending_prompt is not None:
            self.input_container._complete_input("")  # accept
        self.notify("YOLO mode enabled - LM actions will execute immediately")
    def action_human(self):
        if self.agent.config.mode == "confirm" and self.input_container.pending_prompt is not None:
            self.input_container._complete_input("User switched to manual mode, this command will be ignored")
        self.agent.config.mode = "human"
        self.notify("Human mode enabled - you can now type commands directly")
    def action_confirm(self):
        if self.agent.config.mode == "human" and self.input_container.pending_prompt is not None:
            self.input_container._complete_input("")  # just submit blank action
        self.agent.config.mode = "confirm"
        self.notify("Confirm mode enabled - LM proposes commands and you confirm/reject them")
    def action_next_step(self) -> None:
        self.i_step += 1
    def action_previous_step(self) -> None:
        self.i_step -= 1
    def action_first_step(self) -> None:
        self.i_step = 0
    def action_last_step(self) -> None:
        self.i_step = self.n_steps - 1
    def action_scroll_down(self) -> None:
        self._vscroll.scroll_to(y=self._vscroll.scroll_target_y + 15)
    def action_scroll_up(self) -> None:
        self._vscroll.scroll_to(y=self._vscroll.scroll_target_y - 15)
    def action_toggle_help_panel(self) -> None:
        if self.query("HelpPanel"):
            self.action_hide_help_panel()
        else:
            self.action_show_help_panel()
See also
- This agent subclass builds on top of the default agent, make sure to read that first.
- This class powers the minicommand line tool, see usage for more details.
TextualAgent(model, env, **kwargs)
              Bases: App
Source code in src/minisweagent/agents/interactive_textual.py
                    | 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 |  | 
class-attribute
      instance-attribute
  
BINDINGS = [
    Binding(
        "right,l",
        "next_step",
        "Step++",
        tooltip="Show next step of the agent",
    ),
    Binding(
        "left,h",
        "previous_step",
        "Step--",
        tooltip="Show previous step of the agent",
    ),
    Binding(
        "0",
        "first_step",
        "Step=0",
        tooltip="Show first step of the agent",
        show=False,
    ),
    Binding(
        "$",
        "last_step",
        "Step=-1",
        tooltip="Show last step of the agent",
        show=False,
    ),
    Binding(
        "j,down", "scroll_down", "Scroll down", show=False
    ),
    Binding("k,up", "scroll_up", "Scroll up", show=False),
    Binding(
        "q,ctrl+q", "quit", "Quit", tooltip="Quit the agent"
    ),
    Binding(
        "y,ctrl+y",
        "yolo",
        "YOLO mode",
        tooltip="Switch to YOLO Mode (LM actions will execute immediately)",
    ),
    Binding(
        "c",
        "confirm",
        "CONFIRM mode",
        tooltip="Switch to Confirm Mode (LM proposes commands and you confirm/reject them)",
    ),
    Binding(
        "u,ctrl+u",
        "human",
        "HUMAN mode",
        tooltip="Switch to Human Mode (you can now type commands directly)",
    ),
    Binding(
        "f1,question_mark",
        "toggle_help_panel",
        "Help",
        tooltip="Show help",
    ),
]
instance-attribute
  
agent_state = 'UNINITIALIZED'
instance-attribute
  
agent = _TextualAgent(self, model=model, env=env, **kwargs)
instance-attribute
  
n_steps = 1
instance-attribute
  
log_handler = AddLogEmitCallback(
    lambda record: call_from_thread(
        on_log_message_emitted, record
    )
)
instance-attribute
  
exit_status: str = 'ExitStatusUnset'
instance-attribute
  
result: str = ''
property
  
config
property
      writable
  
i_step: int
Current step index.
property
  
messages: list[dict]
property
  
model
property
  
env
run(task: str, **kwargs) -> tuple[str, str]
Source code in src/minisweagent/agents/interactive_textual.py
              | 279 280 281 282 |  | 
compose() -> ComposeResult
Source code in src/minisweagent/agents/interactive_textual.py
              | 303 304 305 306 307 308 309 310 |  | 
on_mount() -> None
Source code in src/minisweagent/agents/interactive_textual.py
              | 312 313 314 315 |  | 
on_message_added() -> None
Source code in src/minisweagent/agents/interactive_textual.py
              | 331 332 333 334 335 336 |  | 
on_log_message_emitted(record: LogRecord) -> None
Handle log messages of warning level or higher by showing them as notifications.
Source code in src/minisweagent/agents/interactive_textual.py
              | 338 339 340 341 |  | 
on_unmount() -> None
Clean up the log handler when the app shuts down.
Source code in src/minisweagent/agents/interactive_textual.py
              | 343 344 345 346 |  | 
on_agent_finished(exit_status: str, result: str)
Source code in src/minisweagent/agents/interactive_textual.py
              | 348 349 350 351 352 353 |  | 
update_content() -> None
Source code in src/minisweagent/agents/interactive_textual.py
              | 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 |  | 
get_system_commands(
    screen: Screen,
) -> Iterable[SystemCommand]
Source code in src/minisweagent/agents/interactive_textual.py
              | 400 401 402 403 404 405 406 |  | 
action_yolo()
Source code in src/minisweagent/agents/interactive_textual.py
              | 410 411 412 413 414 |  | 
action_human()
Source code in src/minisweagent/agents/interactive_textual.py
              | 416 417 418 419 420 |  | 
action_confirm()
Source code in src/minisweagent/agents/interactive_textual.py
              | 422 423 424 425 426 |  | 
action_next_step() -> None
Source code in src/minisweagent/agents/interactive_textual.py
              | 428 429 |  | 
action_previous_step() -> None
Source code in src/minisweagent/agents/interactive_textual.py
              | 431 432 |  | 
action_first_step() -> None
Source code in src/minisweagent/agents/interactive_textual.py
              | 434 435 |  | 
action_last_step() -> None
Source code in src/minisweagent/agents/interactive_textual.py
              | 437 438 |  | 
action_scroll_down() -> None
Source code in src/minisweagent/agents/interactive_textual.py
              | 440 441 |  | 
action_scroll_up() -> None
Source code in src/minisweagent/agents/interactive_textual.py
              | 443 444 |  | 
action_toggle_help_panel() -> None
Source code in src/minisweagent/agents/interactive_textual.py
              | 446 447 448 449 450 |  | 
dataclass
  
TextualAgentConfig(
    system_template: str = "You are a helpful assistant that can do anything.",
    instance_template: str = "Your task: {{task}}. Please reply with a single shell command in triple backticks. To finish, the first line of the output of the shell command must be 'COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT'.",
    timeout_template: str = "The last command <command>{{action['action']}}</command> timed out and has been killed.\nThe output of the command was:\n <output>\n{{output}}\n</output>\nPlease try another command and make sure to avoid those requiring interactive input.",
    format_error_template: str = "Please always provide EXACTLY ONE action in triple backticks.",
    action_observation_template: str = "Observation: {{output}}",
    step_limit: int = 0,
    cost_limit: float = 3.0,
    mode: Literal["confirm", "yolo"] = "confirm",
    whitelist_actions: list[str] = list(),
    confirm_exit: bool = True,
)
              Bases: AgentConfig
class-attribute
      instance-attribute
  
mode: Literal['confirm', 'yolo'] = 'confirm'
Mode for action execution: 'confirm' requires user confirmation, 'yolo' executes immediately.
class-attribute
      instance-attribute
  
whitelist_actions: list[str] = field(default_factory=list)
Never confirm actions that match these regular expressions.
class-attribute
      instance-attribute
  
confirm_exit: bool = True
If the agent wants to finish, do we ask for confirmation from user?
SmartInputContainer(app: TextualAgent)
              Bases: Container
Smart input container supporting single-line and multi-line input modes.
Source code in src/minisweagent/agents/interactive_textual.py
                    | 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 |  | 
instance-attribute
  
can_focus = True
instance-attribute
  
display = False
instance-attribute
  
pending_prompt: str | None = None
compose() -> ComposeResult
Source code in src/minisweagent/agents/interactive_textual.py
              | 150 151 |  | 
on_mount() -> None
Initialize the widget state.
Source code in src/minisweagent/agents/interactive_textual.py
              | 153 154 155 156 |  | 
on_focus() -> None
Called when the container gains focus.
Source code in src/minisweagent/agents/interactive_textual.py
              | 158 159 160 161 162 163 |  | 
request_input(prompt: str) -> str
Request input from user. Returns input text (empty string if confirmed without reason).
Source code in src/minisweagent/agents/interactive_textual.py
              | 165 166 167 168 169 170 171 172 173 174 |  | 
action_toggle_mode() -> None
Switch from single-line to multi-line mode (one-way only).
Source code in src/minisweagent/agents/interactive_textual.py
              | 192 193 194 195 196 197 198 199 |  | 
on_input_submitted(event: Submitted) -> None
Handle single-line input submission.
Source code in src/minisweagent/agents/interactive_textual.py
              | 217 218 219 220 221 |  | 
on_key(event: Key) -> None
Handle key events.
Source code in src/minisweagent/agents/interactive_textual.py
              | 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 |  | 
AddLogEmitCallback(callback)
              Bases: Handler
Custom log handler that forwards messages via callback.
Source code in src/minisweagent/agents/interactive_textual.py
                    | 102 103 104 105 |  | 
instance-attribute
  
callback = callback
emit(record: LogRecord)
Source code in src/minisweagent/agents/interactive_textual.py
              | 107 108 |  | 
 
    