OpenRouter Model

OpenRouter Model class

Read on GitHub

Full source code

import json
import logging
import os
import time
from typing import Any, Literal

import requests
from pydantic import BaseModel

from minisweagent.exceptions import FormatError
from minisweagent.models import GLOBAL_MODEL_STATS
from minisweagent.models.utils.actions_toolcall import (
    BASH_TOOL,
    format_toolcall_observation_messages,
    parse_toolcall_actions,
)
from minisweagent.models.utils.anthropic_utils import _reorder_anthropic_thinking_blocks
from minisweagent.models.utils.cache_control import set_cache_control
from minisweagent.models.utils.openai_multimodal import expand_multimodal_content
from minisweagent.models.utils.retry import retry

logger = logging.getLogger("openrouter_model")


class OpenRouterModelConfig(BaseModel):
    model_name: str
    model_kwargs: dict[str, Any] = {}
    set_cache_control: Literal["default_end"] | None = None
    """Set explicit cache control markers, for example for Anthropic models"""
    cost_tracking: Literal["default", "ignore_errors"] = os.getenv("MSWEA_COST_TRACKING", "default")
    """Cost tracking mode for this model. Can be "default" or "ignore_errors" (ignore errors/missing cost info)"""
    format_error_template: str = "{{ error }}"
    """Template used when the LM's output is not in the expected format."""
    observation_template: str = (
        "{% if output.exception_info %}<exception>{{output.exception_info}}</exception>\n{% endif %}"
        "<returncode>{{output.returncode}}</returncode>\n<output>\n{{output.output}}</output>"
    )
    """Template used to render the observation after executing an action."""
    multimodal_regex: str = ""
    """Regex to extract multimodal content. Empty string disables multimodal processing."""


class OpenRouterAPIError(Exception):
    """Custom exception for OpenRouter API errors."""


class OpenRouterAuthenticationError(Exception):
    """Custom exception for OpenRouter authentication errors."""


class OpenRouterRateLimitError(Exception):
    """Custom exception for OpenRouter rate limit errors."""


class OpenRouterModel:
    abort_exceptions: list[type[Exception]] = [OpenRouterAuthenticationError, KeyboardInterrupt]

    def __init__(self, **kwargs):
        self.config = OpenRouterModelConfig(**kwargs)
        self._api_url = "https://openrouter.ai/api/v1/chat/completions"
        self._api_key = os.getenv("OPENROUTER_API_KEY", "")

    def _query(self, messages: list[dict[str, str]], **kwargs):
        headers = {
            "Authorization": f"Bearer {self._api_key}",
            "Content-Type": "application/json",
        }

        payload = {
            "model": self.config.model_name,
            "messages": messages,
            "tools": [BASH_TOOL],
            "usage": {"include": True},
            **(self.config.model_kwargs | kwargs),
        }

        try:
            response = requests.post(self._api_url, headers=headers, data=json.dumps(payload), timeout=60)
            response.raise_for_status()
            return response.json()
        except requests.exceptions.HTTPError as e:
            if response.status_code == 401:
                error_msg = "Authentication failed. You can permanently set your API key with `mini-extra config set OPENROUTER_API_KEY YOUR_KEY`."
                raise OpenRouterAuthenticationError(error_msg) from e
            elif response.status_code == 429:
                raise OpenRouterRateLimitError("Rate limit exceeded") from e
            else:
                raise OpenRouterAPIError(f"HTTP {response.status_code}: {response.text}") from e
        except requests.exceptions.RequestException as e:
            raise OpenRouterAPIError(f"Request failed: {e}") from e

    def _prepare_messages_for_api(self, messages: list[dict]) -> list[dict]:
        prepared = [{k: v for k, v in msg.items() if k != "extra"} for msg in messages]
        prepared = _reorder_anthropic_thinking_blocks(prepared)
        return set_cache_control(prepared, mode=self.config.set_cache_control)

    def query(self, messages: list[dict[str, str]], **kwargs) -> dict:
        for attempt in retry(logger=logger, abort_exceptions=self.abort_exceptions):
            with attempt:
                response = self._query(self._prepare_messages_for_api(messages), **kwargs)
        cost_output = self._calculate_cost(response)
        GLOBAL_MODEL_STATS.add(cost_output["cost"])
        try:
            actions = self._parse_actions(response)
        except FormatError as e:
            # dict(response) is a shallow copy; the original response object is not mutated.
            e.messages[0]["extra"]["response"] = dict(response)
            raise
        message = dict(response["choices"][0]["message"])
        message["extra"] = {
            "actions": actions,
            "response": response,
            **cost_output,
            "timestamp": time.time(),
        }
        return message

    def _calculate_cost(self, response) -> dict[str, float]:
        usage = response.get("usage", {})
        cost = usage.get("cost", 0.0)
        if cost <= 0.0 and self.config.cost_tracking != "ignore_errors":
            raise RuntimeError(
                f"No valid cost information available from OpenRouter API for model {self.config.model_name}: "
                f"Usage {usage}, cost {cost}. Cost must be > 0.0. Set cost_tracking: 'ignore_errors' in your config file or "
                "export MSWEA_COST_TRACKING='ignore_errors' to ignore cost tracking errors "
                "(for example for free/local models), more information at https://klieret.short.gy/mini-local-models "
                "for more details. Still stuck? Please open a github issue at https://github.com/SWE-agent/mini-swe-agent/issues/new/choose!"
            )
        return {"cost": cost}

    def _parse_actions(self, response: dict) -> list[dict]:
        """Parse tool calls from the response. Raises FormatError if unknown tool."""
        tool_calls = response["choices"][0]["message"].get("tool_calls") or []
        tool_calls = [_DictToObj(tc) for tc in tool_calls]
        return parse_toolcall_actions(
            tool_calls,
            format_error_template=self.config.format_error_template,
            template_kwargs={"finish_reason": response["choices"][0].get("finish_reason")},
        )

    def format_message(self, **kwargs) -> dict:
        return expand_multimodal_content(kwargs, pattern=self.config.multimodal_regex)

    def format_observation_messages(
        self, message: dict, outputs: list[dict], template_vars: dict | None = None
    ) -> list[dict]:
        """Format execution outputs into tool result messages."""
        actions = message.get("extra", {}).get("actions", [])
        return format_toolcall_observation_messages(
            actions=actions,
            outputs=outputs,
            observation_template=self.config.observation_template,
            template_vars=template_vars,
            multimodal_regex=self.config.multimodal_regex,
        )

    def get_template_vars(self, **kwargs) -> dict[str, Any]:
        return self.config.model_dump()

    def serialize(self) -> dict:
        return {
            "info": {
                "config": {
                    "model": self.config.model_dump(mode="json"),
                    "model_type": f"{self.__class__.__module__}.{self.__class__.__name__}",
                },
            }
        }


class _DictToObj:
    """Simple wrapper to convert dict to object with attribute access."""

    def __init__(self, d: dict):
        self._d = d
        self.id = d.get("id")
        self.function = _DictToObj(d.get("function", {})) if "function" in d else None
        self.name = d.get("name")
        self.arguments = d.get("arguments")

Guide

Setting up OpenRouter models is covered in the quickstart guide.

minisweagent.models.openrouter_model

logger `module-attribute`

logger = getLogger('openrouter_model')

OpenRouterModelConfig

Bases: BaseModel

model_name `instance-attribute`

model_name: str

model_kwargs `class-attribute` `instance-attribute`

model_kwargs: dict[str, Any] = {}

set_cache_control `class-attribute` `instance-attribute`

set_cache_control: Literal['default_end'] | None = None

Set explicit cache control markers, for example for Anthropic models

cost_tracking `class-attribute` `instance-attribute`

cost_tracking: Literal["default", "ignore_errors"] = getenv(
    "MSWEA_COST_TRACKING", "default"
)

Cost tracking mode for this model. Can be "default" or "ignore_errors" (ignore errors/missing cost info)

format_error_template `class-attribute` `instance-attribute`

format_error_template: str = '{{ error }}'

Template used when the LM's output is not in the expected format.

observation_template `class-attribute` `instance-attribute`

observation_template: str = "{% if output.exception_info %}<exception>{{output.exception_info}}</exception>\n{% endif %}<returncode>{{output.returncode}}</returncode>\n<output>\n{{output.output}}</output>"

Template used to render the observation after executing an action.

multimodal_regex `class-attribute` `instance-attribute`

multimodal_regex: str = ''

Regex to extract multimodal content. Empty string disables multimodal processing.

OpenRouterAPIError

Bases: Exception

Custom exception for OpenRouter API errors.

OpenRouterAuthenticationError

Bases: Exception

Custom exception for OpenRouter authentication errors.

OpenRouterRateLimitError

Bases: Exception

Custom exception for OpenRouter rate limit errors.

OpenRouterModel

OpenRouterModel(**kwargs)

Source code in src/minisweagent/models/openrouter_model.py

def __init__(self, **kwargs):
    self.config = OpenRouterModelConfig(**kwargs)
    self._api_url = "https://openrouter.ai/api/v1/chat/completions"
    self._api_key = os.getenv("OPENROUTER_API_KEY", "")

abort_exceptions `class-attribute` `instance-attribute`

abort_exceptions: list[type[Exception]] = [
    OpenRouterAuthenticationError,
    KeyboardInterrupt,
]

config `instance-attribute`

config = OpenRouterModelConfig(**kwargs)

query

query(messages: list[dict[str, str]], **kwargs) -> dict

Source code in src/minisweagent/models/openrouter_model.py

def query(self, messages: list[dict[str, str]], **kwargs) -> dict:
    for attempt in retry(logger=logger, abort_exceptions=self.abort_exceptions):
        with attempt:
            response = self._query(self._prepare_messages_for_api(messages), **kwargs)
    cost_output = self._calculate_cost(response)
    GLOBAL_MODEL_STATS.add(cost_output["cost"])
    try:
        actions = self._parse_actions(response)
    except FormatError as e:
        # dict(response) is a shallow copy; the original response object is not mutated.
        e.messages[0]["extra"]["response"] = dict(response)
        raise
    message = dict(response["choices"][0]["message"])
    message["extra"] = {
        "actions": actions,
        "response": response,
        **cost_output,
        "timestamp": time.time(),
    }
    return message

format_message

format_message(**kwargs) -> dict

Source code in src/minisweagent/models/openrouter_model.py

def format_message(self, **kwargs) -> dict:
    return expand_multimodal_content(kwargs, pattern=self.config.multimodal_regex)

format_observation_messages

format_observation_messages(
    message: dict,
    outputs: list[dict],
    template_vars: dict | None = None,
) -> list[dict]

Format execution outputs into tool result messages.

Source code in src/minisweagent/models/openrouter_model.py

def format_observation_messages(
    self, message: dict, outputs: list[dict], template_vars: dict | None = None
) -> list[dict]:
    """Format execution outputs into tool result messages."""
    actions = message.get("extra", {}).get("actions", [])
    return format_toolcall_observation_messages(
        actions=actions,
        outputs=outputs,
        observation_template=self.config.observation_template,
        template_vars=template_vars,
        multimodal_regex=self.config.multimodal_regex,
    )

get_template_vars

get_template_vars(**kwargs) -> dict[str, Any]

Source code in src/minisweagent/models/openrouter_model.py

def get_template_vars(self, **kwargs) -> dict[str, Any]:
    return self.config.model_dump()

serialize

serialize() -> dict

Source code in src/minisweagent/models/openrouter_model.py

def serialize(self) -> dict:
    return {
        "info": {
            "config": {
                "model": self.config.model_dump(mode="json"),
                "model_type": f"{self.__class__.__module__}.{self.__class__.__name__}",
            },
        }
    }

bug_report Something broken/unclear?

Open an issue on GitHub!

help Open-ended discussions

Join our Slack!

Our projects

OpenRouter Model

minisweagent.models.openrouter_model

logger module-attribute

OpenRouterModelConfig

model_name instance-attribute

model_kwargs class-attribute instance-attribute

set_cache_control class-attribute instance-attribute

cost_tracking class-attribute instance-attribute

format_error_template class-attribute instance-attribute

observation_template class-attribute instance-attribute

multimodal_regex class-attribute instance-attribute

OpenRouterAPIError

OpenRouterAuthenticationError

OpenRouterRateLimitError

OpenRouterModel

abort_exceptions class-attribute instance-attribute

config instance-attribute

query

format_message

format_observation_messages

get_template_vars

serialize

logger `module-attribute`

model_name `instance-attribute`

model_kwargs `class-attribute` `instance-attribute`

set_cache_control `class-attribute` `instance-attribute`

cost_tracking `class-attribute` `instance-attribute`

format_error_template `class-attribute` `instance-attribute`

observation_template `class-attribute` `instance-attribute`

multimodal_regex `class-attribute` `instance-attribute`

abort_exceptions `class-attribute` `instance-attribute`

config `instance-attribute`