PyPI - mini-swe-agent - Versions diffs - 1.6.0__py3-none-any.whl → 1.8.0__py3-none-any.whl - Mend

mini-swe-agent 1.6.0-py3-none-any.whl → 1.8.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (21)

{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/METADATA +3 -3
{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/RECORD +21 -21
minisweagent/__init__.py +2 -2
minisweagent/agents/default.py +6 -6
minisweagent/agents/interactive_textual.py +27 -12
minisweagent/config/default.yaml +2 -4
minisweagent/config/extra/swebench.yaml +6 -5
minisweagent/config/github_issue.yaml +3 -3
minisweagent/config/mini.yaml +2 -4
minisweagent/config/mini_no_temp.yaml +2 -4
minisweagent/environments/__init__.py +29 -0
minisweagent/environments/docker.py +1 -1
minisweagent/environments/singularity.py +24 -2
minisweagent/run/extra/config.py +2 -1
minisweagent/run/extra/swebench.py +32 -21
minisweagent/run/extra/swebench_single.py +22 -18
minisweagent/run/mini.py +12 -35
{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/WHEEL +0 -0
{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/entry_points.txt +0 -0
{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/licenses/LICENSE.md +0 -0
{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/top_level.txt +0 -0

{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: mini-swe-agent
-Version: 1.6.0
+Version: 1.8.0
 Summary: Nano SWE Agent - A simple AI software engineering agent
 Author-email: Kilian Lieret <kilian.lieret@posteo.de>, "Carlos E. Jimenez" <carlosej@princeton.edu>
 License: MIT License
@@ -40,7 +40,7 @@ License-File: LICENSE.md
 Requires-Dist: pyyaml
 Requires-Dist: requests
 Requires-Dist: jinja2
-Requires-Dist: litellm
+Requires-Dist: litellm>=1.75.5
 Requires-Dist: tenacity
 Requires-Dist: rich
 Requires-Dist: python-dotenv
@@ -92,7 +92,7 @@ Here's some details:
 - **Minimal**: Just [100 lines of python](https://github.com/SWE-agent/mini-swe-agent/blob/main/src/minisweagent/agents/default.py) (+100 total for [env](https://github.com/SWE-agent/mini-swe-agent/blob/main/src/minisweagent/environments/local.py),
 [model](https://github.com/SWE-agent/mini-swe-agent/blob/main/src/minisweagent/models/litellm_model.py), [script](https://github.com/SWE-agent/mini-swe-agent/blob/main/src/minisweagent/run/hello_world.py)) — no fancy dependencies!
-- **Powerful:** Resolves 65% of GitHub issues in the [SWE-bench verified benchmark](https://www.swebench.com/) ([leaderboard](https://swe-bench.com/)).
+- **Powerful:** Resolves 68% of GitHub issues in the [SWE-bench verified benchmark](https://www.swebench.com/) ([leaderboard](https://swe-bench.com/)).
 - **Convenient:** Comes with UIs that turn this into your daily dev swiss army knife!
 - **Deployable:** In addition to local envs, you can use **docker**, **podman**, **singularity**, **apptainer**, and more
 - **Tested:** [![Codecov](https://img.shields.io/codecov/c/github/swe-agent/mini-swe-agent?style=flat-square)](https://codecov.io/gh/SWE-agent/mini-swe-agent)

{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/RECORD RENAMED Viewed

@@ -1,24 +1,24 @@
-mini_swe_agent-1.6.0.dist-info/licenses/LICENSE.md,sha256=D3luWPkdHAe7LBsdD4vzqDAXw6Xewb3G-uczss0uh1s,1094
-minisweagent/__init__.py,sha256=TzDDE2Pena2PXb1qZldoecg2ELBnSm6KU_eXavcOWVQ,1787
+mini_swe_agent-1.8.0.dist-info/licenses/LICENSE.md,sha256=D3luWPkdHAe7LBsdD4vzqDAXw6Xewb3G-uczss0uh1s,1094
+minisweagent/__init__.py,sha256=uHro6Ebka9Iwr8HmO6GaEvNEuwJh_JKSd_54XNw445c,1797
 minisweagent/__main__.py,sha256=FIyAOiw--c3FQ2g240FOM1FdL0lk_PxSpixu0pQ7WFo,194
 minisweagent/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 minisweagent/agents/__init__.py,sha256=cpjJLzg1IGxLM-tZpoMJV9S33ye13XtdBO0x7DU_Lrk,48
-minisweagent/agents/default.py,sha256=bqLMtEptn61zc_ptAIQkz_2fMI8hBoVpydVA84mPH8I,5471
+minisweagent/agents/default.py,sha256=2KiXOGNXLlhMqFtcsYGICTnfk8pUHn292g_kOlMyECY,5555
 minisweagent/agents/interactive.py,sha256=7HW2cffaV5f66DIjxvtIbL8mo_S5aZSwgNLSmHp6VC0,7450
-minisweagent/agents/interactive_textual.py,sha256=Ef2GTH2_9ujD95ukVf-hb7X6FCRVgvIdlJZvPvCAd-E,17629
+minisweagent/agents/interactive_textual.py,sha256=yYVtgHXdrKkirMyyHehYs5S3e7ddzqtoMSx8rU8_zBo,17944
 minisweagent/config/README.md,sha256=ABd9anA4aRWtx7Oh37z36Wv6ARvcxD2w9lPUE24R2mY,435
 minisweagent/config/__init__.py,sha256=0KzHaaIqWgRy2zbwIzhrg6BJPDzOvYi3jb4eBNY4sAU,823
-minisweagent/config/default.yaml,sha256=_OJNNTGOr-cyqzkrDIzB2F5H1N49Dlp--N0SDJvkVxE,5233
-minisweagent/config/github_issue.yaml,sha256=evvu3AJ52tXYSdami9_B8zfazOAE2r2XXkzVmScBoKc,4539
+minisweagent/config/default.yaml,sha256=OHK9-7PkCa9ZzgYykF1zGYC_AWkiAdOrEpDuurF-1Rk,5143
+minisweagent/config/github_issue.yaml,sha256=qbjj3vmdukxz36_EY7e64vhNn1g2-_NrdNx5xgMOUAI,4569
 minisweagent/config/mini.tcss,sha256=fmAP9cYAp2n7Ps2Dw3e-ZOGEF2E8JcwTgK1LDcis-x4,1141
-minisweagent/config/mini.yaml,sha256=kQWVlAPbbVUb-wKa3lw0ouNpEADTr1a7bXKjU3WegLE,5249
-minisweagent/config/mini_no_temp.yaml,sha256=KQpqexf0oOdrMLGNPIy5Ll30bAEw7mrZpgnnMxEygLc,5294
+minisweagent/config/mini.yaml,sha256=mDfN7KputHf7kOGidJFX5-5CDKg97vxxu2cdYYlPoM8,5159
+minisweagent/config/mini_no_temp.yaml,sha256=n0W-017tBmMx57U9SLt7Fy9WJxI9x2vdTWBWeSngGMc,5204
 minisweagent/config/extra/__init__.py,sha256=e1MoAlDn_wc9HnXNoncf1P-B4DQ-iRf6n7Q_txjZGRI,52
-minisweagent/config/extra/swebench.yaml,sha256=LNpTahpul6HL0HozgAAz-C6kpX3wZA7Tg8uE-ZmgrF4,7577
-minisweagent/environments/__init__.py,sha256=g5mKac1YgVOZVKvmiAiuyPSevRYpI69V4vYrbCH3gsI,54
-minisweagent/environments/docker.py,sha256=VYk7i0T0IgUF_s-N-DqYkHsBWbfgaIMpJZIIdEtetTw,3871
+minisweagent/config/extra/swebench.yaml,sha256=5FKblpcNTHmVUNE1JLHo5_AsupvlwsrLj8I3R2mRItk,7680
+minisweagent/environments/__init__.py,sha256=tTnNjNAhMvIuB1mlesreBV5TLdQBp79qj_Mxr7HGzNk,1180
+minisweagent/environments/docker.py,sha256=dSkD8FtHb9yN_ejau3ekN-FaHQMH2AWdhfpvZOoH7NQ,3909
 minisweagent/environments/local.py,sha256=-2EV3RqZSB8WEjJE7BHLhRjocPMLpoJ3HbM8QB1WXUU,1060
-minisweagent/environments/singularity.py,sha256=j7ptRVF8GwDLd-5IjhT5j7fNxEJz9amuLTmVxotaMlI,1796
+minisweagent/environments/singularity.py,sha256=fqDH4nTg3njHMe7BzQ4HUp_jAgXeKyLWm-TmH8WuNlA,2552
 minisweagent/environments/extra/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 minisweagent/environments/extra/swerex_docker.py,sha256=MOhhFdX1sAk_U0g-GOxohfjrldzO4YfrUnHq8qJff7c,1502
 minisweagent/models/__init__.py,sha256=J4bnvfMByTVG0cL_6p51sm8gdargXhARfbG5c0UZ8Z4,2890
@@ -32,18 +32,18 @@ minisweagent/run/__init__.py,sha256=WIoYgHVl7iZF2YncrfV3IttupG6P5KogroKHKECka3A,
 minisweagent/run/github_issue.py,sha256=GWOkGM09jOYV93p6xIM_kKWmC1yP_d5lprafWlqoBN0,2748
 minisweagent/run/hello_world.py,sha256=erLnEwNmPFLxq3-8zyv66Vy1kIqMqQf97vISX7LrQXg,959
 minisweagent/run/inspector.py,sha256=QnY3oYzm-yq3w9Jzs112Lco2Rg84vSocAWrQRVz_1lc,7127
-minisweagent/run/mini.py,sha256=yeVYaaQrYfAW5gzPsunxqB73CTnwugkQ1qPn2-Os-GM,4849
+minisweagent/run/mini.py,sha256=d-dtnddRDvs0Ub3mFuXJYsNh3sSfRnSPjp6877Y9O2I,4215
 minisweagent/run/mini_extra.py,sha256=ecA1PnTWElpO60G9RktvVLtUOf3bZ_ESmnSttS6izhQ,1465
 minisweagent/run/extra/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-minisweagent/run/extra/config.py,sha256=ezUu8n2-h79cfphWXv-j9LQXfxzkxrF2aPlh7mObF7k,3545
-minisweagent/run/extra/swebench.py,sha256=m5_PZI4ojkUyCxzkkMtel_vlnYmjziWrXu73yHoZGFs,9688
-minisweagent/run/extra/swebench_single.py,sha256=L3Kk4G65o3MCPLMEwGNIs77-AFf6Lfc8o1oxrbN-ZWM,1991
+minisweagent/run/extra/config.py,sha256=CEsEr8AdEm64Jods2ZRURChHKMILSatkBLkLmRywkrw,3672
+minisweagent/run/extra/swebench.py,sha256=1v5qGLaAOKdESEaa6qMgJUlUFh025gASpbEyxfzb4uM,10601
+minisweagent/run/extra/swebench_single.py,sha256=YWYAMr6rfsUCGtB_4_e_w_CQ5RWfLbXIXOOGV8HPDYc,2441
 minisweagent/run/extra/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 minisweagent/run/extra/utils/batch_progress.py,sha256=xhJ7FmsaTBGz-yh8pzYl4yMoUGjn7GA24eYrP-nHj60,6804
 minisweagent/run/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 minisweagent/run/utils/save.py,sha256=yI_hSU-GOaB7j8YeHBCc7Fhl4js9AyO9N5SC6p-nnu8,1606
-mini_swe_agent-1.6.0.dist-info/METADATA,sha256=QDXPWyxQpaflZdPzuFZmzdgIDnEAMp_XGnAfRnV41vU,13783
-mini_swe_agent-1.6.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-mini_swe_agent-1.6.0.dist-info/entry_points.txt,sha256=d1_yRbTaGjs1UXHa6JQK0sKDGBIVGm8oeW0k2kfbJgQ,182
-mini_swe_agent-1.6.0.dist-info/top_level.txt,sha256=zKF4t8bFpV87fdVABZt2Da-vnb4Vkh_CxkwQx5YT4Ew,13
-mini_swe_agent-1.6.0.dist-info/RECORD,,
+mini_swe_agent-1.8.0.dist-info/METADATA,sha256=jwXlBjL8-xSWt3QxyvLsw7E8erT0xtWYELQkdk3Ean8,13791
+mini_swe_agent-1.8.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+mini_swe_agent-1.8.0.dist-info/entry_points.txt,sha256=d1_yRbTaGjs1UXHa6JQK0sKDGBIVGm8oeW0k2kfbJgQ,182
+mini_swe_agent-1.8.0.dist-info/top_level.txt,sha256=zKF4t8bFpV87fdVABZt2Da-vnb4Vkh_CxkwQx5YT4Ew,13
+mini_swe_agent-1.8.0.dist-info/RECORD,,

minisweagent/__init__.py CHANGED Viewed

@@ -8,7 +8,7 @@ This file provides:
   unless you want the static type checking.
 """
-__version__ = "1.6.0"
+__version__ = "1.8.0"
 import os
 from pathlib import Path
@@ -61,7 +61,7 @@ class Agent(Protocol):
     env: Environment
     messages: list[dict[str, str]]
-    def run(self, task: str) -> tuple[str, str]: ...
+    def run(self, task: str, **kwargs) -> tuple[str, str]: ...
 __all__ = ["Agent", "Model", "Environment", "package_dir", "__version__", "global_config_file", "global_config_dir"]

minisweagent/agents/default.py CHANGED Viewed

@@ -18,7 +18,7 @@ class AgentConfig:
     system_template: str = "You are a helpful assistant that can do anything."
     instance_template: str = (
         "Your task: {{task}}. Please reply with a single shell command in triple backticks. "
-        "To finish, the first line of the output of the shell command must be 'MINI_SWE_AGENT_FINAL_OUTPUT'."
+        "To finish, the first line of the output of the shell command must be 'COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT'."
     )
     timeout_template: str = (
         "The last command <command>{{action['action']}}</command> timed out and has been killed.\n"
@@ -69,11 +69,11 @@ class DefaultAgent:
     def add_message(self, role: str, content: str, **kwargs):
         self.messages.append({"role": role, "content": content, **kwargs})
-    def run(self, task: str) -> tuple[str, str]:
+    def run(self, task: str, **kwargs) -> tuple[str, str]:
         """Run step() until agent is finished. Return exit status & message"""
         self.messages = []
         self.add_message("system", self.render_template(self.config.system_template))
-        self.add_message("user", self.render_template(self.config.instance_template, task=task))
+        self.add_message("user", self.render_template(self.config.instance_template, task=task, **kwargs))
         while True:
             try:
                 self.step()
@@ -124,6 +124,6 @@ class DefaultAgent:
     def has_finished(self, output: dict[str, str]):
         """Raises Submitted exception with final output if the agent has finished its task."""
-        lines = output.get("output", "").lstrip().splitlines()
-        if lines and lines[0].strip() == "MINI_SWE_AGENT_FINAL_OUTPUT":
-            raise Submitted("\n".join(lines[1:]))
+        lines = output.get("output", "").lstrip().splitlines(keepends=True)
+        if lines and lines[0].strip() in ["MINI_SWE_AGENT_FINAL_OUTPUT", "COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT"]:
+            raise Submitted("".join(lines[1:]))

minisweagent/agents/interactive_textual.py CHANGED Viewed

@@ -37,8 +37,8 @@ class TextualAgentConfig(AgentConfig):
     """If the agent wants to finish, do we ask for confirmation from user?"""
-class TextualAgent(DefaultAgent):
-    def __init__(self, app: "AgentApp", *args, **kwargs):
+class _TextualAgent(DefaultAgent):
+    def __init__(self, app: "TextualAgent", *args, **kwargs):
         """Connects the DefaultAgent to the TextualApp."""
         self.app = app
         super().__init__(*args, config_class=TextualAgentConfig, **kwargs)
@@ -59,9 +59,9 @@ class TextualAgent(DefaultAgent):
         self._current_action_from_human = False
         return super().query()
-    def run(self, task: str) -> tuple[str, str]:
+    def run(self, task: str, **kwargs) -> tuple[str, str]:
         try:
-            exit_status, result = super().run(task)
+            exit_status, result = super().run(task, **kwargs)
         except Exception as e:
             result = str(e)
             self.app.call_from_thread(self.app.action_quit)
@@ -123,7 +123,7 @@ def _messages_to_steps(messages: list[dict]) -> list[list[dict]]:
 class SmartInputContainer(Container):
-    def __init__(self, app: "AgentApp"):
+    def __init__(self, app: "TextualAgent"):
         """Smart input container supporting single-line and multi-line input modes."""
         super().__init__(classes="smart-input-container")
         self._app = app
@@ -239,7 +239,7 @@ class SmartInputContainer(Container):
             return
-class AgentApp(App):
+class TextualAgent(App):
     BINDINGS = [
         Binding("right,l", "next_step", "Step++", tooltip="Show next step of the agent"),
         Binding("left,h", "previous_step", "Step--", tooltip="Show previous step of the agent"),
@@ -259,24 +259,28 @@ class AgentApp(App):
         Binding("f1,question_mark", "toggle_help_panel", "Help", tooltip="Show help"),
     ]
-    def __init__(self, model, env, task: str, **kwargs):
+    def __init__(self, model, env, **kwargs):
         css_path = os.environ.get("MSWEA_MINI_STYLE_PATH", str(Path(__file__).parent.parent / "config" / "mini.tcss"))
         self.__class__.CSS = Path(css_path).read_text()
         super().__init__()
         self.agent_state = "UNINITIALIZED"
-        self.agent_task = task
-        self.agent = TextualAgent(self, model=model, env=env, **kwargs)
+        self.agent = _TextualAgent(self, model=model, env=env, **kwargs)
         self._i_step = 0
         self.n_steps = 1
         self.input_container = SmartInputContainer(self)
         self.log_handler = AddLogEmitCallback(lambda record: self.call_from_thread(self.on_log_message_emitted, record))
         logging.getLogger().addHandler(self.log_handler)
         self._spinner = Spinner("dots")
-        self.exit_status: str | None = None
-        self.result: str | None = None
+        self.exit_status: str = "ExitStatusUnset"
+        self.result: str = ""
         self._vscroll = VerticalScroll()
+    def run(self, task: str) -> tuple[str, str]:
+        threading.Thread(target=lambda: self.agent.run(task), daemon=True).start()
+        super().run()
+        return self.exit_status, self.result
     # --- Basics ---
     @property
@@ -305,7 +309,18 @@ class AgentApp(App):
         self.agent_state = "RUNNING"
         self.update_content()
         self.set_interval(1 / 8, self._update_headers)
-        threading.Thread(target=lambda: self.agent.run(self.agent_task), daemon=True).start()
+    @property
+    def messages(self) -> list[dict]:
+        return self.agent.messages
+    @property
+    def model(self):
+        return self.agent.model
+    @property
+    def env(self):
+        return self.agent.env
     # --- Reacting to events ---

minisweagent/config/default.yaml CHANGED Viewed

@@ -15,8 +15,6 @@ agent:
     </format_example>
     Failure to follow these rules will cause your response to be rejected.
-    To finish, issue the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`
-    without any other command.
   instance_template: |
     Please solve this issue: {{task}}
@@ -31,7 +29,7 @@ agent:
     3. Edit the source code to resolve the issue
     4. Verify your fix works by running your script again
     5. Test edge cases to ensure your fix is robust
-    6. Submit your changes and finish your work by issuing the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`.
+    6. Submit your changes and finish your work by issuing the following command: `echo COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT`.
        Do not combine it with any other command. <important>After this command, you cannot continue working on this task.</important>
     ## Important Rules
@@ -130,7 +128,7 @@ agent:
     {%- endif -%}
   format_error_template: |
     Please always provide EXACTLY ONE action in triple backticks, found {{actions|length}} actions.
-    If you want to end the task, please issue the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`
+    If you want to end the task, please issue the following command: `echo COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT`
     without any other command.
     Else, please format your response exactly as follows:

minisweagent/config/extra/swebench.yaml CHANGED Viewed

@@ -159,15 +159,15 @@ agent:
     ```
     ## Submission
-    When you've completed your changes or can't make further progress
+    When you've completed your work (reading, editing, testing), and cannot make further progress
     issue exactly the following command:
     ```bash
-    echo MINI_SWE_AGENT_FINAL_OUTPUT && git add -A && git diff --cached
+    echo COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT && git add -A && git diff --cached
     ```
-    This command will submit your changes.
-    You cannot continue working on this task after submitting.
+    This command will submit your work.
+    You cannot continue working (reading, editing, testing) in any way on this task after submitting.
     </instructions>
   action_observation_template: |
     <returncode>{{output.returncode}}</returncode>
@@ -221,9 +221,10 @@ environment:
     LESS: -R
     PIP_PROGRESS_BAR: 'off'
     TQDM_DISABLE: '1'
+  environment_class: docker
 model:
   model_name: "claude-sonnet-4-20250514"
   model_kwargs:
+    drop_params: true
     temperature: 0.0
-    drop_params: true

minisweagent/config/github_issue.yaml CHANGED Viewed

@@ -15,7 +15,7 @@ agent:
     </format_example>
     Failure to follow these rules will cause your response to be rejected.
-    To finish, issue the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`
+    To finish, issue the following command: `echo COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT`
     without any other command.
   instance_template: |
     Please solve this issue: {{task}}
@@ -35,7 +35,7 @@ agent:
     2. The action must be enclosed in triple backticks
     3. Directory or environment variable changes are not persistent. Every action is executed in a new subshell.
        However, you can prefix any action with `MY_ENV_VAR=MY_VALUE cd /path/to/working/dir && ...` or write/load environment variables from files
-    4. To finish, issue the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`.
+    4. To finish, issue the following command: `echo COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT`.
        Do not combine it with any other command.
     ## Formatting your response
@@ -117,7 +117,7 @@ agent:
     {%- endif -%}
   format_error_template: |
     Please always provide EXACTLY ONE action in triple backticks, found {{actions|length}} actions.
-    If you want to end the task, please issue the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`
+    If you want to end the task, please issue the following command: `echo COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT`
     without any other command.
     Else, please format your response exactly as follows:

minisweagent/config/mini.yaml CHANGED Viewed

@@ -15,8 +15,6 @@ agent:
     </format_example>
     Failure to follow these rules will cause your response to be rejected.
-    To finish, issue the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`
-    without any other command.
   instance_template: |
     Please solve this issue: {{task}}
@@ -31,7 +29,7 @@ agent:
     3. Edit the source code to resolve the issue
     4. Verify your fix works by running your script again
     5. Test edge cases to ensure your fix is robust
-    6. Submit your changes and finish your work by issuing the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`.
+    6. Submit your changes and finish your work by issuing the following command: `echo COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT`.
        Do not combine it with any other command. <important>After this command, you cannot continue working on this task.</important>
     ## Important Rules
@@ -130,7 +128,7 @@ agent:
     {%- endif -%}
   format_error_template: |
     Please always provide EXACTLY ONE action in triple backticks, found {{actions|length}} actions.
-    If you want to end the task, please issue the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`
+    If you want to end the task, please issue the following command: `echo COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT`
     without any other command.
     Else, please format your response exactly as follows:

minisweagent/config/mini_no_temp.yaml CHANGED Viewed

@@ -16,8 +16,6 @@ agent:
     </format_example>
     Failure to follow these rules will cause your response to be rejected.
-    To finish, issue the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`
-    without any other command.
   instance_template: |
     Please solve this issue: {{task}}
@@ -32,7 +30,7 @@ agent:
     3. Edit the source code to resolve the issue
     4. Verify your fix works by running your script again
     5. Test edge cases to ensure your fix is robust
-    6. Submit your changes and finish your work by issuing the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`.
+    6. Submit your changes and finish your work by issuing the following command: `echo COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT`.
        Do not combine it with any other command. <important>After this command, you cannot continue working on this task.</important>
     ## Important Rules
@@ -131,7 +129,7 @@ agent:
     {%- endif -%}
   format_error_template: |
     Please always provide EXACTLY ONE action in triple backticks, found {{actions|length}} actions.
-    If you want to end the task, please issue the following command: `echo MINI_SWE_AGENT_FINAL_OUTPUT`
+    If you want to end the task, please issue the following command: `echo COMPLETE_TASK_AND_SUBMIT_FINAL_OUTPUT`
     without any other command.
     Else, please format your response exactly as follows:

minisweagent/environments/__init__.py CHANGED Viewed

@@ -1 +1,30 @@
 """Environment implementations for mini-SWE-agent."""
+import copy
+import importlib
+from minisweagent import Environment
+_ENVIRONMENT_MAPPING = {
+    "docker": "minisweagent.environments.docker.DockerEnvironment",
+    "singularity": "minisweagent.environments.singularity.SingularityEnvironment",
+    "local": "minisweagent.environments.local.LocalEnvironment",
+    "swerex_docker": "minisweagent.environments.extra.swerex_docker.SwerexDockerEnvironment",
+}
+def get_environment_class(spec: str) -> type[Environment]:
+    full_path = _ENVIRONMENT_MAPPING.get(spec, spec)
+    try:
+        module_name, class_name = full_path.rsplit(".", 1)
+        module = importlib.import_module(module_name)
+        return getattr(module, class_name)
+    except (ValueError, ImportError, AttributeError):
+        msg = f"Unknown environment type: {spec} (resolved to {full_path}, available: {_ENVIRONMENT_MAPPING})"
+        raise ValueError(msg)
+def get_environment(config: dict, *, default_type: str = "") -> Environment:
+    config = copy.deepcopy(config)
+    environment_class = config.pop("environment_class", default_type)
+    return get_environment_class(environment_class)(**config)

minisweagent/environments/docker.py CHANGED Viewed

@@ -20,7 +20,7 @@ class DockerEnvironmentConfig:
     """
     timeout: int = 30
     """Timeout for executing commands in the container."""
-    executable: str = "docker"
+    executable: str = os.getenv("MSWEA_DOCKER_EXECUTABLE", "docker")
     """Path to the docker/container executable."""
     run_args: list[str] = field(default_factory=list)
     """Additional arguments to pass to the docker/container executable."""

minisweagent/environments/singularity.py CHANGED Viewed

@@ -1,8 +1,12 @@
 #!/usr/bin/env python3
 import os
+import shutil
 import subprocess
+import tempfile
+import uuid
 from dataclasses import dataclass, field
+from pathlib import Path
 from typing import Any
@@ -16,7 +20,7 @@ class SingularityEnvironmentConfig:
     """Environment variables to forward to the container."""
     timeout: int = 30
     """Timeout for executing commands in the container."""
-    executable: str = "singularity"
+    executable: str = os.getenv("MSWEA_SINGULARITY_EXECUTABLE", "singularity")
     """Path to the singularity executable."""
@@ -24,11 +28,20 @@ class SingularityEnvironment:
     def __init__(self, **kwargs):
         """Singularity environment. See `SingularityEnvironmentConfig` for kwargs."""
         self.config = SingularityEnvironmentConfig(**kwargs)
+        self.sandbox_dir = Path(tempfile.gettempdir()) / f"minisweagent-{uuid.uuid4().hex[:8]}"
+        subprocess.run(
+            [self.config.executable, "build", "--sandbox", self.sandbox_dir, self.config.image],
+            check=True,
+        )
     def execute(self, command: str, cwd: str = "") -> dict[str, Any]:
         """Execute a command in a Singularity container and return the result as a dict."""
         cmd = [self.config.executable, "exec"]
+        # Do not inherit directories and env vars from host
+        cmd.extend(["--contain", "--cleanenv"])
         work_dir = cwd or self.config.cwd
         if work_dir and work_dir != "/":
             cmd.extend(["--pwd", work_dir])
@@ -39,7 +52,7 @@ class SingularityEnvironment:
         for key, value in self.config.env.items():
             cmd.extend(["--env", f"{key}={value}"])
-        cmd.extend([self.config.image, "bash", "-c", command])
+        cmd.extend(["--writable", str(self.sandbox_dir), "bash", "-c", command])
         result = subprocess.run(
             cmd,
             text=True,
@@ -50,3 +63,12 @@ class SingularityEnvironment:
             stderr=subprocess.STDOUT,
         )
         return {"output": result.stdout, "returncode": result.returncode}
+    def cleanup(self):
+        if self.sandbox_dir.exists():
+            print(f"Removing sandbox {self.sandbox_dir}")
+            shutil.rmtree(self.sandbox_dir)
+    def __del__(self):
+        """Cleanup sandbox when object is destroyed."""
+        self.cleanup()

minisweagent/run/extra/config.py CHANGED Viewed

@@ -34,11 +34,12 @@ This setup will ask you for your model and an API key.
 Here's a few popular models and the required API keys:
 [bold green]claude-sonnet-4-20250514[/bold green] ([bold green]ANTHROPIC_API_KEY[/bold green])
-[bold green]o3[/bold green] ([bold green]OPENAI_API_KEY[/bold green])
+[bold green]openai/gpt-5[/bold green] or [bold green]openai/gpt-5-mini[/bold green] ([bold green]OPENAI_API_KEY[/bold green])
 [bold yellow]You can leave any setting blank to skip it.[/bold yellow]
 More information at https://mini-swe-agent.com/latest/quickstart/
+To find the best model, check the leaderboard at https://swebench.com/
 """

minisweagent/run/extra/swebench.py CHANGED Viewed

@@ -17,9 +17,10 @@ import yaml
 from datasets import load_dataset
 from rich.live import Live
+from minisweagent import Environment
 from minisweagent.agents.default import DefaultAgent
 from minisweagent.config import builtin_config_dir, get_config_path
-from minisweagent.environments.docker import DockerEnvironment
+from minisweagent.environments import get_environment
 from minisweagent.models import get_model
 from minisweagent.run.extra.utils.batch_progress import RunBatchProgressManager
 from minisweagent.run.utils.save import save_traj
@@ -74,6 +75,15 @@ def get_swebench_docker_image_name(instance: dict) -> str:
     return image_name
+def get_sb_environment(config: dict, instance: dict) -> Environment:
+    image_name = get_swebench_docker_image_name(instance)
+    env_config = config.get("environment", {})
+    if env_config.get("environment_class") == "singularity":
+        image_name = "docker://" + image_name
+    env_config["image"] = image_name
+    return get_environment(env_config, default_type="docker")
 def update_preds_file(output_path: Path, instance_id: str, model_name: str, result: str):
     """Update the output JSON file with results from a single instance."""
     with _OUTPUT_FILE_LOCK:
@@ -102,8 +112,7 @@ def remove_from_preds_file(output_path: Path, instance_id: str):
 def process_instance(
     instance: dict,
     output_dir: Path,
-    model_name: str | None,
-    config_path: str | Path,
+    config: dict,
     progress_manager: RunBatchProgressManager,
 ) -> None:
     """Process a single SWEBench instance."""
@@ -112,10 +121,7 @@ def process_instance(
     # avoid inconsistent state if something here fails and there's leftover previous files
     remove_from_preds_file(output_dir / "preds.json", instance_id)
     (instance_dir / f"{instance_id}.traj.json").unlink(missing_ok=True)
-    image_name = get_swebench_docker_image_name(instance)
-    config = yaml.safe_load(get_config_path(config_path).read_text())
-    model = get_model(model_name, config=config.get("model", {}))
+    model = get_model(config=config.get("model", {}))
     task = instance["problem_statement"]
     progress_manager.on_instance_start(instance_id)
@@ -125,7 +131,7 @@ def process_instance(
     extra_info = None
     try:
-        env = DockerEnvironment(**(config.get("environment", {}) | {"image": image_name}))
+        env = get_sb_environment(config, instance)
         agent = ProgressTrackingAgent(
             model,
             env,
@@ -171,21 +177,22 @@ def filter_instances(
     return instances
+# fmt: off
 @app.command(help=_HELP_TEXT)
 def main(
-    subset: str = typer.Option("lite", "--subset", help="SWEBench subset to use or path to a dataset"),
-    split: str = typer.Option("dev", "--split", help="Dataset split"),
-    slice_spec: str = typer.Option("", "--slice", help="Slice specification (e.g., '0:5' for first 5 instances)"),
-    filter_spec: str = typer.Option("", "--filter", help="Filter instance IDs by regex"),
-    shuffle: bool = typer.Option(False, "--shuffle", help="Shuffle instances"),
-    output: str = typer.Option("", "-o", "--output", help="Output directory"),
-    workers: int = typer.Option(1, "-w", "--workers", help="Number of worker threads for parallel processing"),
-    model: str | None = typer.Option(None, "-m", "--model", help="Model to use"),
-    redo_existing: bool = typer.Option(False, "--redo-existing", help="Redo existing instances"),
-    config: Path = typer.Option(
-        builtin_config_dir / "extra" / "swebench.yaml", "-c", "--config", help="Path to a config file"
-    ),
+    subset: str = typer.Option("lite", "--subset", help="SWEBench subset to use or path to a dataset", rich_help_panel="Data selection"),
+    split: str = typer.Option("dev", "--split", help="Dataset split", rich_help_panel="Data selection"),
+    slice_spec: str = typer.Option("", "--slice", help="Slice specification (e.g., '0:5' for first 5 instances)", rich_help_panel="Data selection"),
+    filter_spec: str = typer.Option("", "--filter", help="Filter instance IDs by regex", rich_help_panel="Data selection"),
+    shuffle: bool = typer.Option(False, "--shuffle", help="Shuffle instances", rich_help_panel="Data selection"),
+    output: str = typer.Option("", "-o", "--output", help="Output directory", rich_help_panel="Basic"),
+    workers: int = typer.Option(1, "-w", "--workers", help="Number of worker threads for parallel processing", rich_help_panel="Basic"),
+    model: str | None = typer.Option(None, "-m", "--model", help="Model to use", rich_help_panel="Basic"),
+    redo_existing: bool = typer.Option(False, "--redo-existing", help="Redo existing instances", rich_help_panel="Data selection"),
+    config_spec: Path = typer.Option( builtin_config_dir / "extra" / "swebench.yaml", "-c", "--config", help="Path to a config file", rich_help_panel="Basic"),
+    environment_class: str | None = typer.Option( None, "--environment-class", help="Environment type to use. Recommended are docker or singularity", rich_help_panel="Advanced"),
 ) -> None:
+    # fmt: on
     dataset_path = DATASET_MAPPING.get(subset, subset)
     print(f"Loading dataset {dataset_path}, split {split}...")
     instances = list(load_dataset(dataset_path, split=split))
@@ -201,6 +208,10 @@ def main(
     print(f"Running on {len(instances)} instances...")
     print(f"Results will be saved to {output_path}")
+    config = yaml.safe_load(get_config_path(config_spec).read_text())
+    config.setdefault("environment", {}).setdefault("environment_class", environment_class)
+    config.setdefault("model", {}).setdefault("model_name", model)
     progress_manager = RunBatchProgressManager(len(instances), output_path / f"exit_statuses_{time.time()}.yaml")
     def process_futures(futures: dict[concurrent.futures.Future, str]):
@@ -218,7 +229,7 @@ def main(
     with Live(progress_manager.render_group, refresh_per_second=4):
         with concurrent.futures.ThreadPoolExecutor(max_workers=workers) as executor:
             futures = {
-                executor.submit(process_instance, instance, output_path, model, config, progress_manager): instance[
+                executor.submit(process_instance, instance, output_path, config, progress_manager): instance[
                     "instance_id"
                 ]
                 for instance in instances

minisweagent/run/extra/swebench_single.py CHANGED Viewed

@@ -8,29 +8,30 @@ from datasets import load_dataset
 from minisweagent.agents.interactive import InteractiveAgent
 from minisweagent.config import builtin_config_dir, get_config_path
-from minisweagent.environments.docker import DockerEnvironment
 from minisweagent.models import get_model
-from minisweagent.run.extra.swebench import DATASET_MAPPING, get_swebench_docker_image_name
+from minisweagent.run.extra.swebench import (
+    DATASET_MAPPING,
+    get_sb_environment,
+)
 app = typer.Typer(add_completion=False)
+# fmt: off
 @app.command()
 def main(
-    subset: str = typer.Option("lite", "--subset", help="SWEBench subset to use or path to a dataset"),
-    split: str = typer.Option("dev", "--split", help="Dataset split"),
-    instance_spec: str = typer.Option(None, "-i", "--instance", help="SWE-Bench instance ID"),
-    model_name: str | None = typer.Option(None, "-m", "--model", help="Model to use"),
-    config_path: Path = typer.Option(
-        builtin_config_dir / "extra" / "swebench.yaml", "-c", "--config", help="Path to a config file"
-    ),
+    subset: str = typer.Option("lite", "--subset", help="SWEBench subset to use or path to a dataset", rich_help_panel="Data selection"),
+    split: str = typer.Option("dev", "--split", help="Dataset split", rich_help_panel="Data selection"),
+    instance_spec: str = typer.Option(0, "-i", "--instance", help="SWE-Bench instance ID or index", rich_help_panel="Data selection"),
+    model_name: str | None = typer.Option(None, "-m", "--model", help="Model to use", rich_help_panel="Basic"),
+    config_path: Path = typer.Option( builtin_config_dir / "extra" / "swebench.yaml", "-c", "--config", help="Path to a config file", rich_help_panel="Basic"),
+    environment_class: str | None = typer.Option(None, "--environment-class", rich_help_panel="Advanced"),
+    exit_immediately: bool = typer.Option( False, "--exit-immediately", help="Exit immediately when the agent wants to finish instead of prompting.", rich_help_panel="Basic"),
 ) -> None:
+    # fmt: on
     """Run on a single SWE-Bench instance."""
-    try:
-        dataset_path = DATASET_MAPPING[subset]
-    except KeyError:
-        dataset_path = subset
-    print(f"Loading dataset {dataset_path}, split {split}...")
+    dataset_path = DATASET_MAPPING.get(subset, subset)
+    print(f"Loading dataset from {dataset_path}, split {split}...")
     instances = {
         inst["instance_id"]: inst  # type: ignore
         for inst in load_dataset(dataset_path, split=split)
@@ -39,12 +40,15 @@ def main(
         instance_spec = sorted(instances.keys())[int(instance_spec)]
     instance: dict = instances[instance_spec]  # type: ignore
-    _config = yaml.safe_load(get_config_path(config_path).read_text())
-    env = DockerEnvironment(**(_config.get("environment", {}) | {"image": get_swebench_docker_image_name(instance)}))
+    config = yaml.safe_load(get_config_path(config_path).read_text())
+    config.setdefault("environment", {}).setdefault("environment_class", environment_class)
+    if exit_immediately:
+        config.setdefault("agent", {})["confirm_exit"] = False
+    env = get_sb_environment(config, instance)
     agent = InteractiveAgent(
-        get_model(model_name, _config.get("model", {})),
+        get_model(model_name, config.get("model", {})),
         env,
-        **(_config.get("agent", {}) | {"mode": "yolo"}),
+        **(config.get("agent", {}) | {"mode": "yolo"}),
     )
     agent.run(instance["problem_statement"])

minisweagent/run/mini.py CHANGED Viewed

@@ -14,9 +14,9 @@ from prompt_toolkit.history import FileHistory
 from prompt_toolkit.shortcuts import PromptSession
 from rich.console import Console
-from minisweagent import Environment, Model, global_config_dir
+from minisweagent import global_config_dir
 from minisweagent.agents.interactive import InteractiveAgent
-from minisweagent.agents.interactive_textual import AgentApp
+from minisweagent.agents.interactive_textual import TextualAgent
 from minisweagent.config import builtin_config_dir, get_config_path
 from minisweagent.environments.local import LocalEnvironment
 from minisweagent.models import get_model
@@ -41,36 +41,6 @@ More information about the usage: [bold green]https://mini-swe-agent.com/latest/
 """
-def run_interactive(model: Model, env: Environment, agent_config: dict, task: str, output: Path | None = None) -> Any:
-    agent = InteractiveAgent(
-        model,
-        env,
-        **agent_config,
-    )
-    exit_status, result = None, None
-    try:
-        exit_status, result = agent.run(task)
-    finally:
-        if output:
-            save_traj(agent, output, exit_status=exit_status, result=result)
-    return agent
-def run_textual(model: Model, env: Environment, agent_config: dict, task: str, output: Path | None = None) -> Any:
-    agent_app = AgentApp(
-        model,
-        env,
-        task,
-        **agent_config,
-    )
-    try:
-        agent_app.run()
-    finally:
-        if output:
-            save_traj(agent_app.agent, output, exit_status=agent_app.exit_status, result=agent_app.result)
 @app.command(help=_HELP_TEXT)
 def main(
     visual: bool = typer.Option(
@@ -119,10 +89,17 @@ def main(
     env = LocalEnvironment(**config.get("env", {}))
     # Both visual flag and the MSWEA_VISUAL_MODE_DEFAULT flip the mode, so it's essentially a XOR
+    agent_class = InteractiveAgent
     if visual == (os.getenv("MSWEA_VISUAL_MODE_DEFAULT", "false") == "false"):
-        return run_textual(model, env, config["agent"], task, output)  # type: ignore[arg-type]
-    else:
-        return run_interactive(model, env, config["agent"], task, output)  # type: ignore[arg-type]
+        agent_class = TextualAgent
+    exit_status, result = None, None
+    agent = agent_class(model, env, **config.get("agent", {}))
+    try:
+        exit_status, result = agent.run(task)  # type: ignore[arg-type]
+    finally:
+        if output:
+            save_traj(agent, output, exit_status=exit_status, result=result)  # type: ignore[arg-type]
+    return agent
 if __name__ == "__main__":

{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/WHEEL RENAMED Viewed

File without changes

{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/licenses/LICENSE.md RENAMED Viewed

File without changes

{mini_swe_agent-1.6.0.dist-info → mini_swe_agent-1.8.0.dist-info}/top_level.txt RENAMED Viewed

File without changes

mini-swe-agent 1.6.0__py3-none-any.whl → 1.8.0__py3-none-any.whl

mini-swe-agent 1.6.0-py3-none-any.whl → 1.8.0-py3-none-any.whl