Turn off auto linting by default, and on for swe_bench (#1861)

Disable Python linting by default, and turn it on for SWE Bench. It is turned off by default since this behavior is weird and somewhat annoying to end users. It is turned on for SWE Bench because linting python files gives LLM a chance to fix the indentations.
2026-01-09 14:57:59 -05:00 · 2024-05-17 21:04:38 -07:00
parent 94a9ec76b0
commit a57a213c7c
7 changed files with 17 additions and 5 deletions
--- a/evaluation/swe_bench/README.md
+++ b/evaluation/swe_bench/README.md
@@ -43,8 +43,10 @@ sandbox_type = "ssh"
 use_host_network = true
 ssh_hostname = "localhost"
 sandbox_timeout = 120
+
 # SWEBench eval specific
 run_as_devin = false
+enable_auto_lint = true

 # TODO: Change these to the model you want to evaluate
 [eval_gpt4_1106_preview]
--- a/evaluation/swe_bench/swe_env_box.py
+++ b/evaluation/swe_bench/swe_env_box.py
@@ -73,6 +73,10 @@ class SWEBenchSSHBox(DockerSSHBox):
            )
        config.workspace_base = workspace_mount_path
        config.workspace_mount_path = workspace_mount_path
+
+        # linting python after editing helps LLM fix indentations
+        config.enable_auto_lint = True
+
        sandbox = cls(
            container_image=SWE_BENCH_CONTAINER_IMAGE,
            swe_instance_id=instance['instance_id'],
--- a/opendevin/core/config.py
+++ b/opendevin/core/config.py
@@ -94,6 +94,9 @@ class AppConfig(metaclass=Singleton):
    sandbox_timeout: int = 120
    github_token: str | None = None
    debug: bool = False
+    enable_auto_lint: bool = (
+        False  # once enabled, OpenDevin would lint files after editing
+    )

    defaults_dict: ClassVar[dict] = {}

--- a/opendevin/runtime/docker/ssh_box.py
+++ b/opendevin/runtime/docker/ssh_box.py
@@ -1,5 +1,4 @@
 import atexit
-import json
 import os
 import re
 import sys
@@ -265,8 +264,6 @@ class DockerSSHBox(Sandbox):

    def add_to_env(self, key: str, value: str):
        super().add_to_env(key, value)
-        # Note: json.dumps gives us nice escaping for free
-        self.execute(f'export {key}={json.dumps(value)}')

    def setup_user(self):
        # Make users sudoers passwordless
--- a/opendevin/runtime/plugins/swe_agent_commands/cursors_edit_linting.sh
+++ b/opendevin/runtime/plugins/swe_agent_commands/cursors_edit_linting.sh
@@ -36,7 +36,7 @@ edit() {
    # Write the new stuff directly back into the original file
    printf "%s\n" "${new_lines[@]}" >| "$CURRENT_FILE"
    # Run linter if enabled
-    if [[ $CURRENT_FILE == *.py && -n "$RUN_LINT_AFTER_EDIT" ]]; then
+    if [[ $CURRENT_FILE == *.py && -n "$ENABLE_AUTO_LINT" ]]; then
        lint_output=$(flake8 --isolated --select=F821,F822,F831,E111,E112,E113,E999,E902 "$CURRENT_FILE" 2>&1)
    else
        # do nothing
--- a/opendevin/runtime/plugins/swe_agent_commands/edit_linting.sh
+++ b/opendevin/runtime/plugins/swe_agent_commands/edit_linting.sh
@@ -68,7 +68,7 @@ edit() {
    printf "%s\n" "${new_lines[@]}" >| "$CURRENT_FILE"

    # Run linter if enabled
-    if [[ $CURRENT_FILE == *.py && -n "$RUN_LINT_AFTER_EDIT" ]]; then
+    if [[ $CURRENT_FILE == *.py && -n "$ENABLE_AUTO_LINT" ]]; then
        lint_output=$(flake8 --isolated --select=F821,F822,F831,E111,E112,E113,E999,E902 "$CURRENT_FILE" 2>&1)
    else
        # do nothing
--- a/opendevin/runtime/sandbox.py
+++ b/opendevin/runtime/sandbox.py
@@ -1,6 +1,8 @@
+import json
 import os
 from abc import ABC, abstractmethod

+from opendevin.core.config import config
 from opendevin.core.schema import CancellableStream
 from opendevin.runtime.docker.process import Process
 from opendevin.runtime.plugins.mixin import PluginMixin
@@ -15,9 +17,13 @@ class Sandbox(ABC, PluginMixin):
            if key.startswith('SANDBOX_ENV_'):
                sandbox_key = key.removeprefix('SANDBOX_ENV_')
                self.add_to_env(sandbox_key, os.environ[key])
+        if config.enable_auto_lint:
+            self.add_to_env('ENABLE_AUTO_LINT', 'true')

    def add_to_env(self, key: str, value: str):
        self._env[key] = value
+        # Note: json.dumps gives us nice escaping for free
+        self.execute(f'export {key}={json.dumps(value)}')

    @abstractmethod
    def execute(