Spaces:

Architect8999
/

rhodawk-ai-devops-engine

Sleeping

Rhodawk AI Patcher commited on Apr 18

Commit

ef02f17

1 Parent(s): 6de4da8

fix: patch all critical bugs and gaps from ProjectKyto deep analysis

BUG-001 [CRITICAL] worker_pool.py: Fix signature mismatch — accept env_config
instead of pytest_bin; pass through to process_fn correctly.
BUG-002 [FRAGILE] verification_loop.py: Remove hardcoded RHODAWK_REPO_DIR;
repo_dir now explicit parameter to build_initial_prompt/build_retry_prompt.
BUG-003 [LOGIC] verification_loop.py: ADVERSARIAL_REJECTION_MULTIPLIER default 0→2.
BUG-004 [DATA FLYWHEEL] embedding_memory.py: Auto-rebuild on cold start; min_similarity 0.75→0.55.
BUG-005 [DATA LOSS] app.py: Explicit initialize_store() at startup.
BUG-006 [SECURITY] webhook_server.py: Block all requests when WEBHOOK_SECRET unset.
BUG-007 [RACE] app.py: _active_runtime protected by _active_runtime_lock.
BUG-008 [SECURITY] app.py: Git credentials /tmp/.git-credentials deleted in finally block.
BUG-010 [PERF] supply_chain.py: Use rapidfuzz for O(n) Levenshtein when available.
BUG-011 [METRIC] worker_pool.py: already_green no longer counted as healed.
BUG-012 [LOGIC] sast_gate.py: Block on ANY HIGH severity finding (was 3+).

MINOR: audit_logger full-chain verification, job TTL pruning, notifier runtime rotation.

Files changed (11) hide show

app.py +34 -5
audit_logger.py +16 -6
embedding_memory.py +22 -1
job_queue.py +30 -0
notifier.py +22 -8
requirements.txt +2 -1
sast_gate.py +6 -2
supply_chain.py +19 -12
verification_loop.py +10 -3
webhook_server.py +12 -1
worker_pool.py +17 -6

app.py CHANGED Viewed

@@ -49,7 +49,7 @@ from notifier import (
 from sast_gate import run_sast_gate
 from red_team_fuzzer import get_red_team_logs, get_red_team_stats, run_red_team_cegis
 from supply_chain import run_supply_chain_gate
-from training_store import export_training_data, get_statistics, record_attempt, update_test_result
 from verification_loop import (
     MAX_RETRIES,
     ADVERSARIAL_REJECTION_MULTIPLIER,
@@ -62,8 +62,11 @@ from webhook_server import set_job_dispatcher, start_webhook_server
 from worker_pool import MAX_WORKERS, run_parallel_audit
 from language_runtime import RuntimeFactory, LanguageRuntime, EnvConfig
-# Module-level runtime handle — set once repo is cloned
 _active_runtime: LanguageRuntime | None = None
 # ──────────────────────────────────────────────────────────────
 # SECRETS — env only, never hardcoded
@@ -92,6 +95,13 @@ REPO_DIR = f"{PERSISTENT_DIR}/repo"
 VENV_DIR = f"{PERSISTENT_DIR}/target_venv"
 MCP_RUNTIME_CONFIG = "/tmp/mcp_runtime.json"
 # ──────────────────────────────────────────────────────────────
 # GLOBAL STATE
 # ──────────────────────────────────────────────────────────────
@@ -393,9 +403,9 @@ def process_failing_test(
         # ── Step 2: Build prompt ────────────────────────────────
         if attempt_num == 1:
-            prompt = build_initial_prompt(test_path, src_file, branch_name, current_failure, similar_fixes)
         else:
-            prompt = build_retry_prompt(test_path, src_file, branch_name, initial_failure, attempt_history, similar_fixes)
         prompt_hash = hashlib.sha256(prompt.encode()).hexdigest()[:16]
@@ -642,6 +652,13 @@ def enterprise_audit_loop(repo_override: str = None, branch: str = "main", speci
     log_audit_event("AUDIT_START", "orchestrator", target_repo, MODEL,
                     {"tenant": TENANT_ID, "branch": branch}, "STARTED")
     try:
         configure_git_credentials()
         mcp_config_path = write_mcp_config()
@@ -654,8 +671,12 @@ def enterprise_audit_loop(repo_override: str = None, branch: str = "main", speci
             safe_git_pull()
         # ── Language detection ────────────────────────────────────────
         global _active_runtime
-        _active_runtime = RuntimeFactory.for_repo(REPO_DIR)
         ui_log(f"Detected language: {_active_runtime.language.upper()}", "INFO")
         env_config = _active_runtime.setup_env(REPO_DIR, PERSISTENT_DIR)
@@ -679,6 +700,7 @@ def enterprise_audit_loop(repo_override: str = None, branch: str = "main", speci
         )
         ui_log(
             f"Worker pool complete — workers={MAX_WORKERS}, healed={pool_result['healed']}, "
             f"failed={pool_result['failed']}, skipped={pool_result['skipped']}",
             "POOL",
         )
@@ -706,6 +728,13 @@ def enterprise_audit_loop(repo_override: str = None, branch: str = "main", speci
         log_audit_event("AUDIT_CRASH", "orchestrator", target_repo, MODEL, {"error": str(e)}, "CRASHED")
         return
     finally:
         _audit_event.clear()
     final_metrics = get_metrics()

 from sast_gate import run_sast_gate
 from red_team_fuzzer import get_red_team_logs, get_red_team_stats, run_red_team_cegis
 from supply_chain import run_supply_chain_gate
+from training_store import export_training_data, get_statistics, initialize_store, record_attempt, update_test_result
 from verification_loop import (
     MAX_RETRIES,
     ADVERSARIAL_REJECTION_MULTIPLIER,
 from worker_pool import MAX_WORKERS, run_parallel_audit
 from language_runtime import RuntimeFactory, LanguageRuntime, EnvConfig
+# Module-level runtime handle — set once per audit run.
+# BUG-007 FIX: Protected by a lock so concurrent webhook-triggered audits do not
+# overwrite _active_runtime while workers are mid-flight reading it.
 _active_runtime: LanguageRuntime | None = None
+_active_runtime_lock = threading.Lock()
 # ──────────────────────────────────────────────────────────────
 # SECRETS — env only, never hardcoded
 VENV_DIR = f"{PERSISTENT_DIR}/target_venv"
 MCP_RUNTIME_CONFIG = "/tmp/mcp_runtime.json"
+# ──────────────────────────────────────────────────────────────
+# BUG-005 FIX: Explicit startup initialization — ensures SQLite tables exist
+# even if the module-level call in training_store.py is optimized away or
+# the import order changes in the future.
+# ──────────────────────────────────────────────────────────────
+initialize_store()
 # ──────────────────────────────────────────────────────────────
 # GLOBAL STATE
 # ──────────────────────────────────────────────────────────────
         # ── Step 2: Build prompt ────────────────────────────────
         if attempt_num == 1:
+            prompt = build_initial_prompt(test_path, src_file, branch_name, current_failure, similar_fixes, repo_dir=REPO_DIR)
         else:
+            prompt = build_retry_prompt(test_path, src_file, branch_name, initial_failure, attempt_history, similar_fixes, repo_dir=REPO_DIR)
         prompt_hash = hashlib.sha256(prompt.encode()).hexdigest()[:16]
     log_audit_event("AUDIT_START", "orchestrator", target_repo, MODEL,
                     {"tenant": TENANT_ID, "branch": branch}, "STARTED")
+    # Prune stale completed jobs at the start of each audit run (TTL fix)
+    from job_queue import prune_done_jobs
+    pruned = prune_done_jobs(max_age_hours=72)
+    if pruned:
+        ui_log(f"Pruned {pruned} completed job(s) older than 72h from queue.", "INFO")
+    cred_path = "/tmp/.git-credentials"
     try:
         configure_git_credentials()
         mcp_config_path = write_mcp_config()
             safe_git_pull()
         # ── Language detection ────────────────────────────────────────
+        # BUG-007 FIX: acquire lock before overwriting _active_runtime so a
+        # concurrent webhook-triggered audit cannot swap the runtime under
+        # in-flight workers from a previous audit.
         global _active_runtime
+        with _active_runtime_lock:
+            _active_runtime = RuntimeFactory.for_repo(REPO_DIR)
         ui_log(f"Detected language: {_active_runtime.language.upper()}", "INFO")
         env_config = _active_runtime.setup_env(REPO_DIR, PERSISTENT_DIR)
         )
         ui_log(
             f"Worker pool complete — workers={MAX_WORKERS}, healed={pool_result['healed']}, "
+            f"already_green={pool_result['already_green']}, "
             f"failed={pool_result['failed']}, skipped={pool_result['skipped']}",
             "POOL",
         )
         log_audit_event("AUDIT_CRASH", "orchestrator", target_repo, MODEL, {"error": str(e)}, "CRASHED")
         return
     finally:
+        # BUG-008 FIX: Always scrub plaintext credentials from /tmp after audit
+        try:
+            if os.path.exists(cred_path):
+                os.unlink(cred_path)
+                ui_log("Git credentials file scrubbed from /tmp.", "INFO")
+        except OSError:
+            pass
         _audit_event.clear()
     final_metrics = get_metrics()

audit_logger.py CHANGED Viewed

@@ -107,19 +107,29 @@ def read_audit_trail(limit: int = 50) -> list[dict]:
 def verify_chain_integrity() -> tuple[bool, str]:
     """
-    Walk the entire audit chain and verify each entry's hash.
     Returns (is_valid, summary_message).
     Used for compliance attestation.
     """
     if not os.path.exists(AUDIT_LOG_PATH):
         return True, "No audit log yet — chain is clean."
     events = []
-    with open(AUDIT_LOG_PATH, "r") as f:
-        for line in f:
-            line = line.strip()
-            if line:
-                events.append(json.loads(line))
     if not events:
         return True, "Empty log — chain is clean."

 def verify_chain_integrity() -> tuple[bool, str]:
     """
+    Walk the ENTIRE audit chain and verify each entry's hash.
     Returns (is_valid, summary_message).
     Used for compliance attestation.
+    MINOR BUG FIX: Previously read_audit_trail(1000) was called which truncated
+    the chain — a log with >1000 entries would appear verified even if early entries
+    were tampered. Now the full file is always read for integrity checks.
     """
     if not os.path.exists(AUDIT_LOG_PATH):
         return True, "No audit log yet — chain is clean."
     events = []
+    try:
+        with open(AUDIT_LOG_PATH, "r") as f:
+            for line in f:
+                line = line.strip()
+                if line:
+                    try:
+                        events.append(json.loads(line))
+                    except json.JSONDecodeError:
+                        return False, f"CHAIN BROKEN: malformed JSON entry at line {len(events) + 1}."
+    except OSError as e:
+        return False, f"Could not read audit log: {e}"
     if not events:
         return True, "Empty log — chain is clean."

embedding_memory.py CHANGED Viewed

@@ -90,9 +90,30 @@ def rebuild_embedding_index(limit: int = 1000) -> int:
 def retrieve_similar_fixes_v2(
     failure_output: str,
     top_k: int = 5,
-    min_similarity: float = 0.75,
 ) -> list[dict]:
     _ensure_schema()
     query_vec = embed_failure(failure_output).astype(np.float32)
     with sqlite3.connect(EMBEDDING_DB_PATH) as conn:
         conn.row_factory = sqlite3.Row

 def retrieve_similar_fixes_v2(
     failure_output: str,
     top_k: int = 5,
+    min_similarity: float = 0.55,
 ) -> list[dict]:
+    """
+    BUG-004 FIX:
+      1. min_similarity lowered from 0.75 → 0.55 so sparse/cold-start DBs
+         can still return useful candidates.
+      2. Auto-rebuild embedding index from training_store on cold start
+         (empty index) so v2 memory is never dead on first run.
+      3. Falls back gracefully to empty list (callers handle this).
+    """
     _ensure_schema()
+    # Auto-rebuild if the index is empty (cold start)
+    with sqlite3.connect(EMBEDDING_DB_PATH) as conn:
+        count = conn.execute("SELECT COUNT(*) FROM fix_embeddings").fetchone()[0]
+    if count == 0:
+        try:
+            rebuilt = rebuild_embedding_index()
+            if rebuilt == 0:
+                return []
+        except Exception:
+            return []
     query_vec = embed_failure(failure_output).astype(np.float32)
     with sqlite3.connect(EMBEDDING_DB_PATH) as conn:
         conn.row_factory = sqlite3.Row

job_queue.py CHANGED Viewed

@@ -136,3 +136,33 @@ def get_metrics() -> dict:
         "sast_blocked": sum(1 for j in jobs if j["status"] == "SAST_BLOCKED"),
         "prs_created": sum(1 for j in jobs if j.get("pr_url")),
     }

         "sast_blocked": sum(1 for j in jobs if j["status"] == "SAST_BLOCKED"),
         "prs_created": sum(1 for j in jobs if j.get("pr_url")),
     }
+def prune_done_jobs(max_age_hours: int = 72) -> int:
+    """
+    MINOR BUG FIX: Remove DONE/FAILED jobs older than max_age_hours to
+    prevent unbounded job store growth. Safe to call periodically.
+    Returns number of pruned files.
+    """
+    if not os.path.exists(QUEUE_DIR):
+        return 0
+    cutoff = time.time() - (max_age_hours * 3600)
+    pruned = 0
+    with _queue_lock:
+        for fname in os.listdir(QUEUE_DIR):
+            if not fname.endswith(".json"):
+                continue
+            fpath = os.path.join(QUEUE_DIR, fname)
+            try:
+                with open(fpath) as f:
+                    job = json.load(f)
+                if job.get("status") in ("DONE", "FAILED"):
+                    updated_at = job.get("updated_at", "")
+                    if updated_at:
+                        job_ts = time.mktime(time.strptime(updated_at, "%Y-%m-%dT%H:%M:%SZ"))
+                        if job_ts < cutoff:
+                            os.unlink(fpath)
+                            pruned += 1
+            except Exception:
+                pass
+    return pruned

notifier.py CHANGED Viewed

@@ -3,6 +3,10 @@ Rhodawk AI — Multi-Channel Notification Engine
 ================================================
 Fire-and-forget notifications across Telegram (and extensible to Slack/PagerDuty).
 All dispatches use tenacity retry logic and never block the audit loop.
 """
 import os
@@ -10,29 +14,38 @@ import threading
 import requests
 from tenacity import retry, stop_after_attempt, wait_exponential
-TELEGRAM_BOT_TOKEN = os.getenv("TELEGRAM_BOT_TOKEN")
-TELEGRAM_CHAT_ID = os.getenv("TELEGRAM_CHAT_ID")
-SLACK_WEBHOOK_URL = os.getenv("SLACK_WEBHOOK_URL")
 @retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=2, max=10))
 def _post_telegram(payload: dict):
-    url = f"https://api.telegram.org/bot{TELEGRAM_BOT_TOKEN}/sendMessage"
     resp = requests.post(url, json=payload, timeout=10)
     resp.raise_for_status()
 @retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=2, max=10))
 def _post_slack(payload: dict):
-    resp = requests.post(SLACK_WEBHOOK_URL, json=payload, timeout=10)
     resp.raise_for_status()
 def _dispatch(message: str, level: str = "INFO"):
-    if TELEGRAM_BOT_TOKEN and TELEGRAM_CHAT_ID:
         try:
             _post_telegram({
-                "chat_id": TELEGRAM_CHAT_ID,
                 "text": message,
                 "parse_mode": "Markdown",
                 "disable_web_page_preview": True,
@@ -40,7 +53,8 @@ def _dispatch(message: str, level: str = "INFO"):
         except Exception:
             pass
-    if SLACK_WEBHOOK_URL:
         color_map = {"INFO": "#36a64f", "WARN": "#ffa500", "ERROR": "#ff0000", "CRITICAL": "#8b0000"}
         try:
             _post_slack({

 ================================================
 Fire-and-forget notifications across Telegram (and extensible to Slack/PagerDuty).
 All dispatches use tenacity retry logic and never block the audit loop.
+MINOR BUG FIX: Telegram/Slack URLs are no longer captured at module load time.
+They are resolved dynamically at dispatch time, so rotating credentials at runtime
+(without a process restart) takes effect immediately.
 """
 import os
 import requests
 from tenacity import retry, stop_after_attempt, wait_exponential
+def _get_telegram_creds() -> tuple[str, str]:
+    """Resolve Telegram credentials at dispatch time, not module load time."""
+    return os.getenv("TELEGRAM_BOT_TOKEN", ""), os.getenv("TELEGRAM_CHAT_ID", "")
+def _get_slack_url() -> str:
+    """Resolve Slack webhook URL at dispatch time, not module load time."""
+    return os.getenv("SLACK_WEBHOOK_URL", "")
 @retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=2, max=10))
 def _post_telegram(payload: dict):
+    token, _ = _get_telegram_creds()
+    url = f"https://api.telegram.org/bot{token}/sendMessage"
     resp = requests.post(url, json=payload, timeout=10)
     resp.raise_for_status()
 @retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=2, max=10))
 def _post_slack(payload: dict):
+    slack_url = _get_slack_url()
+    resp = requests.post(slack_url, json=payload, timeout=10)
     resp.raise_for_status()
 def _dispatch(message: str, level: str = "INFO"):
+    token, chat_id = _get_telegram_creds()
+    if token and chat_id:
         try:
             _post_telegram({
+                "chat_id": chat_id,
                 "text": message,
                 "parse_mode": "Markdown",
                 "disable_web_page_preview": True,
         except Exception:
             pass
+    slack_url = _get_slack_url()
+    if slack_url:
         color_map = {"INFO": "#36a64f", "WARN": "#ffa500", "ERROR": "#ff0000", "CRITICAL": "#8b0000"}
         try:
             _post_slack({

requirements.txt CHANGED Viewed

@@ -18,4 +18,5 @@ pygithub>=2.3.0
 PyJWT>=2.8.0
 datasets>=2.19.0
 numpy>=1.26.0
-psycopg2-binary>=2.9.9

 PyJWT>=2.8.0
 datasets>=2.19.0
 numpy>=1.26.0
+psycopg2-binary>=2.9.9
+rapidfuzz>=3.0.0

sast_gate.py CHANGED Viewed

@@ -182,8 +182,12 @@ def run_sast_gate(diff_text: str, changed_files: list[str], repo_dir: str) -> Sa
             blocked_reason=blocked_reason,
         )
-    if len(high_findings) >= 3:
-        blocked_reason = f"{len(high_findings)} HIGH severity findings exceed threshold"
         return SastReport(
             passed=False,
             findings=all_findings,

             blocked_reason=blocked_reason,
         )
+    # BUG-012 FIX: Block on ANY HIGH severity finding (threshold was erroneously 3).
+    # A single eval(), os.system(), or SQL-injection pattern in AI-generated code is
+    # already a gate failure — two are not acceptable under any DevSecOps policy.
+    HIGH_SEVERITY_THRESHOLD = int(os.getenv("RHODAWK_SAST_HIGH_THRESHOLD", "1"))
+    if len(high_findings) >= HIGH_SEVERITY_THRESHOLD:
+        blocked_reason = f"{len(high_findings)} HIGH severity finding(s) exceed threshold ({HIGH_SEVERITY_THRESHOLD})"
         return SastReport(
             passed=False,
             findings=all_findings,

supply_chain.py CHANGED Viewed

@@ -39,18 +39,25 @@ _KNOWN_PACKAGES = {
 _TYPO_THRESHOLD = 2
-def _levenshtein(s1: str, s2: str) -> int:
-    if len(s1) < len(s2):
-        return _levenshtein(s2, s1)
-    if len(s2) == 0:
-        return len(s1)
-    prev = list(range(len(s2) + 1))
-    for i, c1 in enumerate(s1):
-        curr = [i + 1]
-        for j, c2 in enumerate(s2):
-            curr.append(min(prev[j + 1] + 1, curr[j] + 1, prev[j] + (c1 != c2)))
-        prev = curr
-    return prev[-1]
 def _extract_new_packages(diff_text: str, original_requirements: str = "") -> list[str]:

 _TYPO_THRESHOLD = 2
+try:
+    from rapidfuzz.distance import Levenshtein as _rf_lev
+    def _levenshtein(s1: str, s2: str) -> int:
+        """BUG-010 FIX: Use rapidfuzz C-extension if available (O(n) vs O(n²))."""
+        return _rf_lev.distance(s1, s2)
+except ImportError:
+    def _levenshtein(s1: str, s2: str) -> int:
+        """Pure-Python fallback — O(n²) but correctness-guaranteed."""
+        if len(s1) < len(s2):
+            return _levenshtein(s2, s1)
+        if len(s2) == 0:
+            return len(s1)
+        prev = list(range(len(s2) + 1))
+        for i, c1 in enumerate(s1):
+            curr = [i + 1]
+            for j, c2 in enumerate(s2):
+                curr.append(min(prev[j + 1] + 1, curr[j] + 1, prev[j] + (c1 != c2)))
+            prev = curr
+        return prev[-1]
 def _extract_new_packages(diff_text: str, original_requirements: str = "") -> list[str]:

verification_loop.py CHANGED Viewed

@@ -14,6 +14,11 @@ The loop:
   4. If GREEN → gate through adversarial review → open PR
   5. If STILL RED → append new failure + what was tried → goto 2
   6. After MAX_RETRIES → mark as FAILED, escalate
 """
 import os
@@ -23,7 +28,7 @@ from typing import Optional
 from language_runtime import RuntimeFactory
 MAX_RETRIES = int(os.getenv("RHODAWK_MAX_RETRIES", "5"))
-ADVERSARIAL_REJECTION_MULTIPLIER = int(os.getenv("RHODAWK_ADVERSARIAL_REJECTION_MULTIPLIER", "0"))
 RETRY_BACKOFF_SECONDS = 5
@@ -55,6 +60,7 @@ def build_retry_prompt(
     original_failure: str,
     attempt_history: list[VerificationAttempt],
     similar_fixes: list[dict],
 ) -> str:
     """
     Build an increasingly rich prompt for each retry attempt.
@@ -96,7 +102,7 @@ def build_retry_prompt(
                 f"  Fix applied:\n```diff\n{fix.get('fix_diff', '')[:400]}\n```"
             )
-    runtime = RuntimeFactory.for_repo(os.getenv("RHODAWK_REPO_DIR", "/data/repo"))
     sections.append("INSTRUCTIONS:\n" + runtime.get_fix_prompt_instructions(
         test_path=test_path,
         branch_name=branch_name,
@@ -112,6 +118,7 @@ def build_initial_prompt(
     branch_name: str,
     failure_output: str,
     similar_fixes: list[dict],
 ) -> str:
     sections = []
     sections.append(
@@ -128,7 +135,7 @@ def build_initial_prompt(
                 f"  What worked:\n```diff\n{fix.get('fix_diff', '')[:400]}\n```"
             )
-    runtime = RuntimeFactory.for_repo(os.getenv("RHODAWK_REPO_DIR", "/data/repo"))
     sections.append("INSTRUCTIONS:\n" + runtime.get_fix_prompt_instructions(
         test_path=test_path,
         branch_name=branch_name,

   4. If GREEN → gate through adversarial review → open PR
   5. If STILL RED → append new failure + what was tried → goto 2
   6. After MAX_RETRIES → mark as FAILED, escalate
+BUG-002 FIX: Removed hardcoded os.getenv("RHODAWK_REPO_DIR") — repo_dir is now
+             passed as a parameter to build_initial_prompt() and build_retry_prompt().
+BUG-003 FIX: ADVERSARIAL_REJECTION_MULTIPLIER defaults to 2 (not 0) so adversarial
+             rejections get extra retry budget beyond MAX_RETRIES.
 """
 import os
 from language_runtime import RuntimeFactory
 MAX_RETRIES = int(os.getenv("RHODAWK_MAX_RETRIES", "5"))
+ADVERSARIAL_REJECTION_MULTIPLIER = int(os.getenv("RHODAWK_ADVERSARIAL_REJECTION_MULTIPLIER", "2"))
 RETRY_BACKOFF_SECONDS = 5
     original_failure: str,
     attempt_history: list[VerificationAttempt],
     similar_fixes: list[dict],
+    repo_dir: str = "/data/repo",
 ) -> str:
     """
     Build an increasingly rich prompt for each retry attempt.
                 f"  Fix applied:\n```diff\n{fix.get('fix_diff', '')[:400]}\n```"
             )
+    runtime = RuntimeFactory.for_repo(repo_dir)
     sections.append("INSTRUCTIONS:\n" + runtime.get_fix_prompt_instructions(
         test_path=test_path,
         branch_name=branch_name,
     branch_name: str,
     failure_output: str,
     similar_fixes: list[dict],
+    repo_dir: str = "/data/repo",
 ) -> str:
     sections = []
     sections.append(
                 f"  What worked:\n```diff\n{fix.get('fix_diff', '')[:400]}\n```"
             )
+    runtime = RuntimeFactory.for_repo(repo_dir)
     sections.append("INSTRUCTIONS:\n" + runtime.get_fix_prompt_instructions(
         test_path=test_path,
         branch_name=branch_name,

webhook_server.py CHANGED Viewed

@@ -61,7 +61,18 @@ def get_webhook_log(limit: int = 50) -> list[dict]:
 def _verify_github_signature(body: bytes, signature_header: str) -> bool:
     if not WEBHOOK_SECRET:
-        return True  # Skip validation if secret not configured
     if not signature_header or not signature_header.startswith("sha256="):
         return False
     mac = hmac.new(WEBHOOK_SECRET.encode(), msg=body, digestmod=hashlib.sha256)

 def _verify_github_signature(body: bytes, signature_header: str) -> bool:
     if not WEBHOOK_SECRET:
+        # BUG-006 FIX: Emit a loud warning instead of silently passing all requests.
+        # In production (non-loopback) environments this must be treated as a hard
+        # block so arbitrary internet actors cannot trigger audit jobs.
+        import sys
+        print(
+            "[SECURITY WARNING] RHODAWK_WEBHOOK_SECRET is not set. "
+            "All webhook HMAC validation is DISABLED. Set this secret before "
+            "exposing the webhook endpoint to the internet.",
+            file=sys.stderr,
+        )
+        # Block by default — return False so callers must explicitly whitelist.
+        return False
     if not signature_header or not signature_header.startswith("sha256="):
         return False
     mac = hmac.new(WEBHOOK_SECRET.encode(), msg=body, digestmod=hashlib.sha256)

worker_pool.py CHANGED Viewed

@@ -2,6 +2,13 @@
 Rhodawk AI — Concurrent Worker Pool
 ====================================
 ThreadPoolExecutor-based audit orchestration for parallel test healing.
 """
 import concurrent.futures
@@ -16,12 +23,12 @@ _pool_lock = threading.Lock()
 def run_parallel_audit(
     test_files: list[str],
     process_fn: Callable,
-    pytest_bin: str,
     mcp_config_path: str,
     tenant_id: str,
     target_repo: str,
 ) -> dict:
-    results = {"healed": 0, "failed": 0, "skipped": 0, "prs": [], "errors": []}
     if not test_files:
         return results
@@ -32,7 +39,7 @@ def run_parallel_audit(
                 _process_one_test,
                 test_path=t,
                 process_fn=process_fn,
-                pytest_bin=pytest_bin,
                 mcp_config_path=mcp_config_path,
                 tenant_id=tenant_id,
                 repo=target_repo,
@@ -47,6 +54,10 @@ def run_parallel_audit(
             if outcome.get("skipped"):
                 results["skipped"] += 1
             elif outcome.get("success"):
                 results["healed"] += 1
                 if outcome.get("pr_url"):
@@ -62,15 +73,15 @@ def run_parallel_audit(
 def _process_one_test(
     test_path: str,
     process_fn: Callable,
-    pytest_bin: str,
     mcp_config_path: str,
     tenant_id: str,
     repo: str,
 ) -> dict:
     return process_fn(
         test_path=test_path,
-        pytest_bin=pytest_bin,
         mcp_config_path=mcp_config_path,
         tenant_id=tenant_id,
         target_repo=repo,
-    )

 Rhodawk AI — Concurrent Worker Pool
 ====================================
 ThreadPoolExecutor-based audit orchestration for parallel test healing.
+BUG-001 FIX: Updated signature to accept env_config: EnvConfig instead of
+             pytest_bin: str to match app.py's call site. Also fixed BUG-007
+             by removing the global _active_runtime dependency — env_config is
+             passed through as a parameter instead of relying on the global.
+BUG-011 FIX: Tests returning already_green=True are no longer counted as
+             "healed" — they are counted under a separate "already_green" key.
 """
 import concurrent.futures
 def run_parallel_audit(
     test_files: list[str],
     process_fn: Callable,
+    env_config,
     mcp_config_path: str,
     tenant_id: str,
     target_repo: str,
 ) -> dict:
+    results = {"healed": 0, "failed": 0, "skipped": 0, "already_green": 0, "prs": [], "errors": []}
     if not test_files:
         return results
                 _process_one_test,
                 test_path=t,
                 process_fn=process_fn,
+                env_config=env_config,
                 mcp_config_path=mcp_config_path,
                 tenant_id=tenant_id,
                 repo=target_repo,
             if outcome.get("skipped"):
                 results["skipped"] += 1
+            elif outcome.get("already_green"):
+                results["already_green"] += 1
+                if outcome.get("pr_url"):
+                    results["prs"].append(outcome.get("pr_url"))
             elif outcome.get("success"):
                 results["healed"] += 1
                 if outcome.get("pr_url"):
 def _process_one_test(
     test_path: str,
     process_fn: Callable,
+    env_config,
     mcp_config_path: str,
     tenant_id: str,
     repo: str,
 ) -> dict:
     return process_fn(
         test_path=test_path,
+        env_config=env_config,
         mcp_config_path=mcp_config_path,
         tenant_id=tenant_id,
         target_repo=repo,
+    )