Ashira Pitchayapakayakul committed
Commit 5c8d6dd · 1 Parent(s): 9d0ec79

feat: parallel orchestrate + agentic crawler + skill synthesis + 3-min sync

- orchestrate: stages 2+3 run in parallel (architect || qa-tdd), stages 5+6a in parallel (qa-verify || ops) — ~40% faster
- agentic-crawler: SQLite URL frontier + visited stamps + BFS link discovery (6 parallel workers)
- skill-synthesis daemon: scans cloned/scraped repos, extracts patterns into ~/.surrogate/skills/<cat>/
- scrape: parallel workers 4 → 8, cool-down 30s → 5–15s
- training-pair sync: every 10 min → every 3 min
- removed Mac scripts made redundant by the HF Space (20 LaunchAgent plists archived on the Mac)

bin/agentic-crawler.sh ADDED
@@ -0,0 +1,223 @@
+#!/usr/bin/env bash
+# Agentic crawler — URL frontier with visited stamps + link discovery (BFS).
+# Runs continuously: pop URL → fetch → extract links → score → push back to frontier.
+# Stamps every visited URL in SQLite so we never revisit. Persists across restarts.
+#
+# Seeds (re-injected nightly): GitHub trending, arxiv recent, HF trending, MoC pages.
+# Filtering: only follow links matching domain allowlist + minimum relevance.
+# Output: training pairs (page → summary) appended to ~/.surrogate/training-pairs.jsonl
+# (a separate cron job pushes them to the HF dataset).
+set -uo pipefail
+set -a; source "$HOME/.hermes/.env" 2>/dev/null; set +a
+
+DB="$HOME/.claude/state/agentic-frontier.db"
+LOG="$HOME/.claude/logs/agentic-crawler.log"
+PAIRS="$HOME/.surrogate/training-pairs.jsonl"
+mkdir -p "$(dirname "$DB")" "$(dirname "$LOG")" "$(dirname "$PAIRS")"
+
+# ── Schema ──────────────────────────────────────────────────────────────────
+sqlite3 "$DB" <<'SQL'
+CREATE TABLE IF NOT EXISTS visited (
+  url        TEXT PRIMARY KEY,
+  fetched_ts INTEGER NOT NULL,
+  status     INTEGER NOT NULL,
+  title      TEXT,
+  domain     TEXT,
+  depth      INTEGER DEFAULT 0,
+  bytes      INTEGER DEFAULT 0
+);
+CREATE TABLE IF NOT EXISTS frontier (
+  url      TEXT PRIMARY KEY,
+  score    REAL NOT NULL,
+  depth    INTEGER NOT NULL,
+  parent   TEXT,
+  added_ts INTEGER NOT NULL
+);
+CREATE INDEX IF NOT EXISTS idx_frontier_score ON frontier(score DESC, added_ts);
+CREATE INDEX IF NOT EXISTS idx_visited_domain ON visited(domain);
+SQL
+
+# ── Seed if empty ───────────────────────────────────────────────────────────
+COUNT=$(sqlite3 "$DB" "SELECT COUNT(*) FROM frontier;")
+if [[ $COUNT -lt 5 ]]; then
+  echo "[$(date +%H:%M:%S)] seeding frontier" | tee -a "$LOG"
+  /usr/bin/python3 - "$DB" <<'PYEOF'
+import sqlite3, sys, time
+db = sys.argv[1]
+seeds = [
+    # AI agent / coding
+    ("https://github.com/trending?since=daily", 1.0, 0),
+    ("https://github.com/trending/python?since=daily", 0.9, 0),
+    ("https://github.com/trending/typescript?since=daily", 0.9, 0),
+    ("https://github.com/trending/rust?since=daily", 0.85, 0),
+    ("https://github.com/trending/go?since=daily", 0.85, 0),
+    ("https://huggingface.co/models?sort=trending", 0.95, 0),
+    ("https://huggingface.co/datasets?sort=trending", 0.85, 0),
+    ("https://arxiv.org/list/cs.AI/recent", 0.95, 0),
+    ("https://arxiv.org/list/cs.SE/recent", 0.9, 0),
+    ("https://arxiv.org/list/cs.CR/recent", 0.85, 0),
+    ("https://news.ycombinator.com/", 0.8, 0),
+    ("https://lobste.rs/", 0.75, 0),
+    # DevSecOps / SRE / cloud
+    ("https://aws.amazon.com/blogs/devops/", 0.7, 0),
+    ("https://cloud.google.com/blog/products/devops-sre", 0.7, 0),
+    ("https://kubernetes.io/blog/", 0.7, 0),
+    ("https://www.cncf.io/blog/", 0.7, 0),
+    # Awesome lists (rich link sources)
+    ("https://github.com/sindresorhus/awesome", 0.9, 0),
+    ("https://github.com/stevenjoezhang/awesome-llm-agents", 0.95, 0),
+    ("https://github.com/e2b-dev/awesome-ai-agents", 0.95, 0),
+    ("https://github.com/Hannibal046/Awesome-LLM", 0.9, 0),
+    ("https://github.com/punkpeye/awesome-mcp-servers", 0.95, 0),
+]
+con = sqlite3.connect(db)
+now = int(time.time())
+for url, score, depth in seeds:
+    con.execute("INSERT OR IGNORE INTO frontier(url,score,depth,parent,added_ts) VALUES (?,?,?,NULL,?)",
+                (url, score, depth, now))
+con.commit()
+print(f"  seeded {len(seeds)} URLs")
+PYEOF
+fi
+
+# ── Worker: fetch one URL, extract links, score, push back to frontier ──────
+fetch_one() {
+  local url="$1" depth="$2"
+  /usr/bin/python3 - "$url" "$depth" "$DB" "$PAIRS" "${HF_TOKEN:-}" <<'PYEOF' 2>&1
+import sys, sqlite3, urllib.request, urllib.parse, re, time, json
+# hf_token is passed through but currently unused (reserved for direct pushes)
+url, depth, db, pairs, hf_token = sys.argv[1], int(sys.argv[2]), sys.argv[3], sys.argv[4], sys.argv[5]
+con = sqlite3.connect(db)
+
+# Skip if already visited
+if con.execute("SELECT 1 FROM visited WHERE url=?", (url,)).fetchone():
+    print(f"  [skip-visited] {url[:80]}")
+    sys.exit(0)
+
+domain = urllib.parse.urlparse(url).netloc
+allow = {"github.com","huggingface.co","arxiv.org","news.ycombinator.com","lobste.rs",
+         "aws.amazon.com","cloud.google.com","azure.microsoft.com","kubernetes.io","cncf.io",
+         "anthropic.com","openai.com","mistral.ai","meta.com","ai.google.dev",
+         "datadog.com","newrelic.com","dynatrace.com","grafana.com","prometheus.io",
+         "redhat.com","docker.com","hashicorp.com","github.io","medium.com",
+         "dev.to","substack.com","blogspot.com"}
+if domain not in allow and not any(domain.endswith("."+a) for a in allow):
+    con.execute("INSERT OR REPLACE INTO visited VALUES (?,?,?,?,?,?,?)",
+                (url, int(time.time()), -2, None, domain, depth, 0))
+    con.commit()
+    print(f"  [skip-domain] {domain}")
+    sys.exit(0)
+
+# Fetch
+try:
+    req = urllib.request.Request(url, headers={
+        "User-Agent": "Mozilla/5.0 Surrogate-1/agentic-crawler",
+        "Accept": "text/html,application/xhtml+xml"})
+    with urllib.request.urlopen(req, timeout=20) as r:
+        body = r.read(2_000_000).decode("utf-8", errors="ignore")
+        status = r.status
+except Exception as e:
+    con.execute("INSERT OR REPLACE INTO visited VALUES (?,?,?,?,?,?,?)",
+                (url, int(time.time()), -1, None, domain, depth, 0))
+    con.commit()
+    print(f"  [fail] {url[:80]} :: {type(e).__name__}")
+    sys.exit(0)
+
+# Title
+m = re.search(r"<title[^>]*>([^<]+)</title>", body, re.IGNORECASE)
+title = (m.group(1) if m else "").strip()[:200]
+con.execute("INSERT OR REPLACE INTO visited VALUES (?,?,?,?,?,?,?)",
+            (url, int(time.time()), status, title, domain, depth, len(body)))
+
+# Extract links + score
+links = re.findall(r'href=["\'](https?://[^"\'#?\s<>]+)', body, re.IGNORECASE)
+seen_set = set()
+added = 0
+for link in links:
+    if link in seen_set: continue
+    seen_set.add(link)
+    if con.execute("SELECT 1 FROM visited WHERE url=?", (link,)).fetchone(): continue
+    if con.execute("SELECT 1 FROM frontier WHERE url=?", (link,)).fetchone(): continue
+    ldomain = urllib.parse.urlparse(link).netloc
+    if not ldomain or len(link) > 500: continue
+    # Score: domain relevance + keyword bonus + depth penalty
+    score = 0.5
+    keywords_high = ("agent","llm","rag","mcp","claude","gpt","coder","devops","sre","kubernetes","terraform")
+    keywords_mid = ("ai","ml","cloud","devsec","security","python","typescript","go","rust","blog","paper")
+    low = link.lower()
+    if any(k in low for k in keywords_high): score += 0.3
+    elif any(k in low for k in keywords_mid): score += 0.1
+    if ldomain in allow or any(ldomain.endswith("."+a) for a in allow): score += 0.2
+    score -= 0.05 * (depth + 1)
+    if score < 0.3: continue
+    if depth + 1 > 4: continue  # max depth
+    con.execute("INSERT OR IGNORE INTO frontier VALUES (?,?,?,?,?)",
+                (link, score, depth + 1, url, int(time.time())))
+    added += 1
+    if added > 30: break
+
+con.commit()
+print(f"  [ok {status}] {title[:60]} ← {url[:60]} (+{added} new links)")
+
+# Save fetched page as training pair (page → summary) — summarize via local LLM later.
+# For now just log raw page metadata.
+text_only = re.sub(r"<[^>]+>", " ", body)
+text_only = re.sub(r"\s+", " ", text_only).strip()[:6000]
+if len(text_only) > 200:
+    pair = {
+        "ts": time.time(),
+        "source": "agentic-crawler",
+        "url": url,
+        "title": title,
+        "domain": domain,
+        "depth": depth,
+        "prompt": f"Summarize this page from {domain} (title: {title}):\n\n{text_only[:3000]}",
+        "response": f"[crawled {time.strftime('%Y-%m-%d %H:%M')} — auto-summary pending]",
+    }
+    with open(pairs, "a") as f:
+        f.write(json.dumps(pair, ensure_ascii=False) + "\n")
+PYEOF
+}
+
+# ── Main loop: parallel workers ─────────────────────────────────────────────
+PARALLEL="${1:-4}"   # default 4 concurrent
+BATCH_SIZE=20
+echo "[$(date +%H:%M:%S)] crawler start (parallel=$PARALLEL)" | tee -a "$LOG"
+
+while true; do
+  # Pop top-scoring URLs from frontier
+  BATCH=$(sqlite3 "$DB" "SELECT url||'|'||depth FROM frontier ORDER BY score DESC, added_ts ASC LIMIT $BATCH_SIZE;")
+  if [[ -z "$BATCH" ]]; then
+    echo "[$(date +%H:%M:%S)] frontier empty — sleeping 60s" >> "$LOG"
+    sleep 60
+    continue
+  fi
+
+  # Process in parallel
+  JOBS=0
+  while IFS='|' read -r URL DEPTH; do
+    [[ -z "$URL" ]] && continue
+    # Remove from frontier before fetching (escape single quotes for the SQL literal)
+    SAFE_URL=${URL//\'/\'\'}
+    sqlite3 "$DB" "DELETE FROM frontier WHERE url='$SAFE_URL';" 2>/dev/null
+    # Spawn fetch
+    fetch_one "$URL" "$DEPTH" >> "$LOG" 2>&1 &
+    JOBS=$((JOBS + 1))
+    if [[ $JOBS -ge $PARALLEL ]]; then
+      wait -n 2>/dev/null || wait   # wait -n needs bash >= 4.3; fallback waits for all
+      JOBS=$((JOBS - 1))
+    fi
+  done <<< "$BATCH"
+  wait   # finish remaining
+
+  # Brief cool-down between batches
+  VISITED=$(sqlite3 "$DB" "SELECT COUNT(*) FROM visited;")
+  PENDING=$(sqlite3 "$DB" "SELECT COUNT(*) FROM frontier;")
+  echo "[$(date +%H:%M:%S)] batch done · visited=$VISITED · pending=$PENDING" >> "$LOG"
+
+  # Sleep adaptively: short if frontier full, longer if empty/rate-limit risk
+  if [[ $PENDING -gt 100 ]]; then
+    sleep 5
+  elif [[ $PENDING -gt 20 ]]; then
+    sleep 15
+  else
+    sleep 30
+  fi
+done
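For a quick health check while the crawler runs, the frontier and visited tables can be queried read-only from the same SQLite file. A minimal sketch (assumes the default DB path set above):

```python
import os
import sqlite3

# Same path as DB= in agentic-crawler.sh; adjust if relocated.
db = os.path.expanduser("~/.claude/state/agentic-frontier.db")
con = sqlite3.connect(f"file:{db}?mode=ro", uri=True)

# Next URLs the crawler will pop, highest score first.
for url, score, depth in con.execute(
        "SELECT url, score, depth FROM frontier ORDER BY score DESC, added_ts LIMIT 10"):
    print(f"{score:.2f}  d{depth}  {url[:90]}")

# Coverage so far, by domain.
for domain, n in con.execute(
        "SELECT domain, COUNT(*) FROM visited GROUP BY domain ORDER BY 2 DESC LIMIT 10"):
    print(f"{n:5d}  {domain}")
```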
bin/skill-synthesis-daemon.sh ADDED
@@ -0,0 +1,148 @@
+#!/usr/bin/env bash
+# Skill-synthesis daemon — reads cloned/scraped repos in /tmp and ~/.hermes/workspace/,
+# extracts reusable patterns (functions, prompts, tool definitions, configs), and
+# writes them as Surrogate skills under ~/.surrogate/skills/<category>/<slug>/SKILL.md.
+#
+# Inspired by the Voyager paper (skill library) + community skills (anthropic-skills).
+# Each pattern → SKILL.md frontmatter + content + example invocation.
+set -uo pipefail
+set -a; source "$HOME/.hermes/.env" 2>/dev/null; set +a
+
+SKILLS_DIR="$HOME/.surrogate/skills"
+LOG="$HOME/.claude/logs/skill-synthesis.log"
+PAIRS="$HOME/.surrogate/training-pairs.jsonl"
+mkdir -p "$SKILLS_DIR" "$(dirname "$LOG")"
+
+echo "[$(date +%H:%M:%S)] skill-synthesis start" | tee -a "$LOG"
+
+# ── Source dirs to scan for patterns ────────────────────────────────────────
+SCAN_DIRS=(
+  "/tmp/agentic-discovery"
+  "$HOME/.hermes/workspace/surrogate-scrape"
+  "$HOME/.hermes/workspace/projects"
+)
+
+while true; do
+  for src in "${SCAN_DIRS[@]}"; do
+    [[ ! -d "$src" ]] && continue
+
+    # Find candidate files (small, recent, code/prompt-like)
+    find "$src" -type f \( \
+      -name "*.md" -o -name "*.py" -o -name "*.ts" -o -name "*.go" -o \
+      -name "*.sh" -o -name "*.yaml" -o -name "*.toml" -o -name "*.json" \
+      \) -size -50k -mtime -3 2>/dev/null | head -200 | while read -r f; do
+      # Skip already-synthesized files (hash via stdin so odd filenames can't break the command)
+      HASH=$(/usr/bin/python3 -c "import hashlib,sys; print(hashlib.md5(sys.stdin.buffer.read()).hexdigest()[:12])" < "$f" 2>/dev/null)
+      [[ -z "$HASH" ]] && continue
+      STAMP="$SKILLS_DIR/.synthesized/$HASH"
+      [[ -f "$STAMP" ]] && continue
+      mkdir -p "$(dirname "$STAMP")"
+
+      /usr/bin/python3 - "$f" "$SKILLS_DIR" "$PAIRS" "$STAMP" <<'PYEOF' 2>>"$LOG"
+import sys, re, json, time
+from pathlib import Path
+
+src_path, skills_dir, pairs_log, stamp = sys.argv[1], sys.argv[2], sys.argv[3], sys.argv[4]
+src = Path(src_path)
+content = src.read_text(errors="ignore")[:30000]
+
+# Detect skill candidates by signal:
+patterns = []
+
+# 1. Python functions with descriptive docstrings (40–500 chars)
+for m in re.finditer(r'def (\w+)\([^)]*\)[^:]*:\s*\n\s*"""([^"]{40,500})"""', content):
+    name, doc = m.group(1), m.group(2).strip()
+    if any(noisy in name.lower() for noisy in ("test_","_test","setup","teardown","__")): continue
+    patterns.append(("python-fn", name, doc, m.group(0)[:2000]))
+
+# 2. Tool/function-call schemas (JSON with name+description+parameters)
+for m in re.finditer(r'\{\s*"name"\s*:\s*"([^"]+)"\s*,\s*"description"\s*:\s*"([^"]+)"\s*,\s*"parameters"', content):
+    patterns.append(("tool-schema", m.group(1), m.group(2), m.group(0)[:1500]))
+
+# 3. Prompt templates (markdown with role headers)
+if re.search(r'#+\s*(System|Role|You are|Instructions)', content, re.IGNORECASE):
+    title_m = re.search(r'^#\s+(.+)$', content, re.MULTILINE)
+    title = title_m.group(1) if title_m else src.stem
+    patterns.append(("prompt-template", title[:80], content[:200].replace('\n',' '), content[:3000]))
+
+# 4. Bash function declarations with a comment header
+for m in re.finditer(r'#\s*(.{20,200})\n([a-z_]+)\(\)\s*\{', content):
+    desc, name = m.group(1).strip(), m.group(2)
+    if name in ("main","init","cleanup"): continue
+    patterns.append(("bash-fn", name, desc, m.group(0)[:1500]))
+
+# Pick the top candidate per file (avoid noise)
+if not patterns:
+    Path(stamp).touch()
+    sys.exit(0)
+ptype, name, summary, snippet = patterns[0]
+
+# Slugify + categorize
+slug = re.sub(r'[^a-z0-9-]+', '-', name.lower()).strip('-')[:50]
+category_map = {
+    "python-fn": "code-python",
+    "tool-schema": "agent-tools",
+    "prompt-template": "prompts",
+    "bash-fn": "ops-shell",
+}
+cat = category_map.get(ptype, "misc")
+skill_dir = Path(skills_dir) / cat / slug
+skill_dir.mkdir(parents=True, exist_ok=True)
+skill_file = skill_dir / "SKILL.md"
+
+# Don't overwrite existing skills with the same slug — append a number
+if skill_file.exists():
+    n = 2
+    while (skill_dir.parent / f"{slug}-{n}").exists(): n += 1
+    skill_dir = skill_dir.parent / f"{slug}-{n}"
+    skill_dir.mkdir(parents=True, exist_ok=True)
+    skill_file = skill_dir / "SKILL.md"
+
+frontmatter = f"""---
+name: {name}
+type: {ptype}
+category: {cat}
+source: {src.name}
+synthesized_at: {time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime())}
+---
+
+# {name}
+
+**Source:** `{src}`
+
+## What it does
+{summary[:300]}
+
+## Pattern
+```
+{snippet}
+```
+
+## Invocation
+[How Surrogate would use this skill — auto-generate via LLM next pass]
+"""
+skill_file.write_text(frontmatter)
+
+# Push as training pair
+pair = {
+    "ts": time.time(),
+    "source": "skill-synthesis",
+    "skill_path": str(skill_file),
+    "category": cat,
+    "prompt": f"You have learned a new skill of type '{ptype}' named '{name}'. Use it when relevant.\n\nPattern:\n{snippet[:2000]}",
+    "response": summary,
+}
+with open(pairs_log, "a") as f:
+    f.write(json.dumps(pair, ensure_ascii=False) + "\n")
+
+Path(stamp).touch()
+print(f"  ✨ skill: {cat}/{skill_dir.name} from {src.name}")
+PYEOF
+    done
+  done
+
+  # Stats
+  SKILL_COUNT=$(find "$SKILLS_DIR" -name SKILL.md 2>/dev/null | wc -l | tr -d ' ')
+  echo "[$(date +%H:%M:%S)] cycle done · total skills=$SKILL_COUNT" >> "$LOG"
+  sleep 180   # 3 min between cycles
+done
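To preview what the first detector will harvest from a repo, the same docstring regex can be exercised against a toy buffer; everything below except the regex itself is a made-up sample:

```python
import re

# Detector 1 from the daemon: named function + docstring of 40-500 chars.
DOCSTRING_RE = r'def (\w+)\([^)]*\)[^:]*:\s*\n\s*"""([^"]{40,500})"""'

sample = '''
def retry_with_backoff(fn, tries=3):
    """Retry a callable with exponential backoff, re-raising the last
    error once all attempts are exhausted."""
    return fn()

def test_retry():
    """Too short."""
    pass
'''

for m in re.finditer(DOCSTRING_RE, sample):
    print(m.group(1), "->", m.group(2).strip()[:60])
# Prints only retry_with_backoff: the second docstring is under the
# 40-char floor, and test_* names are filtered out by the daemon anyway.
```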
bin/surrogate-orchestrate.sh CHANGED
@@ -278,7 +278,7 @@ PYEOF
 fi
 }
 
-# ── Stage 1: SOLUTION ARCHITECT ──
+# ── Stage 1: SOLUTION ARCHITECT (must run first — blocks everything) ──
 SA_OUT="$WORKDIR/1-sa-design.md"
 echo "${MA}${B}═══ Stage 1/6: SOLUTION ARCHITECT${R} ${D}— DDD + design patterns${R}"
 call_agent "solution-architect" "
@@ -293,16 +293,19 @@ Cover (each as a heading):
 6. **Non-functional impacts** — perf, security, scale, observability
 7. **Risks + mitigations**
 
-Be concrete. Use the codebase if useful (read/grep tools available). No platitudes.
+Be concrete. No platitudes.
 
 Task: $TASK
 " "$SA_OUT"
 
-# ── Stage 2: ARCHITECT ──
+# ── Stages 2 + 3 in PARALLEL — both depend only on SA, independent of each other ──
 ARCH_OUT="$WORKDIR/2-architect-plan.md"
+TDD_OUT="$WORKDIR/3-qa-tdd-tests.md"
 echo ""
-echo "${MA}${B}═══ Stage 2/6: ARCHITECT${R} ${D}— file-level plan${R}"
-call_agent "architect" "
+echo "${MA}${B}═══ Stages 2+3 (parallel): ARCHITECT │ QA-TDD${R}"
+
+(
+call_agent "architect" "
 You are the Tech Architect. Take the SA design (at $SA_OUT) and produce a CONCRETE file-level execution plan.
 
 Required headings:
@@ -313,31 +316,20 @@ Required headings:
 5. **Migration plan** — schema/config rollouts
 6. **Rollback** — how to undo on prod failure
 
-Read 3–5 similar files first (read/grep) to follow existing patterns.
-
 Task: $TASK
 " "$ARCH_OUT"
+) &
+PID_ARCH=$!
 
-if [[ "$MODE" == "plan" ]]; then
-  echo ""
-  echo "${B}▸ Plan-only mode — stopping after architect${R}"
-  [[ -f "$ARCH_OUT" ]] && cat "$ARCH_OUT"
-  exit 0
-fi
-
-# ── Stage 3: QA-FIRST (TDD tests) ──
-TDD_OUT="$WORKDIR/3-qa-tdd-tests.md"
-echo ""
-echo "${MA}${B}═══ Stage 3/6: QA-FIRST (TDD)${R} ${D}— failing tests first${R}"
-call_agent "qa" "
+(
+call_agent "qa" "
 You are the QA Engineer practicing TDD. Output FAILING test code BEFORE the dev writes any implementation.
 
 Inputs:
-- SA design: $SA_OUT
-- Architect plan: $ARCH_OUT
+- SA design: $SA_OUT (read it for design context)
 
 Required output:
-1. List of test file paths (use the architect's listed paths)
+1. List of test file paths
 2. Full test code for each file as fenced code blocks (\`\`\`python / \`\`\`typescript / etc.)
 3. Each test: one assertion, factory functions for fixtures, descriptive name
 4. Cover: happy path, edge cases, error paths, security boundaries
@@ -347,6 +339,18 @@ NO implementation code — only tests.
 
 Task: $TASK
 " "$TDD_OUT"
+) &
+PID_QA=$!
+
+wait $PID_ARCH $PID_QA
+echo "${D} parallel stages 2+3 complete${R}"
+
+if [[ "$MODE" == "plan" ]]; then
+  echo ""
+  echo "${B}▸ Plan-only mode — stopping after architect${R}"
+  [[ -f "$ARCH_OUT" ]] && cat "$ARCH_OUT"
+  exit 0
+fi
 
 # ── Stage 4: DEV ──
 DEV_OUT="$WORKDIR/4-dev-summary.md"
@@ -412,11 +416,23 @@ print(f" total {written} files written")
 PYEOF
 fi
 
-# ── Stage 5: QA-VERIFY ──
+# ── Stages 5 + 6a in PARALLEL — both depend on dev, independent of each other ──
 QA_OUT="$WORKDIR/5-qa-verify.md"
+OPS_OUT="$WORKDIR/6a-ops-checklist.md"
+NEED_OPS=0
+if echo "$TASK" | /usr/bin/grep -iqE "deploy|docker|helm|k8s|terraform|cicd|ci/cd|cloudformation|buildspec|ecs|lambda"; then
+  NEED_OPS=1
+fi
+
 echo ""
-echo "${MA}${B}═══ Stage 5/6: QA-VERIFY${R} ${D}— green tests + coverage${R}"
-call_agent "qa" "
+if [[ $NEED_OPS -eq 1 ]]; then
+  echo "${MA}${B}═══ Stages 5+6a (parallel): QA-VERIFY │ OPS${R}"
+else
+  echo "${MA}${B}═══ Stage 5/6: QA-VERIFY${R}"
+fi
+
+(
+call_agent "qa" "
 You are QA in verification phase. Verify the dev's claim that tests pass.
 
 Inputs:
@@ -431,13 +447,12 @@ Output:
 
 Task: $TASK
 " "$QA_OUT"
+) &
+PID_QA2=$!
 
-# ── Stage 6a: OPS (conditional) ──
-if echo "$TASK" | /usr/bin/grep -iqE "deploy|docker|helm|k8s|terraform|cicd|ci/cd|cloudformation|buildspec|ecs|lambda"; then
-OPS_OUT="$WORKDIR/6a-ops-checklist.md"
-echo ""
-echo "${MA}${B}═══ Stage 6a/6: OPS${R} ${D}— deploy + infra${R}"
-call_agent "ops" "
+if [[ $NEED_OPS -eq 1 ]]; then
+(
+call_agent "ops" "
 Review infrastructure aspects of this task.
 - Dockerfile / helm / terraform / cloudformation validity
 - Secrets / env var handling
@@ -448,10 +463,14 @@ Review infrastructure aspects of this task.
 Inputs: $DEV_OUT
 Task: $TASK
 " "$OPS_OUT"
+) &
+PID_OPS=$!
+wait $PID_QA2 $PID_OPS
 else
-echo ""
+wait $PID_QA2
 echo "${GY}═══ Stage 6a/6: OPS — skipped (not infra task)${R}"
 fi
+echo "${D} parallel stages 5+6a complete${R}"
 
 # ── Stage 6: REVIEWER ──
 REVIEW_OUT="$WORKDIR/6-review-verdict.md"
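The dependency graph this choreography encodes is: stage 1, then stages 2 and 3 together, then 4, then 5 and 6a together, then 6. A purely illustrative Python sketch of the same ordering (the real script forks subshells around call_agent):

```python
from concurrent.futures import ThreadPoolExecutor

def run(stage: str) -> str:
    # Stand-in for call_agent; each real stage writes a markdown artifact.
    print(f"running {stage}")
    return stage

with ThreadPoolExecutor(max_workers=2) as pool:
    run("1-solution-architect")                 # blocks everything below
    arch = pool.submit(run, "2-architect")      # ( ... ) &  PID_ARCH=$!
    tdd = pool.submit(run, "3-qa-tdd")          # ( ... ) &  PID_QA=$!
    arch.result(); tdd.result()                 # wait $PID_ARCH $PID_QA
    run("4-dev")
    qa = pool.submit(run, "5-qa-verify")
    ops = pool.submit(run, "6a-ops")            # skipped unless infra task
    qa.result(); ops.result()                   # wait $PID_QA2 $PID_OPS
    run("6-reviewer")
```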
start.sh CHANGED
@@ -144,32 +144,35 @@ if [[ -n "${DISCORD_BOT_TOKEN:-}" ]]; then
 echo "[$(date +%H:%M:%S)] discord bot started"
 fi
 
-# ── 7a. Continuous scrape daemon (no idle gaps — runs back-to-back batches) ─
+# ── 7a. Continuous scrape daemon (parallel 8 workers, 5–30s cool-down) ──────
 cat > /tmp/scrape-daemon.sh <<'SCRAPESH'
 #!/bin/bash
-# Runs scrape batches continuously. Cool-down between cycles only to respect rate limits.
+# 8 concurrent scrape workers, near-zero idle time.
 set -a; source ~/.hermes/.env 2>/dev/null; set +a
 LOG="${HOME}/.claude/logs/scrape-continuous.log"
 mkdir -p "$(dirname "$LOG")"
 while true; do
 START=$(date +%s)
-# Adaptive cool-down: short if last batch was small, long if hit rate limits
-bash ~/.claude/bin/domain-scrape-loop.sh 800 4 >> "$LOG" 2>&1
+bash ~/.claude/bin/domain-scrape-loop.sh 1500 8 >> "$LOG" 2>&1
 DUR=$(( $(date +%s) - START ))
-# If batch took < 60s the queue was empty / rate-limited → cool down 90s
-# If batch took > 5min it was productive → only 30s cool-down
-if [[ $DUR -lt 60 ]]; then
-sleep 90
-elif [[ $DUR -lt 300 ]]; then
-sleep 60
-else
-sleep 30
+# Tight cool-downs — rate limits, not bandwidth, are the constraint in the cloud
+if [[ $DUR -lt 30 ]]; then sleep 30   # queue likely exhausted, give it time
+elif [[ $DUR -lt 120 ]]; then sleep 15
+else sleep 5
 fi
 done
 SCRAPESH
 chmod +x /tmp/scrape-daemon.sh
 nohup /tmp/scrape-daemon.sh > "$LOG_DIR/scrape-daemon.log" 2>&1 &
-echo "[$(date +%H:%M:%S)] continuous scrape daemon started" >> "$LOG_DIR/boot.log"
+echo "[$(date +%H:%M:%S)] continuous scrape daemon (parallel=8) started" >> "$LOG_DIR/boot.log"
+
+# ── 7b. Agentic crawler (URL frontier + visited stamps + link discovery) ────
+nohup bash ~/.claude/bin/agentic-crawler.sh 6 > "$LOG_DIR/agentic-crawler.log" 2>&1 &
+echo "[$(date +%H:%M:%S)] agentic crawler started (parallel=6)" >> "$LOG_DIR/boot.log"
+
+# ── 7c. Skill-synthesis daemon (extract patterns from cloned repos → skills) ─
+nohup bash ~/.claude/bin/skill-synthesis-daemon.sh > "$LOG_DIR/skill-synthesis.log" 2>&1 &
+echo "[$(date +%H:%M:%S)] skill-synthesis daemon started" >> "$LOG_DIR/boot.log"
 
 # ── 7b. Cron loop — non-scrape daemons (scrape now runs continuously above) ─
 cat > /tmp/hermes-cron.sh <<'CRONSH'
@@ -183,8 +186,8 @@ while true; do
 [[ $((M % 2)) -eq 0 ]] && bash ~/.claude/bin/surrogate-dev-loop.sh 1 >> "$LOG" 2>&1 &
 # Every 5 min: producer pushes priorities to Redis
 [[ $((M % 5)) -eq 0 ]] && bash ~/.claude/bin/work-queue-producer.sh >> "$LOG" 2>&1 &
-# Every 10 min: training-pair push to HF (drains ~/.surrogate/training-pairs.jsonl)
-[[ $((M % 10)) -eq 0 ]] && bash ~/.claude/bin/push-training-to-hf.sh >> "$LOG" 2>&1 &
+# Every 3 min: training-pair push to HF (drains ~/.surrogate/training-pairs.jsonl)
+[[ $((M % 3)) -eq 0 ]] && bash ~/.claude/bin/push-training-to-hf.sh >> "$LOG" 2>&1 &
 # Every 20 min: full orchestrate chain (architect → dev → qa → reviewer + git push)
 [[ $((M % 20)) -eq 0 ]] && bash ~/.claude/bin/auto-orchestrate-loop.sh >> "$LOG" 2>&1 &
 # Every 30 min: research-apply (pop queue → orchestrate → ship feature)
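With the training push now on a 3-minute gate, more minutes fire several jobs at once (minute 0 fires all of them). A quick way to see the stacking, using the same modulo gates as the cron loop above:

```python
# M % N gates copied from /tmp/hermes-cron.sh; research-apply per its comment.
gates = {
    "surrogate-dev-loop": 2,
    "work-queue-producer": 5,
    "push-training-to-hf": 3,
    "auto-orchestrate-loop": 20,
    "research-apply": 30,
}

for minute in range(60):
    due = [job for job, n in gates.items() if minute % n == 0]
    if len(due) >= 3:
        print(f"m={minute:02d}: {', '.join(due)}")
# Prints m=00 (all five), m=20, m=30, m=40 as the crowded minutes.
```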