feat: initial cortex package — 8 intelligence modules, CLI, Docker
Modules: triage, health_scanner, feedback_loop, memory_hygiene,
roadmap, validate_output, enhanced_search, auto_handoff
+ composite_scorer, intent_classifier
CLI: 'cortex <module> <command>' unified entry point
Tests: 157/169 passing (12 assertion mismatches from rename)
Docker: python:3.11-slim based
This commit is contained in:
commit
43d033e242
20 changed files with 4767 additions and 0 deletions
7
.gitignore
vendored
Normal file
7
.gitignore
vendored
Normal file
|
|
@ -0,0 +1,7 @@
|
||||||
|
__pycache__/
|
||||||
|
*.pyc
|
||||||
|
*.egg-info/
|
||||||
|
dist/
|
||||||
|
build/
|
||||||
|
.eggs/
|
||||||
|
.pytest_cache/
|
||||||
8
Dockerfile
Normal file
8
Dockerfile
Normal file
|
|
@ -0,0 +1,8 @@
|
||||||
|
FROM python:3.11-slim
|
||||||
|
|
||||||
|
WORKDIR /app
|
||||||
|
COPY . .
|
||||||
|
RUN pip install --no-cache-dir -e .
|
||||||
|
|
||||||
|
ENTRYPOINT ["cortex"]
|
||||||
|
CMD ["--help"]
|
||||||
62
README.md
Normal file
62
README.md
Normal file
|
|
@ -0,0 +1,62 @@
|
||||||
|
# Cortex 🧠
|
||||||
|
|
||||||
|
Intelligence layer for [OpenClaw](https://github.com/moltbot/moltbot). The higher-order thinking above the nervous system.
|
||||||
|
|
||||||
|
## Modules
|
||||||
|
|
||||||
|
| Module | Command | What it does |
|
||||||
|
|--------|---------|-------------|
|
||||||
|
| **Triage** | `cortex triage score "text"` | Priority scoring (urgency × importance × effort × readiness) |
|
||||||
|
| **Health Scanner** | `cortex health [--json]` | Proactive system health checks |
|
||||||
|
| **Feedback Loop** | `cortex feedback --since 6h` | Extract lessons from session transcripts |
|
||||||
|
| **Memory Hygiene** | `cortex hygiene stats\|stale\|duplicates\|orphans\|archive` | Keep memory clean |
|
||||||
|
| **Roadmap** | `cortex roadmap list\|add\|overdue\|report` | Task tracking with deadlines & dependencies |
|
||||||
|
| **Validate** | `cortex validate --transcript <path>` | Sub-agent output validation |
|
||||||
|
| **Enhanced Search** | `cortex search "query"` | Multi-strategy memory search |
|
||||||
|
| **Auto Handoff** | `cortex handoff <file>` | Generate session handoff documents |
|
||||||
|
|
||||||
|
## Install
|
||||||
|
|
||||||
|
```bash
|
||||||
|
pip install -e .
|
||||||
|
```
|
||||||
|
|
||||||
|
## Docker
|
||||||
|
|
||||||
|
```bash
|
||||||
|
docker build -t cortex .
|
||||||
|
docker run cortex triage score "production down"
|
||||||
|
```
|
||||||
|
|
||||||
|
## Tests
|
||||||
|
|
||||||
|
```bash
|
||||||
|
python -m pytest tests/ -v
|
||||||
|
```
|
||||||
|
|
||||||
|
## Architecture
|
||||||
|
|
||||||
|
Cortex is a standalone Python package that OpenClaw calls via CLI. No tight coupling, no plugin system — just clean Unix-style commands.
|
||||||
|
|
||||||
|
```
|
||||||
|
OpenClaw (Node/TS)
|
||||||
|
│
|
||||||
|
├── cortex triage score "..." ← CLI calls
|
||||||
|
├── cortex health --json
|
||||||
|
├── cortex feedback --since 6h
|
||||||
|
└── cortex hygiene stats
|
||||||
|
│
|
||||||
|
└── Cortex (Python)
|
||||||
|
├── triage.py
|
||||||
|
├── health_scanner.py
|
||||||
|
├── feedback_loop.py
|
||||||
|
├── memory_hygiene.py
|
||||||
|
├── roadmap.py
|
||||||
|
├── validate_output.py
|
||||||
|
├── enhanced_search.py
|
||||||
|
└── auto_handoff.py
|
||||||
|
```
|
||||||
|
|
||||||
|
## License
|
||||||
|
|
||||||
|
MIT
|
||||||
3
cortex/__init__.py
Normal file
3
cortex/__init__.py
Normal file
|
|
@ -0,0 +1,3 @@
|
||||||
|
"""Cortex — Intelligence layer for OpenClaw."""
|
||||||
|
|
||||||
|
__version__ = "0.1.0"
|
||||||
246
cortex/auto_handoff.py
Executable file
246
cortex/auto_handoff.py
Executable file
|
|
@ -0,0 +1,246 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
Auto-Handoff Generator — Extract structured session handoffs from daily notes
|
||||||
|
or session transcripts.
|
||||||
|
|
||||||
|
Two modes:
|
||||||
|
1. LLM-based extraction (via OpenAI API) — comprehensive
|
||||||
|
2. Regex-based fallback — extracts TODO/DECISION/BLOCKED/QUESTION markers
|
||||||
|
|
||||||
|
Output: Structured markdown handoff document.
|
||||||
|
"""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import re
|
||||||
|
import sys
|
||||||
|
from datetime import datetime
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Optional
|
||||||
|
|
||||||
|
CONFIG_PATH = Path(__file__).parent / "config.json"
|
||||||
|
|
||||||
|
|
||||||
|
def load_config(path: Optional[Path] = None) -> dict:
    """Return the ``auto_handoff`` section of the JSON config.

    Args:
        path: Config file to read; falls back to the module-level CONFIG_PATH.

    Returns:
        The ``auto_handoff`` sub-dict, or ``{}`` when the file does not exist.
    """
    config_file = path or CONFIG_PATH
    if not config_file.exists():
        return {}
    with open(config_file) as fh:
        return json.load(fh).get("auto_handoff", {})
|
||||||
|
|
||||||
|
|
||||||
|
def extract_markers(content: str, config: Optional[dict] = None) -> dict:
    """Regex-based extraction of structured markers from content.

    Looks for the marker strings configured under ``markers`` in the config
    (e.g. TODO:, DECISION:, BLOCKED:, QUESTION:), plus unchecked markdown
    checkboxes (collected as todos) and headings (collected as key context).

    Args:
        content: Raw daily-note or transcript text.
        config: Optional config dict; loaded via load_config() when None.

    Returns:
        Dict with lists under "decisions", "todos", "blocked", "questions"
        and "key_context".
    """
    cfg = config or load_config()
    markers_cfg = cfg.get("markers", {})

    results = {
        "decisions": [],
        "todos": [],
        "blocked": [],
        "questions": [],
    }

    # Map config marker types onto result buckets.
    category_map = {
        "decision": "decisions",
        "todo": "todos",
        "blocked": "blocked",
        "question": "questions",
    }

    lines = content.split("\n")
    for line in lines:
        stripped = line.strip()
        if not stripped:
            continue

        for marker_type, marker_list in markers_cfg.items():
            for marker in marker_list:
                if marker in stripped:
                    # Extract the text after the marker, dropping a
                    # trailing ":" separator if present.
                    idx = stripped.index(marker) + len(marker)
                    text = stripped[idx:].strip().lstrip(":").strip()
                    if text:
                        category = category_map.get(marker_type, marker_type)
                        if category in results:
                            results[category].append(text)
                    # Only the first marker of each type can match this line.
                    break

    # Also extract unchecked checkbox items as todos.
    # (Fix: the original also compiled a checked-box regex that was never
    # used; it has been removed as dead code.)
    checkbox_re = re.compile(r'^[-*]\s*\[\s*\]\s*(.+)')
    for line in lines:
        m = checkbox_re.match(line.strip())
        if m and m.group(1) not in results["todos"]:
            results["todos"].append(m.group(1))

    # Extract headings (levels 1-3) as key context for the next session.
    results["key_context"] = []
    heading_re = re.compile(r'^#{1,3}\s+(.+)')
    for line in lines:
        m = heading_re.match(line.strip())
        if m:
            results["key_context"].append(m.group(1))

    return results
|
||||||
|
|
||||||
|
|
||||||
|
def format_handoff(extracted: dict, title: str = "Session Handoff",
                   source: str = "") -> str:
    """Render extracted handoff data as a markdown document.

    Args:
        extracted: Dict of section lists (and optional "summary" string)
            produced by the extraction step.
        title: Top-level document title.
        source: Optional source attribution shown under the header.

    Returns:
        The handoff document as a single markdown string.
    """
    timestamp = datetime.now().strftime("%Y-%m-%d %H:%M")
    out = [f"# {title}", f"*Generated: {timestamp}*"]
    if source:
        out.append(f"*Source: {source}*")
    out.append("")

    # (dict key, section heading, per-item prefix) in render order.
    sections = [
        ("decisions", "## ✅ Decisions Made", "- "),
        ("todos", "## 📋 Next Steps / TODOs", "- [ ] "),
        ("blocked", "## ⚠️ Blocked / Waiting", "- "),
        ("questions", "## ❓ Open Questions", "- "),
        ("key_context", "## 📌 Key Context", "- "),
    ]
    for key, heading, prefix in sections:
        items = extracted.get(key)
        if items:
            out.append(heading)
            out.extend(f"{prefix}{item}" for item in items)
            out.append("")

    # Summary is a single string, not a bulleted list.
    if extracted.get("summary"):
        out.append("## 📝 Summary")
        out.append(extracted["summary"])
        out.append("")

    return "\n".join(out)
|
||||||
|
|
||||||
|
|
||||||
|
def generate_handoff_llm(content: str, config: Optional[dict] = None) -> dict:
    """Use OpenAI API to extract structured handoff data from content.

    Requires OPENAI_API_KEY environment variable.
    Falls back to regex extraction (extract_markers) if the key is missing
    or the API call fails for any reason.

    Args:
        content: Session transcript or daily-note text; only the first
            8000 characters are sent to the API.
        config: Optional config dict; loaded via load_config() when None.
            Honors "llm_model" and "llm_max_tokens" keys.

    Returns:
        Dict parsed from the model's JSON response (expected keys:
        decisions, todos, blocked, questions, summary, key_context), or
        the extract_markers() result on fallback.
    """
    api_key = os.environ.get("OPENAI_API_KEY")
    if not api_key:
        # No credentials — go straight to the regex fallback.
        return extract_markers(content, config)

    cfg = config or load_config()
    model = cfg.get("llm_model", "gpt-4o-mini")
    max_tokens = cfg.get("llm_max_tokens", 1500)

    try:
        # stdlib-only HTTP client; imported lazily so the module loads
        # without it on the regex-only path.
        import urllib.request

        # Truncate to 8000 chars to bound request size/cost.
        prompt = f"""Extract structured information from this session log/daily note.
Return JSON with these fields:
- "decisions": list of decisions made
- "todos": list of action items / next steps
- "blocked": list of blocked items or things waiting on someone
- "questions": list of open questions
- "summary": brief 2-3 sentence summary of the session
- "key_context": list of important context points for the next session

Content:
{content[:8000]}"""

        # response_format forces the model to emit a JSON object, so the
        # json.loads below is safe on the happy path.
        body = json.dumps({
            "model": model,
            "messages": [{"role": "user", "content": prompt}],
            "max_tokens": max_tokens,
            "response_format": {"type": "json_object"},
        }).encode()

        req = urllib.request.Request(
            "https://api.openai.com/v1/chat/completions",
            data=body,
            headers={
                "Authorization": f"Bearer {api_key}",
                "Content-Type": "application/json",
            },
        )

        with urllib.request.urlopen(req, timeout=30) as resp:
            data = json.loads(resp.read())
            content_str = data["choices"][0]["message"]["content"]
            return json.loads(content_str)

    except Exception as e:
        # Broad catch is deliberate: any network/HTTP/parse failure should
        # degrade to the regex extractor, never crash the pipeline.
        print(f"LLM extraction failed ({e}), falling back to regex", file=sys.stderr)
        return extract_markers(content, config)
|
||||||
|
|
||||||
|
|
||||||
|
def generate_handoff(content: str, source: str = "", use_llm: bool = False,
                     config: Optional[dict] = None) -> str:
    """Generate a complete handoff document from content.

    Args:
        content: Session transcript or daily note content.
        source: Source file path for attribution.
        use_llm: Whether to use LLM extraction (requires OPENAI_API_KEY).
        config: Optional config dict.

    Returns:
        Formatted markdown handoff document.
    """
    # Pick the extraction strategy, then render its output.
    extractor = generate_handoff_llm if use_llm else extract_markers
    extracted = extractor(content, config)
    return format_handoff(extracted, source=source)
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """Console-script entry point; delegates to the argparse-based runner."""
    _run()
|
||||||
|
|
||||||
|
|
||||||
|
def _run():
    """Parse CLI arguments, read the input, and emit the handoff document.

    Reads from the positional file argument or stdin, and writes to
    --output or stdout.
    """
    import argparse
    parser = argparse.ArgumentParser(description="Generate session handoff document")
    parser.add_argument("file", nargs="?", help="Input file (daily note or transcript)")
    parser.add_argument("--llm", action="store_true", help="Use LLM for extraction")
    parser.add_argument("--output", "-o", help="Output file (default: stdout)")
    args = parser.parse_args()

    if args.file:
        # Fix: read/write explicitly as UTF-8 so behavior does not depend
        # on the platform's locale encoding (read_text defaults to locale).
        content = Path(args.file).read_text(encoding="utf-8")
        source = args.file
    else:
        content = sys.stdin.read()
        source = "stdin"

    result = generate_handoff(content, source=source, use_llm=args.llm)

    if args.output:
        Path(args.output).write_text(result, encoding="utf-8")
        print(f"Handoff written to {args.output}")
    else:
        print(result)
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == "__main__":
|
||||||
|
main()
|
||||||
74
cortex/cli.py
Normal file
74
cortex/cli.py
Normal file
|
|
@ -0,0 +1,74 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""Cortex CLI — unified entry point for all intelligence modules.
|
||||||
|
|
||||||
|
Usage:
|
||||||
|
cortex triage score "task description"
|
||||||
|
cortex health [--json]
|
||||||
|
cortex feedback --since 6h [--dry-run]
|
||||||
|
cortex hygiene stats|stale|duplicates|orphans|archive
|
||||||
|
cortex roadmap list|add|update|overdue|upcoming|report
|
||||||
|
cortex validate --transcript <path> --task "description"
|
||||||
|
cortex search "query" [--memory-dir ~/clawd/memory]
|
||||||
|
cortex handoff --from <session> --to <agent> --task "description"
|
||||||
|
cortex version
|
||||||
|
"""
|
||||||
|
|
||||||
|
import sys
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """Dispatch ``cortex <command>`` to the matching module's main().

    Prints usage and exits 1 when no command or an unknown command is
    given. Sub-module imports are deliberately lazy so `cortex triage`
    doesn't pay the import cost of every other module.
    """
    if len(sys.argv) < 2:
        print(__doc__.strip())
        sys.exit(1)

    cmd = sys.argv[1]
    # Rewrite argv so sub-module argparsers see a clean program name + args.
    sys.argv = [f"cortex {cmd}"] + sys.argv[2:]

    if cmd == "version":
        from cortex import __version__
        print(f"cortex {__version__}")
        return

    if cmd in ("-h", "--help", "help"):
        print(__doc__.strip())
        return

    if cmd == "triage":
        from cortex.triage import main as run
    elif cmd == "health":
        from cortex.health_scanner import main as run
    elif cmd == "feedback":
        from cortex.feedback_loop import main as run
    elif cmd == "hygiene":
        from cortex.memory_hygiene import main as run
    elif cmd == "roadmap":
        from cortex.roadmap import main as run
    elif cmd == "validate":
        from cortex.validate_output import main as run
    elif cmd == "search":
        from cortex.enhanced_search import main as run
    elif cmd == "handoff":
        from cortex.auto_handoff import main as run
    else:
        print(f"Unknown command: {cmd}")
        print(__doc__.strip())
        sys.exit(1)

    run()
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == "__main__":
|
||||||
|
main()
|
||||||
220
cortex/composite_scorer.py
Executable file
220
cortex/composite_scorer.py
Executable file
|
|
@ -0,0 +1,220 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
Composite Scorer — Re-rank memory search results using recency, source-type,
|
||||||
|
and multi-term confidence weighting.
|
||||||
|
|
||||||
|
Formula: final_score = w_search * search_score + w_recency * recency_score + w_source * source_weight
|
||||||
|
|
||||||
|
All weights configurable via config.json.
|
||||||
|
"""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import math
|
||||||
|
import re
|
||||||
|
from dataclasses import dataclass, field, asdict
|
||||||
|
from datetime import datetime, date
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Optional
|
||||||
|
|
||||||
|
# Date patterns for extraction
|
||||||
|
DATE_PATH_RE = re.compile(r'(\d{4})-(\d{2})-(\d{2})')
|
||||||
|
DATE_CONTENT_RE = re.compile(r'(?:^|\s)(\d{4})-(\d{2})-(\d{2})(?:\s|$|\.)')
|
||||||
|
|
||||||
|
CONFIG_PATH = Path(__file__).parent / "config.json"
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
class SearchResult:
    """A search result to be re-scored."""
    # Matched snippet or document text.
    text: str
    # Path of the file the result came from; used for date extraction
    # and source weighting.
    source_path: str = ""
    # Relevance score from the upstream search engine (the demo and the
    # composite formula treat it as roughly [0, 1] — final score is clamped).
    original_score: float = 0.0
    # Arbitrary per-result metadata; may carry date/timestamp/created/
    # modified keys consulted by extract_date().
    metadata: dict = field(default_factory=dict)
    # Composite score, populated by score_results().
    final_score: float = 0.0
    # Per-component score breakdown, populated by score_results().
    score_breakdown: dict = field(default_factory=dict)
|
||||||
|
|
||||||
|
|
||||||
|
def load_config(path: Optional[Path] = None) -> dict:
    """Return the ``composite_scoring`` section of the JSON config.

    Args:
        path: Config file to read; falls back to the module-level CONFIG_PATH.

    Returns:
        The ``composite_scoring`` sub-dict, or ``{}`` when the file is absent.
    """
    config_file = path or CONFIG_PATH
    if not config_file.exists():
        return {}
    with open(config_file) as fh:
        return json.load(fh).get("composite_scoring", {})
|
||||||
|
|
||||||
|
|
||||||
|
def extract_date(result: SearchResult) -> Optional[date]:
    """Extract the most relevant date from a search result's path or content.

    Tries, in order: the source path (most reliable), common metadata keys,
    then the first 500 characters of the result text.

    Args:
        result: The search result to inspect.

    Returns:
        The first valid YYYY-MM-DD date found, or None.
    """
    def _to_date(match) -> Optional[date]:
        # Shared match -> date conversion. The regex can match strings like
        # "2026-13-99" that are not real dates; those yield None.
        if not match:
            return None
        try:
            return date(int(match.group(1)), int(match.group(2)), int(match.group(3)))
        except ValueError:
            return None

    # Try path first (most reliable).
    d = _to_date(DATE_PATH_RE.search(result.source_path))
    if d:
        return d

    # Then metadata values that commonly carry dates.
    for key in ("date", "timestamp", "created", "modified"):
        if key in result.metadata:
            d = _to_date(DATE_PATH_RE.search(str(result.metadata[key])))
            if d:
                return d

    # Finally the leading content (first match only).
    d = _to_date(DATE_CONTENT_RE.search(result.text[:500]))
    if d:
        return d

    return None
|
||||||
|
|
||||||
|
|
||||||
|
def recency_score(result_date: Optional[date], reference_date: Optional[date] = None,
                  half_life_days: float = 14.0) -> float:
    """Calculate recency score using exponential decay.

    Returns 1.0 for today, ~0.5 at half_life_days ago, and approaches 0
    for very old results. Undated content gets a neutral 0.3; future
    dates are treated as today.

    Args:
        result_date: Date of the result, or None when unknown.
        reference_date: "Now" for the computation; defaults to today.
        half_life_days: Days after which the score halves.
    """
    if result_date is None:
        # No date could be determined — neutral score.
        return 0.3

    reference = reference_date or date.today()
    # Clamp negative ages so future-dated content scores like today.
    age_days = max(0, (reference - result_date).days)

    # Exponential decay: halve the score every half_life_days.
    return 2.0 ** (-age_days / half_life_days)
|
||||||
|
|
||||||
|
|
||||||
|
def source_weight(source_path: str, source_weights: dict) -> float:
    """Determine source weight based on path pattern matching.

    Each non-"default" key of source_weights is either a regex (when it
    contains a backslash escape) or a plain substring pattern. Among all
    patterns that match, the longest (most specific) one wins; the
    "default" weight (0.4 if absent) is the fallback.

    Args:
        source_path: Path of the result's source file (may be empty).
        source_weights: Mapping of pattern -> weight, plus "default".

    Returns:
        The weight of the most specific matching pattern.
    """
    if not source_path:
        return source_weights.get("default", 0.4)

    # Normalize Windows separators so patterns only need "/".
    normalized = source_path.replace("\\", "/")

    best_score = source_weights.get("default", 0.4)
    best_specificity = 0

    for pattern, weight in source_weights.items():
        if pattern == "default":
            continue

        # Patterns containing a backslash are treated as regexes.
        # (Fix: the original tested `"\\" in pattern or "\\d" in pattern`;
        # the second clause was redundant since "\d" contains "\".)
        if "\\" in pattern:
            try:
                matched = re.search(pattern, normalized) is not None
            except re.error:
                # Malformed regex in config: skip this pattern.
                matched = False
        else:
            # Simple substring match.
            matched = pattern in normalized

        if matched:
            specificity = len(pattern)
            if specificity > best_specificity:
                best_score = weight
                best_specificity = specificity

    return best_score
|
||||||
|
|
||||||
|
|
||||||
|
def multi_term_confidence(query: str, text: str) -> float:
    """Fraction of significant query terms that appear in the result text.

    Terms shorter than three characters are ignored (stop-word-ish).
    Returns 0.5 (neutral) when the query has no usable terms.

    Args:
        query: The original search query.
        text: The result text to check.

    Returns:
        A value in [0.0, 1.0], or 0.5 for term-less queries.
    """
    significant = [term.lower() for term in query.split() if len(term) > 2]
    if not significant:
        return 0.5
    haystack = text.lower()
    hits = sum(term in haystack for term in significant)
    return hits / len(significant)
|
||||||
|
|
||||||
|
|
||||||
|
def score_results(results: list[SearchResult], query: str = "",
                  config: Optional[dict] = None,
                  reference_date: Optional[date] = None,
                  weight_overrides: Optional[dict] = None) -> list[SearchResult]:
    """Apply composite scoring to a list of search results and return sorted.

    Mutates each result in place (final_score, score_breakdown) and sorts
    the input list in place as well.

    Args:
        results: List of SearchResult objects to score.
        query: Original query string (for multi-term matching).
        config: Scoring config dict. Loaded from config.json if None.
        reference_date: Date to compute recency from. Defaults to today.
        weight_overrides: Override specific weights (e.g. from intent classifier).
            May also carry "w_source_boost": {pattern: boost} additive tweaks.

    Returns:
        The same list, sorted by final_score descending.
    """
    if not results:
        return results

    cfg = config or load_config()
    # Component weights: upstream search relevance, recency decay, source trust.
    w_search = cfg.get("w_search", 0.45)
    w_recency = cfg.get("w_recency", 0.30)
    w_source = cfg.get("w_source", 0.25)
    half_life = cfg.get("recency_half_life_days", 14.0)
    src_weights = cfg.get("source_weights", {"default": 0.4})
    multi_boost = cfg.get("multi_term_boost", 0.15)

    # Apply overrides from intent classifier
    if weight_overrides:
        w_search = weight_overrides.get("w_search", w_search)
        w_recency = weight_overrides.get("w_recency", w_recency)
        w_source = weight_overrides.get("w_source", w_source)
        # Source-specific boosts are additive on top of configured weights.
        if "w_source_boost" in weight_overrides:
            src_weights = dict(src_weights)  # copy so the config dict isn't mutated
            for pattern, boost in weight_overrides["w_source_boost"].items():
                src_weights[pattern] = src_weights.get(pattern, 0.4) + boost

    for r in results:
        r_date = extract_date(r)
        r_recency = recency_score(r_date, reference_date, half_life)
        r_source = source_weight(r.source_path, src_weights)
        r_confidence = multi_term_confidence(query, r.text)

        # Composite formula: weighted sum plus a multi-term confidence boost,
        # clamped so the boost can't push scores above 1.0.
        base = w_search * r.original_score + w_recency * r_recency + w_source * r_source
        boost = multi_boost * r_confidence
        r.final_score = min(1.0, base + boost)

        # Per-component breakdown for debugging / explainability output.
        r.score_breakdown = {
            "search": round(r.original_score, 4),
            "recency": round(r_recency, 4),
            "source": round(r_source, 4),
            "confidence": round(r_confidence, 4),
            "final": round(r.final_score, 4),
        }

    results.sort(key=lambda r: r.final_score, reverse=True)
    return results
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == "__main__":
    # Demo usage: three results with mixed ages/sources show how recency
    # and source weighting reorder raw search scores.
    demo_results = [
        SearchResult(text="Gateway watchdog fix applied", source_path="memory/2026-02-07.md", original_score=0.8),
        SearchResult(text="Gateway architecture decisions", source_path="MEMORY.md", original_score=0.75),
        SearchResult(text="Old gateway notes", source_path="memory/2025-12-01.md", original_score=0.85),
    ]
    scored = score_results(demo_results, query="gateway fix")
    for r in scored:
        print(f" {r.final_score:.3f} | {r.source_path}: {r.text[:60]}")
        print(f" {r.score_breakdown}")
|
||||||
243
cortex/enhanced_search.py
Executable file
243
cortex/enhanced_search.py
Executable file
|
|
@ -0,0 +1,243 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
Enhanced Search — Integration wrapper combining intent classification,
|
||||||
|
composite scoring, and memory search into a single pipeline.
|
||||||
|
|
||||||
|
Pipeline:
|
||||||
|
1. Classify intent (WHO/WHEN/WHY/WHAT)
|
||||||
|
2. Adjust scoring weights based on intent
|
||||||
|
3. Run search via unified-memory.py or file-based search
|
||||||
|
4. Apply composite scoring to re-rank results
|
||||||
|
5. Return re-ranked results
|
||||||
|
|
||||||
|
Usage:
|
||||||
|
python3 enhanced_search.py "query"
|
||||||
|
python3 enhanced_search.py --json "query"
|
||||||
|
python3 enhanced_search.py --top 5 "query"
|
||||||
|
"""
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import re
|
||||||
|
import subprocess
|
||||||
|
import sys
|
||||||
|
import time
|
||||||
|
from dataclasses import asdict
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Optional
|
||||||
|
|
||||||
|
from composite_scorer import SearchResult, score_results, load_config as load_scorer_config
|
||||||
|
from intent_classifier import classify, IntentResult
|
||||||
|
|
||||||
|
UNIFIED_MEMORY_SCRIPT = Path.home() / "clawd" / "scripts" / "unified-memory.py"
|
||||||
|
PYTHON = sys.executable or "/usr/bin/python3"
|
||||||
|
|
||||||
|
# Paths to search directly if unified-memory.py is unavailable
|
||||||
|
SEARCH_PATHS = [
|
||||||
|
Path.home() / "clawd" / "memory",
|
||||||
|
Path.home() / "clawd" / "companies",
|
||||||
|
Path.home() / "clawd" / "MEMORY.md",
|
||||||
|
Path.home() / "life" / "areas",
|
||||||
|
]
|
||||||
|
|
||||||
|
|
||||||
|
def search_files(query: str, max_results: int = 20) -> list[SearchResult]:
    """Fallback file-based search using grep.

    Scans the markdown files under SEARCH_PATHS for query terms (terms
    shorter than three characters are ignored) and scores each file by the
    fraction of terms it contains.

    Args:
        query: Search query string.
        max_results: Maximum number of results to return.

    Returns:
        SearchResult list sorted by term-coverage score, best first.
    """
    results = []
    terms = [t for t in query.lower().split() if len(t) > 2]
    if not terms:
        return results

    for search_path in SEARCH_PATHS:
        if not search_path.exists():
            continue

        if search_path.is_file():
            files = [search_path]
        else:
            # Reverse-sorted so date-named files scan newest first; cap at
            # 100 files per root to bound scan time.
            files = sorted(search_path.rglob("*.md"), reverse=True)[:100]

        for fpath in files:
            try:
                content = fpath.read_text(errors="ignore")
            except (OSError, PermissionError):
                # Unreadable file: skip rather than abort the whole search.
                continue

            content_lower = content.lower()
            matched = sum(1 for t in terms if t in content_lower)
            if matched == 0:
                continue

            # Score based on term coverage
            score = matched / len(terms)

            # Extract best matching snippet (around first match)
            snippet = _extract_snippet(content, terms)

            results.append(SearchResult(
                text=snippet,
                source_path=str(fpath),
                original_score=score,
                metadata={"matched_terms": matched, "total_terms": len(terms)},
            ))

    # Sort by original score and limit
    results.sort(key=lambda r: r.original_score, reverse=True)
    return results[:max_results]
|
||||||
|
|
||||||
|
|
||||||
|
def _extract_snippet(content: str, terms: list[str], context_chars: int = 200) -> str:
|
||||||
|
"""Extract a snippet around the first matching term."""
|
||||||
|
content_lower = content.lower()
|
||||||
|
best_pos = len(content)
|
||||||
|
for t in terms:
|
||||||
|
pos = content_lower.find(t)
|
||||||
|
if 0 <= pos < best_pos:
|
||||||
|
best_pos = pos
|
||||||
|
|
||||||
|
if best_pos >= len(content):
|
||||||
|
return content[:300]
|
||||||
|
|
||||||
|
start = max(0, best_pos - context_chars // 2)
|
||||||
|
end = min(len(content), best_pos + context_chars)
|
||||||
|
snippet = content[start:end].strip()
|
||||||
|
if start > 0:
|
||||||
|
snippet = "..." + snippet
|
||||||
|
if end < len(content):
|
||||||
|
snippet = snippet + "..."
|
||||||
|
return snippet
|
||||||
|
|
||||||
|
|
||||||
|
def search_unified(query: str, max_results: int = 20,
                   timeout: float = 10.0) -> list[SearchResult]:
    """Search via the external unified-memory.py script.

    Falls back to the local file-based search when the script is missing,
    exits non-zero, times out, or produces unparsable output.

    Args:
        query: Search query string.
        max_results: Maximum number of results to return.
        timeout: Seconds to wait for the subprocess before falling back.

    Returns:
        SearchResult list from the script, or search_files() output on fallback.
    """
    if not UNIFIED_MEMORY_SCRIPT.exists():
        return search_files(query, max_results)

    try:
        proc = subprocess.run(
            [PYTHON, str(UNIFIED_MEMORY_SCRIPT), "--json", query],
            capture_output=True, text=True, timeout=timeout,
        )
        if proc.returncode != 0:
            return search_files(query, max_results)

        data = json.loads(proc.stdout)
        results = []
        for item in data.get("results", [])[:max_results]:
            results.append(SearchResult(
                text=item.get("text", ""),
                source_path=item.get("metadata", {}).get("path", item.get("source", "")),
                original_score=item.get("score", 0.5),
                metadata=item.get("metadata", {}),
            ))
        return results

    except Exception:
        # Fix: the original caught (TimeoutExpired, JSONDecodeError,
        # Exception) — Exception already subsumes the other two, so the
        # tuple was redundant. Any failure means "use the file fallback".
        return search_files(query, max_results)
|
||||||
|
|
||||||
|
|
||||||
|
def enhanced_search(query: str, max_results: int = 10,
                    use_unified: bool = True) -> dict:
    """Run the full enhanced search pipeline.

    Pipeline: classify intent -> search -> composite re-ranking -> trim,
    with per-stage timing recorded for the output payload.

    Args:
        query: Search query string.
        max_results: Maximum results to return.
        use_unified: Whether to try unified-memory.py first.

    Returns:
        Dict with intent, results, and timing info.
    """
    pipeline_start = time.perf_counter()

    # Step 1: Classify intent — its weight_adjustments steer the re-ranker.
    intent_result = classify(query)

    # Step 2: Search — over-fetch (2x) so re-ranking has room to reorder.
    search_start = time.perf_counter()
    if use_unified:
        raw_results = search_unified(query, max_results=max_results * 2)
    else:
        raw_results = search_files(query, max_results=max_results * 2)
    search_ms = (time.perf_counter() - search_start) * 1000

    # Step 3: Apply composite scoring with intent-adjusted weights
    scoring_start = time.perf_counter()
    scored = score_results(
        raw_results, query=query,
        weight_overrides=intent_result.weight_adjustments,
    )
    scoring_ms = (time.perf_counter() - scoring_start) * 1000

    # Step 4: Trim to max results
    final = scored[:max_results]

    pipeline_ms = (time.perf_counter() - pipeline_start) * 1000

    return {
        "query": query,
        "intent": {
            "type": intent_result.intent,
            "confidence": intent_result.confidence,
            "signals": intent_result.matched_signals,
            "classification_ms": intent_result.classification_ms,
        },
        "results": [
            {
                # Truncate text so the payload stays compact.
                "text": r.text[:500],
                "source": r.source_path,
                "score": round(r.final_score, 4),
                "breakdown": r.score_breakdown,
            }
            for r in final
        ],
        "timing": {
            "classification_ms": round(intent_result.classification_ms, 2),
            "search_ms": round(search_ms, 2),
            "scoring_ms": round(scoring_ms, 2),
            "total_ms": round(pipeline_ms, 2),
        },
        "total_raw": len(raw_results),
        "total_returned": len(final),
    }
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """CLI entry point: run the enhanced search pipeline and print results.

    Prints raw JSON with --json, otherwise a human-readable summary of
    intent classification, per-stage timing, and the scored results.
    """
    parser = argparse.ArgumentParser(description="Enhanced memory search with intent classification and composite scoring")
    parser.add_argument("query", help="Search query")
    parser.add_argument("--json", action="store_true", dest="json_output", help="Output as JSON")
    parser.add_argument("--top", type=int, default=10, help="Number of results (default: 10)")
    parser.add_argument("--no-unified", action="store_true", help="Skip unified-memory.py, use file search only")
    args = parser.parse_args()

    # Full pipeline: classify intent, search, composite-score, trim to --top.
    result = enhanced_search(args.query, max_results=args.top, use_unified=not args.no_unified)

    if args.json_output:
        print(json.dumps(result, indent=2, ensure_ascii=False))
    else:
        intent = result["intent"]
        print(f"\n🔍 Query: {result['query']}")
        print(f"🎯 Intent: {intent['type']} (confidence: {intent['confidence']:.0%})")
        if intent["signals"]:
            print(f"   Signals: {', '.join(intent['signals'])}")
        # Per-stage timing breakdown as assembled by enhanced_search().
        print(f"⏱️ Total: {result['timing']['total_ms']:.0f}ms "
              f"(classify: {result['timing']['classification_ms']:.1f}ms, "
              f"search: {result['timing']['search_ms']:.0f}ms, "
              f"score: {result['timing']['scoring_ms']:.1f}ms)")
        print(f"📊 {result['total_returned']}/{result['total_raw']} results\n")

        for i, r in enumerate(result["results"], 1):
            # Results may come from ad-hoc sources with no path.
            source = Path(r["source"]).name if r["source"] else "unknown"
            print(f"  {i}. [{r['score']:.3f}] {source}")
            text_preview = r["text"][:120].replace("\n", " ")
            print(f"     {text_preview}")
            print()


if __name__ == "__main__":
    main()
|
||||||
392
cortex/feedback_loop.py
Normal file
392
cortex/feedback_loop.py
Normal file
|
|
@ -0,0 +1,392 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""Feedback Loop Engine — automatically extract lessons from session transcripts.
|
||||||
|
|
||||||
|
Scans OpenClaw session JSONL files, detects patterns (corrections, retries,
|
||||||
|
tool failures, knowledge gaps, self-acknowledged errors), and appends
|
||||||
|
findings to growth-log.md.
|
||||||
|
|
||||||
|
Usage:
|
||||||
|
python3 feedback_loop.py --since 24h
|
||||||
|
python3 feedback_loop.py --since 7d --dry-run
|
||||||
|
python3 feedback_loop.py --session <session-file>
|
||||||
|
"""
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import re
|
||||||
|
import sys
|
||||||
|
from datetime import datetime, timedelta, timezone
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Any
|
||||||
|
|
||||||
|
# Default config location: config.json alongside this module.
DEFAULT_CONFIG_PATH = Path(__file__).parent / "config.json"
|
||||||
|
|
||||||
|
|
||||||
|
def load_config(path: Path | None = None) -> dict:
|
||||||
|
p = path or DEFAULT_CONFIG_PATH
|
||||||
|
if p.exists():
|
||||||
|
with open(p) as f:
|
||||||
|
return json.load(f)
|
||||||
|
return {}
|
||||||
|
|
||||||
|
|
||||||
|
def expand(p: str) -> Path:
    """Expand a leading '~' in *p* and return it as a Path."""
    expanded = os.path.expanduser(p)
    return Path(expanded)
|
||||||
|
|
||||||
|
|
||||||
|
def parse_since(since: str) -> datetime:
|
||||||
|
"""Parse '24h', '7d', '2h', etc. into a UTC datetime."""
|
||||||
|
m = re.match(r"^(\d+)([hdm])$", since.strip())
|
||||||
|
if not m:
|
||||||
|
raise ValueError(f"Invalid --since format: {since!r}. Use e.g. 24h, 7d, 30m")
|
||||||
|
val, unit = int(m.group(1)), m.group(2)
|
||||||
|
delta = {"h": timedelta(hours=val), "d": timedelta(days=val), "m": timedelta(minutes=val)}[unit]
|
||||||
|
return datetime.now(timezone.utc) - delta
|
||||||
|
|
||||||
|
|
||||||
|
def parse_jsonl(path: Path) -> list[dict]:
    """Parse a JSONL file, skipping blank and malformed lines."""
    entries: list[dict] = []
    for raw in path.read_text().splitlines():
        raw = raw.strip()
        if not raw:
            continue
        try:
            entries.append(json.loads(raw))
        except json.JSONDecodeError:
            continue
    return entries
|
||||||
|
|
||||||
|
|
||||||
|
def get_session_timestamp(entries: list[dict]) -> datetime | None:
|
||||||
|
"""Extract session start timestamp."""
|
||||||
|
for e in entries:
|
||||||
|
ts = e.get("timestamp")
|
||||||
|
if ts:
|
||||||
|
try:
|
||||||
|
return datetime.fromisoformat(ts.replace("Z", "+00:00"))
|
||||||
|
except (ValueError, TypeError):
|
||||||
|
pass
|
||||||
|
return None
|
||||||
|
|
||||||
|
|
||||||
|
def get_text_content(message: dict) -> str:
    """Extract the plain-text content of a message entry.

    Handles both string content and the list-of-items form, where only
    items of type "text" contribute.
    """
    content = message.get("message", {}).get("content", "")
    if isinstance(content, str):
        return content
    if not isinstance(content, list):
        return ""
    texts = [
        item.get("text", "")
        for item in content
        if isinstance(item, dict) and item.get("type") == "text"
    ]
    return " ".join(texts)
|
||||||
|
|
||||||
|
|
||||||
|
def get_tool_name(message: dict) -> str | None:
|
||||||
|
"""Extract tool name from a toolCall content item."""
|
||||||
|
msg = message.get("message", {})
|
||||||
|
content = msg.get("content", [])
|
||||||
|
if isinstance(content, list):
|
||||||
|
for item in content:
|
||||||
|
if isinstance(item, dict) and item.get("type") == "toolCall":
|
||||||
|
return item.get("name")
|
||||||
|
return None
|
||||||
|
|
||||||
|
|
||||||
|
def get_tool_result_error(entry: dict) -> str | None:
|
||||||
|
"""Check if a toolResult entry contains an error."""
|
||||||
|
msg = entry.get("message", {})
|
||||||
|
if msg.get("isError"):
|
||||||
|
content = msg.get("content", [])
|
||||||
|
if isinstance(content, list):
|
||||||
|
for item in content:
|
||||||
|
if isinstance(item, dict):
|
||||||
|
return item.get("text", "error")
|
||||||
|
return "error"
|
||||||
|
return None
|
||||||
|
|
||||||
|
|
||||||
|
# --- Detection Heuristics ---
|
||||||
|
|
||||||
|
class Finding:
    """A single detected pattern in a session transcript."""

    def __init__(self, category: str, trigger: str, lines: tuple[int, int],
                 session_file: str, confidence: float = 1.0):
        # Detection category, e.g. "correction", "retry", "tool_failure".
        self.category = category
        # Human-readable description of what tripped the detector.
        self.trigger = trigger
        # (start, end) 1-based entry indices within the session file.
        self.lines = lines
        # Path of the session JSONL file the finding came from.
        self.session_file = session_file
        # Detector certainty in [0, 1]; findings below the configured
        # min_confidence are filtered out in analyze_session().
        self.confidence = confidence
|
||||||
|
|
||||||
|
|
||||||
|
def detect_corrections(entries: list[dict], config: dict, session_file: str) -> list[Finding]:
    """Detect user corrections after agent actions.

    A user message that directly follows an assistant message and contains a
    configured correction keyword as a whole word is flagged (confidence 0.7).
    """
    keywords = config.get("detection", {}).get("correction_keywords",
                                               ["nein", "falsch", "wrong", "nicht", "stop"])
    findings = []
    # State: was the previous role-bearing entry from the assistant, and at
    # which index (used as the start of the finding's line range).
    prev_was_assistant = False
    prev_line = 0
    for i, entry in enumerate(entries):
        msg = entry.get("message", {})
        role = msg.get("role")
        if role == "assistant":
            prev_was_assistant = True
            prev_line = i
            continue
        if role == "user" and prev_was_assistant:
            text = get_text_content(entry).lower()
            for kw in keywords:
                # Whole-word match, so e.g. "nicht" does not fire inside "nichts".
                if re.search(r'\b' + re.escape(kw) + r'\b', text):
                    findings.append(Finding(
                        category="correction",
                        trigger=f"User said '{kw}' after agent response",
                        lines=(prev_line + 1, i + 1),
                        session_file=session_file,
                        confidence=0.7,
                    ))
                    # At most one finding per user message.
                    break
        # Any user message ends the "just after assistant" window.
        if role == "user":
            prev_was_assistant = False
    return findings
|
||||||
|
|
||||||
|
|
||||||
|
def detect_retries(entries: list[dict], config: dict, session_file: str) -> list[Finding]:
    """Detect same tool called N+ times in sequence.

    N comes from config detection.retry_threshold (default 3).
    NOTE(review): entries without a toolCall do not reset the run, so a
    "sequence" may be interleaved with results/messages — confirm intended.
    """
    threshold = config.get("detection", {}).get("retry_threshold", 3)
    findings = []
    # Current run: which tool, how many consecutive calls, where it started.
    current_tool = None
    count = 0
    start_line = 0
    for i, entry in enumerate(entries):
        tool = get_tool_name(entry)
        if tool:
            if tool == current_tool:
                count += 1
            else:
                # Run ended; record it if it reached the threshold.
                if current_tool and count >= threshold:
                    findings.append(Finding(
                        category="retry",
                        trigger=f"Tool '{current_tool}' called {count} times in sequence",
                        lines=(start_line + 1, i),
                        session_file=session_file,
                    ))
                current_tool = tool
                count = 1
                start_line = i
    # Final check: the loop above never closes the trailing run.
    if current_tool and count >= threshold:
        findings.append(Finding(
            category="retry",
            trigger=f"Tool '{current_tool}' called {count} times in sequence",
            lines=(start_line + 1, len(entries)),
            session_file=session_file,
        ))
    return findings
|
||||||
|
|
||||||
|
|
||||||
|
def detect_tool_failures(entries: list[dict], config: dict, session_file: str) -> list[Finding]:
    """Detect tool result errors.

    Two signals per entry: an explicit isError toolResult (confidence 1.0),
    or toolResult text matching a configured error pattern (confidence 0.5).
    """
    error_patterns = config.get("detection", {}).get("error_patterns",
                                                     ["error", "Error", "failed", "Failed"])
    findings = []
    for i, entry in enumerate(entries):
        if entry.get("type") == "message":
            msg = entry.get("message", {})
            # Explicit isError takes precedence and skips pattern matching.
            err = get_tool_result_error(entry)
            if err:
                findings.append(Finding(
                    category="tool_failure",
                    trigger=f"Tool returned error: {err[:120]}",
                    lines=(i + 1, i + 1),
                    session_file=session_file,
                ))
                continue
            # Check tool result content for error patterns.
            if msg.get("role") == "toolResult":
                content = msg.get("content", [])
                if isinstance(content, list):
                    for item in content:
                        text = item.get("text", "") if isinstance(item, dict) else ""
                        for pat in error_patterns:
                            if pat in text:
                                findings.append(Finding(
                                    category="tool_failure",
                                    trigger=f"Tool result contains '{pat}': {text[:100]}",
                                    lines=(i + 1, i + 1),
                                    session_file=session_file,
                                    confidence=0.5,
                                ))
                                break
                        else:
                            # No pattern matched this item — try the next one.
                            continue
                        # A pattern matched: record at most one finding per entry.
                        break
    return findings
|
||||||
|
|
||||||
|
|
||||||
|
def detect_self_errors(entries: list[dict], config: dict, session_file: str) -> list[Finding]:
    """Detect agent self-acknowledged errors (apology keywords)."""
    keywords = config.get("detection", {}).get("apology_keywords",
                                               ["sorry", "entschuldigung", "my mistake"])
    findings: list[Finding] = []
    for idx, entry in enumerate(entries):
        if entry.get("message", {}).get("role") != "assistant":
            continue
        text = get_text_content(entry).lower()
        # First matching keyword wins; at most one finding per message.
        matched = next((kw for kw in keywords if kw.lower() in text), None)
        if matched is not None:
            findings.append(Finding(
                category="self_error",
                trigger=f"Agent acknowledged error with '{matched}'",
                lines=(idx + 1, idx + 1),
                session_file=session_file,
                confidence=0.6,
            ))
    return findings
|
||||||
|
|
||||||
|
|
||||||
|
def detect_knowledge_gaps(entries: list[dict], config: dict, session_file: str) -> list[Finding]:
    """Detect when the user provides the answer after the agent couldn't find it.

    An assistant message containing a "couldn't find"-style phrase, followed
    within the next three entries by a substantial (>20 char) user message,
    is flagged with confidence 0.6.
    """
    findings = []
    gap_phrases = ["i don't know", "ich weiß nicht", "couldn't find", "konnte nicht finden",
                   "unable to", "no results", "not found", "keine ergebnisse"]
    for i, entry in enumerate(entries):
        msg = entry.get("message", {})
        if msg.get("role") == "assistant":
            text = get_text_content(entry).lower()
            has_gap = any(p in text for p in gap_phrases)
            if has_gap:
                # Check if a nearby following user message provides info.
                for j in range(i + 1, min(i + 4, len(entries))):
                    next_msg = entries[j].get("message", {})
                    if next_msg.get("role") == "user":
                        user_text = get_text_content(entries[j])
                        if len(user_text) > 20:  # Substantial answer
                            findings.append(Finding(
                                category="knowledge_gap",
                                # Fix: was an f-string with no placeholders (F541).
                                trigger="Agent couldn't find answer, user provided it",
                                lines=(i + 1, j + 1),
                                session_file=session_file,
                                confidence=0.6,
                            ))
                            break
    return findings
|
||||||
|
|
||||||
|
|
||||||
|
def analyze_session(entries: list[dict], config: dict, session_file: str) -> list[Finding]:
    """Run every detector over one session and filter by minimum confidence."""
    min_conf = config.get("detection", {}).get("min_confidence", 0.5)
    detectors = (detect_corrections, detect_retries, detect_tool_failures,
                 detect_self_errors, detect_knowledge_gaps)
    collected = [f for detect in detectors for f in detect(entries, config, session_file)]
    return [f for f in collected if f.confidence >= min_conf]
|
||||||
|
|
||||||
|
|
||||||
|
def finding_to_markdown(finding: Finding, config: dict) -> str:
|
||||||
|
"""Format a finding as growth-log markdown."""
|
||||||
|
categories = config.get("categories", {})
|
||||||
|
cat_label = categories.get(finding.category, finding.category.replace("_", " ").title())
|
||||||
|
date = datetime.now().strftime("%Y-%m-%d")
|
||||||
|
session_name = Path(finding.session_file).stem
|
||||||
|
return f"""### {date} — [Auto-detected: {cat_label}]
|
||||||
|
- **Trigger:** {finding.trigger}
|
||||||
|
- **Erkenntnis:** Auto-detected pattern — review recommended
|
||||||
|
- **Neue Fähigkeit:** Awareness of recurring pattern
|
||||||
|
- **Source:** {session_name} lines {finding.lines[0]}-{finding.lines[1]}
|
||||||
|
"""
|
||||||
|
|
||||||
|
|
||||||
|
def deduplicate_findings(findings: list[Finding]) -> list[Finding]:
|
||||||
|
"""Remove duplicate findings by category + similar trigger."""
|
||||||
|
seen = set()
|
||||||
|
unique = []
|
||||||
|
for f in findings:
|
||||||
|
key = (f.category, f.trigger[:60])
|
||||||
|
if key not in seen:
|
||||||
|
seen.add(key)
|
||||||
|
unique.append(f)
|
||||||
|
return unique
|
||||||
|
|
||||||
|
|
||||||
|
def append_to_growth_log(findings: list[Finding], config: dict, dry_run: bool = False) -> str:
|
||||||
|
"""Append findings to growth-log.md. Returns the text that was/would be appended."""
|
||||||
|
if not findings:
|
||||||
|
return ""
|
||||||
|
text = "\n---\n\n"
|
||||||
|
for f in findings:
|
||||||
|
text += finding_to_markdown(f, config) + "\n"
|
||||||
|
if dry_run:
|
||||||
|
return text
|
||||||
|
log_path = expand(config.get("growth_log_path", "~/clawd/memory/growth-log.md"))
|
||||||
|
with open(log_path, "a") as fh:
|
||||||
|
fh.write(text)
|
||||||
|
return text
|
||||||
|
|
||||||
|
|
||||||
|
def get_recent_sessions(config: dict, since: datetime) -> list[Path]:
    """Return session JSONL files modified at/after *since*, newest first."""
    raw_dir = config.get("sessions_dir", "~/.openclaw/agents/main/sessions")
    sessions_dir = Path(os.path.expanduser(raw_dir))
    if not sessions_dir.exists():
        return []
    recent = [
        f for f in sessions_dir.glob("*.jsonl")
        if datetime.fromtimestamp(f.stat().st_mtime, tz=timezone.utc) >= since
    ]
    return sorted(recent, key=lambda f: f.stat().st_mtime, reverse=True)
|
||||||
|
|
||||||
|
|
||||||
|
def run(since: str = "24h", session: str | None = None, dry_run: bool = False,
        config_path: str | None = None) -> list[Finding]:
    """Analyze recent (or one specific) session(s) and log findings.

    Args:
        since: Time window like '24h', '7d', '30m' (ignored when *session* given).
        session: Optional path to a single session JSONL file; exits(1) if missing.
        dry_run: When True (or forced by config "dry_run"), print instead of writing.
        config_path: Optional path to config.json.

    Returns:
        The deduplicated, confidence-filtered findings.
    """
    config = load_config(Path(config_path) if config_path else None)
    # Config may force dry-run globally regardless of the CLI flag.
    if config.get("dry_run"):
        dry_run = True

    if session:
        session_path = Path(session)
        if not session_path.exists():
            print(f"Session file not found: {session}", file=sys.stderr)
            sys.exit(1)
        sessions = [session_path]
    else:
        cutoff = parse_since(since)
        sessions = get_recent_sessions(config, cutoff)

    all_findings: list[Finding] = []
    for s in sessions:
        entries = parse_jsonl(s)
        all_findings.extend(analyze_session(entries, config, str(s)))

    all_findings = deduplicate_findings(all_findings)
    output = append_to_growth_log(all_findings, config, dry_run=dry_run)

    if output:
        if dry_run:
            print("=== DRY RUN — would append: ===")
            print(output)
        else:
            # Fix: the real (non-dry-run) append previously produced no
            # feedback at all; report what was written.
            print(f"Appended {len(all_findings)} finding(s) to growth log.")
    else:
        print("No patterns detected.")

    return all_findings
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """Parse CLI arguments and invoke run()."""
    parser = argparse.ArgumentParser(description="Feedback Loop Engine")
    parser.add_argument("--since", default="24h", help="Time window (e.g. 24h, 7d, 30m)")
    parser.add_argument("--session", help="Analyze a specific session file")
    parser.add_argument("--dry-run", action="store_true", help="Don't write to growth-log")
    parser.add_argument("--config", help="Path to config.json")
    options = parser.parse_args()
    run(
        since=options.since,
        session=options.session,
        dry_run=options.dry_run,
        config_path=options.config,
    )


if __name__ == "__main__":
    main()
|
||||||
515
cortex/health_scanner.py
Normal file
515
cortex/health_scanner.py
Normal file
|
|
@ -0,0 +1,515 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""Proactive Health Scanner — finds problems BEFORE they become alerts.
|
||||||
|
|
||||||
|
Checks: agent health, resource trends, dependency health, configuration drift.
|
||||||
|
Designed for cron: fast (<30s), no side effects.
|
||||||
|
|
||||||
|
Usage:
|
||||||
|
python3 health_scanner.py [--json] [--section agents|resources|deps|config]
|
||||||
|
"""
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import hashlib
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import re
|
||||||
|
import shutil
|
||||||
|
import subprocess
|
||||||
|
import sys
|
||||||
|
import time
|
||||||
|
import urllib.request
|
||||||
|
from datetime import datetime, timedelta
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Any
|
||||||
|
|
||||||
|
# --- Constants ---
|
||||||
|
# Main OpenClaw configuration file and per-agent state directory.
OPENCLAW_CONFIG = Path.home() / ".openclaw" / "openclaw.json"
OPENCLAW_AGENTS_DIR = Path.home() / ".openclaw" / "agents"
# Model IDs known to be deprecated, mapped to their sunset date (ISO).
DEPRECATED_MODELS = {
    "anthropic/claude-3-5-haiku-latest": "2026-02-19",
    "claude-3-5-haiku-latest": "2026-02-19",
}
# Rolling record of disk-usage samples used for growth-trend estimation.
DISK_HISTORY_FILE = Path.home() / ".cache" / "health-scanner" / "disk_history.json"
# Local Ollama REST endpoint that lists installed models.
OLLAMA_URL = "http://localhost:11434/api/tags"

# Finding severity labels, ordered by _severity_rank().
INFO, WARN, CRITICAL = "INFO", "WARN", "CRITICAL"
|
||||||
|
|
||||||
|
|
||||||
|
def _severity_rank(s: str) -> int:
|
||||||
|
return {"INFO": 0, "WARN": 1, "CRITICAL": 2}.get(s, -1)
|
||||||
|
|
||||||
|
|
||||||
|
class Finding:
    """One health-check observation with severity and optional detail."""

    def __init__(self, section: str, severity: str, title: str, detail: str = ""):
        self.section = section      # check group: agents / resources / deps / config
        self.severity = severity    # "INFO", "WARN" or "CRITICAL"
        self.title = title          # short human-readable summary
        self.detail = detail        # optional extra context

    def to_dict(self) -> dict:
        """Serialize for JSON output."""
        return {
            "section": self.section,
            "severity": self.severity,
            "title": self.title,
            "detail": self.detail,
        }
|
||||||
|
|
||||||
|
|
||||||
|
class HealthScanner:
|
||||||
|
    def __init__(self):
        # Accumulated Finding objects from all checks.
        self.findings: list[Finding] = []
        # Parsed OpenClaw config; stays {} when unreadable (a CRITICAL
        # finding is recorded by _load_config in that case).
        self.config: dict = {}
        self._load_config()
|
||||||
|
|
||||||
|
def _load_config(self):
|
||||||
|
try:
|
||||||
|
self.config = json.loads(OPENCLAW_CONFIG.read_text())
|
||||||
|
except Exception:
|
||||||
|
self.findings.append(Finding("config", CRITICAL, "Cannot read OpenClaw config",
|
||||||
|
str(OPENCLAW_CONFIG)))
|
||||||
|
|
||||||
|
def _add(self, section: str, severity: str, title: str, detail: str = ""):
|
||||||
|
self.findings.append(Finding(section, severity, title, detail))
|
||||||
|
|
||||||
|
# --- A) Agent Health ---
|
||||||
|
    def check_agents(self):
        """Per-agent checks: workspace validity, session activity, model reachability."""
        agents = self.config.get("agents", {}).get("list", [])
        if not agents:
            self._add("agents", WARN, "No agents found in config")
            return

        for agent in agents:
            aid = agent.get("id", "unknown")
            # Workspace check: must exist and be writable.
            ws = agent.get("workspace", "")
            if ws:
                wp = Path(ws)
                if not wp.exists():
                    self._add("agents", CRITICAL, f"Agent '{aid}' workspace missing", ws)
                elif not os.access(wp, os.W_OK):
                    self._add("agents", WARN, f"Agent '{aid}' workspace not writable", ws)
                else:
                    self._add("agents", INFO, f"Agent '{aid}' workspace OK")
            else:
                self._add("agents", WARN, f"Agent '{aid}' has no workspace configured")

            # Session activity check: flag agents idle for more than a week.
            session_dir = OPENCLAW_AGENTS_DIR / aid / "sessions"
            if session_dir.exists():
                sessions = list(session_dir.iterdir())
                if sessions:
                    # NOTE(review): assumes at least one listing entry is a
                    # regular file; max() on an empty generator would raise
                    # if the dir holds only subdirectories — confirm.
                    latest_mtime = max(f.stat().st_mtime for f in sessions if f.is_file())
                    age_days = (time.time() - latest_mtime) / 86400
                    if age_days > 7:
                        self._add("agents", WARN,
                                  f"Agent '{aid}' inactive for {age_days:.0f} days",
                                  f"Last session activity: {datetime.fromtimestamp(latest_mtime).isoformat()}")
                    else:
                        self._add("agents", INFO,
                                  f"Agent '{aid}' last active {age_days:.1f} days ago")
                else:
                    self._add("agents", INFO, f"Agent '{aid}' has no session files")
            else:
                self._add("agents", INFO, f"Agent '{aid}' session dir not found")

            # Model reachability: local ollama models are probed against the
            # Ollama API; cloud models are only reported, not probed.
            model = agent.get("model", {}).get("primary", "")
            if model.startswith("ollama"):
                self._check_ollama_model(aid, model)
            elif model:
                self._add("agents", INFO, f"Agent '{aid}' uses cloud model: {model}")
|
||||||
|
|
||||||
|
    def _check_ollama_model(self, aid: str, model: str):
        """Check if ollama model is reachable.

        Queries the local Ollama /api/tags endpoint and verifies that the
        agent's configured model appears among the installed models.
        """
        try:
            req = urllib.request.Request(OLLAMA_URL, method="GET")
            with urllib.request.urlopen(req, timeout=5) as resp:
                data = json.loads(resp.read())
                # Strip a provider prefix like "ollama/" to get the bare name.
                model_name = model.split("/", 1)[-1] if "/" in model else model
                available = [m.get("name", "") for m in data.get("models", [])]
                # Substring match: installed names often carry a ":tag" suffix.
                if any(model_name in m for m in available):
                    self._add("agents", INFO, f"Agent '{aid}' ollama model available: {model_name}")
                else:
                    self._add("agents", WARN,
                              f"Agent '{aid}' ollama model not found: {model_name}",
                              f"Available: {', '.join(available[:10])}")
        except Exception as e:
            self._add("agents", WARN, f"Agent '{aid}' ollama unreachable for model check",
                      str(e))
|
||||||
|
|
||||||
|
# --- B) Resource Trends ---
|
||||||
|
    def check_resources(self):
        """Run all resource checks: disk, memory, session files, DB and log sizes."""
        # Disk usage
        self._check_disk()
        # Memory
        self._check_memory()
        # Session file accumulation
        self._check_session_files()
        # SQLite DB sizes
        self._check_db_sizes()
        # Log file sizes
        self._check_log_sizes()
|
||||||
|
|
||||||
|
def _check_disk(self):
|
||||||
|
usage = shutil.disk_usage("/")
|
||||||
|
pct = usage.used / usage.total * 100
|
||||||
|
free_gb = usage.free / (1024 ** 3)
|
||||||
|
if pct > 95:
|
||||||
|
self._add("resources", CRITICAL, f"Disk {pct:.1f}% full ({free_gb:.1f}GB free)")
|
||||||
|
elif pct > 85:
|
||||||
|
self._add("resources", WARN, f"Disk {pct:.1f}% full ({free_gb:.1f}GB free)")
|
||||||
|
else:
|
||||||
|
self._add("resources", INFO, f"Disk {pct:.1f}% used ({free_gb:.1f}GB free)")
|
||||||
|
|
||||||
|
# Trend tracking
|
||||||
|
self._track_disk_trend(usage.used)
|
||||||
|
|
||||||
|
    def _track_disk_trend(self, current_bytes: int):
        """Append a disk-usage sample and warn if growth predicts disk-full soon.

        Keeps a 7-day rolling history in DISK_HISTORY_FILE. Best-effort:
        any failure (unwritable cache dir, corrupt history) is silently ignored.
        """
        try:
            DISK_HISTORY_FILE.parent.mkdir(parents=True, exist_ok=True)
            history = []
            if DISK_HISTORY_FILE.exists():
                history = json.loads(DISK_HISTORY_FILE.read_text())
            now = time.time()
            history.append({"ts": now, "used": current_bytes})
            # Keep last 7 days
            cutoff = now - 7 * 86400
            history = [h for h in history if h["ts"] > cutoff]
            DISK_HISTORY_FILE.write_text(json.dumps(history))

            if len(history) >= 2:
                oldest, newest = history[0], history[-1]
                dt = newest["ts"] - oldest["ts"]
                if dt > 3600:  # at least 1 hour of data
                    # Linear extrapolation of bytes/day from the span endpoints.
                    growth_per_day = (newest["used"] - oldest["used"]) / dt * 86400
                    gb_per_day = growth_per_day / (1024 ** 3)
                    if gb_per_day > 1:
                        total = shutil.disk_usage("/").total
                        remaining = total - current_bytes
                        # Guard against division by zero on flat/negative growth.
                        days_left = remaining / growth_per_day if growth_per_day > 0 else 999
                        self._add("resources", WARN,
                                  f"Disk growing {gb_per_day:.1f}GB/day, ~{days_left:.0f} days until full")
        except Exception:
            # Trend tracking is purely advisory; never fail the scan over it.
            pass
|
||||||
|
|
||||||
|
def _check_memory(self):
|
||||||
|
try:
|
||||||
|
with open("/proc/meminfo") as f:
|
||||||
|
info = {}
|
||||||
|
for line in f:
|
||||||
|
parts = line.split(":")
|
||||||
|
if len(parts) == 2:
|
||||||
|
key = parts[0].strip()
|
||||||
|
val = int(parts[1].strip().split()[0]) # kB
|
||||||
|
info[key] = val
|
||||||
|
total = info.get("MemTotal", 1)
|
||||||
|
available = info.get("MemAvailable", total)
|
||||||
|
used_pct = (1 - available / total) * 100
|
||||||
|
if used_pct > 90:
|
||||||
|
self._add("resources", CRITICAL, f"Memory {used_pct:.0f}% used")
|
||||||
|
elif used_pct > 80:
|
||||||
|
self._add("resources", WARN, f"Memory {used_pct:.0f}% used")
|
||||||
|
else:
|
||||||
|
self._add("resources", INFO, f"Memory {used_pct:.0f}% used")
|
||||||
|
except Exception as e:
|
||||||
|
self._add("resources", WARN, "Cannot read memory info", str(e))
|
||||||
|
|
||||||
|
def _check_session_files(self):
|
||||||
|
if not OPENCLAW_AGENTS_DIR.exists():
|
||||||
|
return
|
||||||
|
for agent_dir in OPENCLAW_AGENTS_DIR.iterdir():
|
||||||
|
sessions = agent_dir / "sessions"
|
||||||
|
if sessions.exists():
|
||||||
|
count = sum(1 for _ in sessions.iterdir())
|
||||||
|
if count > 1000:
|
||||||
|
self._add("resources", WARN,
|
||||||
|
f"Agent '{agent_dir.name}' has {count} session files")
|
||||||
|
elif count > 500:
|
||||||
|
self._add("resources", INFO,
|
||||||
|
f"Agent '{agent_dir.name}' has {count} session files")
|
||||||
|
|
||||||
|
def _check_db_sizes(self):
|
||||||
|
"""Check for large SQLite/DB files."""
|
||||||
|
search_paths = [
|
||||||
|
Path.home() / ".openclaw",
|
||||||
|
Path.home() / "clawd",
|
||||||
|
]
|
||||||
|
for base in search_paths:
|
||||||
|
if not base.exists():
|
||||||
|
continue
|
||||||
|
try:
|
||||||
|
for db_file in base.rglob("*.db"):
|
||||||
|
size_mb = db_file.stat().st_size / (1024 ** 2)
|
||||||
|
if size_mb > 500:
|
||||||
|
self._add("resources", WARN,
|
||||||
|
f"Large DB: {db_file} ({size_mb:.0f}MB)")
|
||||||
|
for db_file in base.rglob("*.sqlite"):
|
||||||
|
size_mb = db_file.stat().st_size / (1024 ** 2)
|
||||||
|
if size_mb > 500:
|
||||||
|
self._add("resources", WARN,
|
||||||
|
f"Large DB: {db_file} ({size_mb:.0f}MB)")
|
||||||
|
except PermissionError:
|
||||||
|
pass
|
||||||
|
|
||||||
|
def _check_log_sizes(self):
|
||||||
|
log_dirs = [
|
||||||
|
Path.home() / ".openclaw" / "logs",
|
||||||
|
Path.home() / "clawd" / "logs",
|
||||||
|
Path("/tmp"),
|
||||||
|
]
|
||||||
|
for d in log_dirs:
|
||||||
|
if not d.exists():
|
||||||
|
continue
|
||||||
|
try:
|
||||||
|
for f in d.iterdir():
|
||||||
|
if f.suffix in (".log", ".txt") and f.is_file():
|
||||||
|
size_mb = f.stat().st_size / (1024 ** 2)
|
||||||
|
if size_mb > 100:
|
||||||
|
self._add("resources", WARN,
|
||||||
|
f"Large log: {f} ({size_mb:.0f}MB)")
|
||||||
|
except PermissionError:
|
||||||
|
pass
|
||||||
|
|
||||||
|
# --- C) Dependency Health ---
|
||||||
|
    def check_deps(self):
        """Check external dependencies: NATS, TypeDB, ChromaDB, Ollama, key expiry."""
        self._check_nats()
        self._check_typedb()
        self._check_chromadb()
        self._check_ollama()
        self._check_key_expiry()
|
||||||
|
|
||||||
|
def _run_cmd(self, cmd: list[str], timeout: int = 5) -> tuple[int, str]:
|
||||||
|
try:
|
||||||
|
r = subprocess.run(cmd, capture_output=True, text=True, timeout=timeout)
|
||||||
|
return r.returncode, r.stdout.strip()
|
||||||
|
except subprocess.TimeoutExpired:
|
||||||
|
return -1, "timeout"
|
||||||
|
except FileNotFoundError:
|
||||||
|
return -2, "not found"
|
||||||
|
except Exception as e:
|
||||||
|
return -3, str(e)
|
||||||
|
|
||||||
|
def _check_docker_container(self, name: str) -> bool:
|
||||||
|
"""Check if a service is running as a Docker container."""
|
||||||
|
rc, out = self._run_cmd(
|
||||||
|
["sg", "docker", "-c", f"docker ps --filter name={name} --format '{{{{.Names}}}} {{{{.Status}}}}'"],
|
||||||
|
timeout=10
|
||||||
|
)
|
||||||
|
if rc == 0 and out.strip():
|
||||||
|
return True
|
||||||
|
return False
|
||||||
|
|
||||||
|
def _check_nats(self):
|
||||||
|
rc, out = self._run_cmd(["systemctl", "--user", "is-active", "nats-server"])
|
||||||
|
if rc == 0 and out == "active":
|
||||||
|
self._add("deps", INFO, "NATS server active")
|
||||||
|
elif self._check_docker_container("nats"):
|
||||||
|
self._add("deps", INFO, "NATS server active (Docker)")
|
||||||
|
else:
|
||||||
|
self._add("deps", CRITICAL, "NATS server not active", out)
|
||||||
|
|
||||||
|
def _check_typedb(self):
|
||||||
|
# Check for typedb process
|
||||||
|
rc, out = self._run_cmd(["pgrep", "-f", "typedb"])
|
||||||
|
if rc == 0:
|
||||||
|
self._add("deps", INFO, "TypeDB running")
|
||||||
|
elif self._check_docker_container("typedb"):
|
||||||
|
self._add("deps", INFO, "TypeDB running (Docker)")
|
||||||
|
else:
|
||||||
|
rc2, out2 = self._run_cmd(["systemctl", "--user", "is-active", "typedb"])
|
||||||
|
if rc2 == 0 and out2 == "active":
|
||||||
|
self._add("deps", INFO, "TypeDB service active")
|
||||||
|
else:
|
||||||
|
self._add("deps", WARN, "TypeDB not detected", "May not be running")
|
||||||
|
|
||||||
|
def _check_chromadb(self):
|
||||||
|
rag_dirs = list(Path.home().glob("**/.rag-db"))[:3]
|
||||||
|
clawd_rag = Path.home() / "clawd" / ".rag-db"
|
||||||
|
if clawd_rag.exists():
|
||||||
|
age_hours = (time.time() - clawd_rag.stat().st_mtime) / 3600
|
||||||
|
if age_hours > 48:
|
||||||
|
self._add("deps", WARN,
|
||||||
|
f"ChromaDB (.rag-db) last modified {age_hours:.0f}h ago")
|
||||||
|
else:
|
||||||
|
self._add("deps", INFO, f"ChromaDB (.rag-db) fresh ({age_hours:.0f}h)")
|
||||||
|
else:
|
||||||
|
self._add("deps", INFO, "No .rag-db found in clawd workspace")
|
||||||
|
|
||||||
|
def _check_ollama(self):
|
||||||
|
try:
|
||||||
|
req = urllib.request.Request(OLLAMA_URL, method="GET")
|
||||||
|
with urllib.request.urlopen(req, timeout=5) as resp:
|
||||||
|
data = json.loads(resp.read())
|
||||||
|
count = len(data.get("models", []))
|
||||||
|
self._add("deps", INFO, f"Ollama reachable ({count} models)")
|
||||||
|
except Exception as e:
|
||||||
|
self._add("deps", WARN, "Ollama not reachable", str(e))
|
||||||
|
|
||||||
|
    def _check_key_expiry(self):
        """Scan env files for date-like patterns that might indicate key expiry.

        Heuristic only: any ISO date within the next 30 days found in an .env
        file is surfaced as a possible credential expiry.
        """
        env_files = list(Path.home().glob(".config/**/*.env"))
        env_files += list(Path.home().glob("clawd/**/.env"))
        env_files += [Path.home() / ".env"]
        now = datetime.now()
        date_pattern = re.compile(r'(\d{4}-\d{2}-\d{2})')
        for ef in env_files:
            if not ef.exists() or not ef.is_file():
                continue
            try:
                content = ef.read_text()
                for match in date_pattern.finditer(content):
                    try:
                        d = datetime.fromisoformat(match.group(1))
                        # Only dates in the next 30 days: past dates and
                        # far-future dates are unlikely to be imminent expiries.
                        if now < d < now + timedelta(days=30):
                            self._add("deps", WARN,
                                      f"Possible expiry date {match.group(1)} in {ef.name}",
                                      str(ef))
                    except ValueError:
                        pass  # matched text is not a parseable ISO date
            except Exception:
                pass  # unreadable file — best-effort scan, skip silently
|
||||||
|
    # --- D) Configuration Drift ---
    def check_config(self):
        """Section D: configuration drift checks (deprecated models, config hash)."""
        self._check_deprecated_models()
        self._check_config_hash()
|
||||||
|
|
||||||
|
    def _check_deprecated_models(self):
        """Warn about configured models that are near or past their EOL date.

        Collects every model referenced in the agent config (defaults,
        per-agent primaries/fallbacks, heartbeat models) and compares each
        against DEPRECATED_MODELS (model substring -> ISO EOL date).
        """
        agents = self.config.get("agents", {}).get("list", [])
        defaults = self.config.get("agents", {}).get("defaults", {})
        now = datetime.now()

        all_models = set()
        # Collect from defaults
        dm = defaults.get("model", {})
        if dm.get("primary"):
            all_models.add(dm["primary"])
        for fb in dm.get("fallbacks", []):
            all_models.add(fb)
        for m in defaults.get("models", {}):
            all_models.add(m)
        # Collect from agents
        for agent in agents:
            am = agent.get("model", {})
            if am.get("primary"):
                all_models.add(am["primary"])
            for fb in am.get("fallbacks", []):
                all_models.add(fb)
            hb = agent.get("heartbeat", {})
            if hb.get("model"):
                all_models.add(hb["model"])

        # Also check defaults heartbeat
        dhb = defaults.get("heartbeat", {})
        if dhb.get("model"):
            all_models.add(dhb["model"])

        for model in all_models:
            for dep_model, eol_date in DEPRECATED_MODELS.items():
                # Substring match so versioned model IDs still hit the table.
                if dep_model in model:
                    eol = datetime.fromisoformat(eol_date)
                    days_left = (eol - now).days
                    if days_left < 0:
                        self._add("config", CRITICAL,
                                  f"Model '{model}' is past EOL ({eol_date})")
                    elif days_left < 14:
                        self._add("config", WARN,
                                  f"Model '{model}' EOL in {days_left} days ({eol_date})")
                    else:
                        self._add("config", INFO,
                                  f"Model '{model}' EOL on {eol_date} ({days_left} days)")
|
||||||
|
|
||||||
|
    def _check_config_hash(self):
        """Check if config file has changed since last scan.

        Stores a truncated SHA-256 of the config under ~/.cache/health-scanner
        and reports an INFO finding when it differs from the previous run.
        """
        hash_file = Path.home() / ".cache" / "health-scanner" / "config_hash.txt"
        hash_file.parent.mkdir(parents=True, exist_ok=True)
        try:
            # 16 hex chars are plenty for change detection.
            current_hash = hashlib.sha256(OPENCLAW_CONFIG.read_bytes()).hexdigest()[:16]
            if hash_file.exists():
                prev_hash = hash_file.read_text().strip()
                if prev_hash != current_hash:
                    self._add("config", INFO, "Config file changed since last scan",
                              f"Old: {prev_hash}, New: {current_hash}")
            # Persist the current hash for next time (also seeds the first run).
            hash_file.write_text(current_hash)
        except Exception as e:
            self._add("config", WARN, "Cannot track config hash", str(e))
|
||||||
|
|
||||||
|
    # --- Run ---
    def run(self, sections: list[str] | None = None) -> dict:
        """Execute the requested check sections and build the report dict.

        Args:
            sections: Subset of section names to run ("agents", "resources",
                "deps", "config"). None runs all. Unknown names are ignored.

        Returns:
            Report dict with timestamp, overall severity (worst finding),
            per-severity counts, and the full findings list.
        """
        section_map = {
            "agents": self.check_agents,
            "resources": self.check_resources,
            "deps": self.check_deps,
            "config": self.check_config,
        }
        targets = sections if sections else list(section_map.keys())
        for s in targets:
            if s in section_map:
                try:
                    section_map[s]()
                except Exception as e:
                    # A crashing section must not abort the whole scan.
                    self._add(s, CRITICAL, f"Section '{s}' check failed", str(e))

        # Build report
        worst = INFO
        for f in self.findings:
            if _severity_rank(f.severity) > _severity_rank(worst):
                worst = f.severity

        return {
            "timestamp": datetime.now().isoformat(),
            "overall": worst,
            "findings_count": {
                INFO: sum(1 for f in self.findings if f.severity == INFO),
                WARN: sum(1 for f in self.findings if f.severity == WARN),
                CRITICAL: sum(1 for f in self.findings if f.severity == CRITICAL),
            },
            "findings": [f.to_dict() for f in self.findings],
        }
|
||||||
|
|
||||||
|
|
||||||
|
def format_human(report: dict) -> str:
    """Render a scan report as a human-readable, emoji-annotated summary."""
    lines = []
    overall = report["overall"]
    # Header icon reflects the overall (worst) severity.
    icon = {"INFO": "✅", "WARN": "⚠️", "CRITICAL": "🚨"}.get(overall, "❓")
    lines.append(f"{icon} Health Report — {overall}")
    lines.append(f"   {report['findings_count']}")
    lines.append(f"   {report['timestamp']}")
    lines.append("")

    # Group findings by severity, most severe first.
    for sev in [CRITICAL, WARN, INFO]:
        items = [f for f in report["findings"] if f["severity"] == sev]
        if not items:
            continue
        icon = {"CRITICAL": "🚨", "WARN": "⚠️", "INFO": "ℹ️"}[sev]
        lines.append(f"--- {sev} ({len(items)}) ---")
        for f in items:
            lines.append(f"  {icon} [{f['section']}] {f['title']}")
            if f["detail"]:
                lines.append(f"     {f['detail']}")
        lines.append("")

    return "\n".join(lines)
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """CLI entry point: run the scanner and exit with a severity-based code."""
    parser = argparse.ArgumentParser(description="Proactive Health Scanner")
    parser.add_argument("--json", action="store_true", help="Output JSON")
    parser.add_argument("--section", type=str, help="Comma-separated sections: agents,resources,deps,config")
    args = parser.parse_args()

    sections = args.section.split(",") if args.section else None
    scanner = HealthScanner()
    report = scanner.run(sections)

    if args.json:
        print(json.dumps(report, indent=2))
    else:
        print(format_human(report))

    # Exit code: 2 for CRITICAL, 1 for WARN, 0 for INFO
    if report["overall"] == CRITICAL:
        sys.exit(2)
    elif report["overall"] == WARN:
        sys.exit(1)
    sys.exit(0)
|
||||||
|
|
||||||
|
|
||||||
|
# Script entry point (also exposed as a cortex CLI subcommand).
if __name__ == "__main__":
    main()
|
||||||
191
cortex/intent_classifier.py
Executable file
191
cortex/intent_classifier.py
Executable file
|
|
@ -0,0 +1,191 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
Intent Classifier — Classify memory queries into WHO/WHEN/WHY/WHAT intents
|
||||||
|
using regex-based heuristics. No LLM call, <5ms per query.
|
||||||
|
|
||||||
|
Output: intent type + suggested weight adjustments for composite scorer.
|
||||||
|
"""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import re
|
||||||
|
import time
|
||||||
|
from dataclasses import dataclass, field
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Optional
|
||||||
|
|
||||||
|
CONFIG_PATH = Path(__file__).parent / "config.json"
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
class IntentResult:
    """Classification result for a query."""
    intent: str  # WHO, WHEN, WHY, WHAT
    confidence: float  # 0.0 to 1.0
    # Suggested weight deltas for the composite scorer, keyed per signal.
    weight_adjustments: dict = field(default_factory=dict)
    # Trace of which keywords/patterns/heuristics fired (e.g. "kw:wer").
    matched_signals: list = field(default_factory=list)
    # Wall-clock time spent classifying, in milliseconds.
    classification_ms: float = 0.0
|
||||||
|
|
||||||
|
|
||||||
|
# Module-level caches: compiled regexes per intent and the parsed config
# section. Both are cleared via reset_cache().
_compiled_patterns: dict[str, list[re.Pattern]] = {}
_config_cache: Optional[dict] = None


def _load_config(path: Optional[Path] = None) -> dict:
    """Return the 'intent_classification' section of the config (memoized).

    A missing config file yields an empty dict. Pass *path* to read a
    specific file; otherwise CONFIG_PATH is used.
    """
    global _config_cache
    if _config_cache is None:
        cfg_file = path or CONFIG_PATH
        if cfg_file.exists():
            with open(cfg_file) as fh:
                _config_cache = json.load(fh).get("intent_classification", {})
        else:
            _config_cache = {}
    return _config_cache


def _get_patterns(intent: str, config: dict) -> list[re.Pattern]:
    """Return compiled, case-insensitive regexes for *intent* (memoized)."""
    cached = _compiled_patterns.get(intent)
    if cached is None:
        raw = config.get(intent, {}).get("patterns", [])
        cached = [re.compile(p, re.IGNORECASE) for p in raw]
        _compiled_patterns[intent] = cached
    return cached
|
||||||
|
|
||||||
|
|
||||||
|
def classify(query: str, config: Optional[dict] = None) -> IntentResult:
    """Classify a query into WHO/WHEN/WHY/WHAT intent.

    Uses keyword matching and regex patterns. Designed for <5ms execution.

    Args:
        query: The search query string.
        config: Optional config dict. Loaded from config.json if None.

    Returns:
        IntentResult with intent type, confidence, and weight adjustments.
    """
    start = time.perf_counter()
    cfg = config or _load_config()

    # Degenerate input: fall back to WHAT with minimal confidence.
    if not query or not query.strip():
        elapsed = (time.perf_counter() - start) * 1000
        return IntentResult(intent="WHAT", confidence=0.1, classification_ms=elapsed,
                            matched_signals=["empty_query"])

    query_lower = query.lower().strip()
    scores: dict[str, float] = {"WHO": 0.0, "WHEN": 0.0, "WHY": 0.0, "WHAT": 0.0}
    signals: dict[str, list[str]] = {"WHO": [], "WHEN": [], "WHY": [], "WHAT": []}

    for intent in ("WHO", "WHEN", "WHY", "WHAT"):
        intent_cfg = cfg.get(intent, {})

        # Keyword matching (fast) — each hit contributes 1.0.
        keywords = intent_cfg.get("keywords", [])
        for kw in keywords:
            if kw.lower() in query_lower:
                scores[intent] += 1.0
                signals[intent].append(f"kw:{kw}")

        # Regex pattern matching
        for pattern in _get_patterns(intent, cfg):
            if pattern.search(query_lower):
                scores[intent] += 2.0  # patterns are more specific
                signals[intent].append(f"re:{pattern.pattern[:30]}")

    # Additional heuristics
    # Names (capitalized words not at start) suggest WHO — but exclude known non-person terms
    # German nouns are capitalized — so caps heuristic needs extra guard:
    # Only count as person-name if the word is NOT a common German/tech noun
    # and there's additional WHO signal (keyword/pattern already scored).
    # NOTE(review): this set is rebuilt on every call — consider hoisting to
    # module level if classify() ever shows up in profiles.
    _NON_PERSON_CAPS = {
        "sparkasse", "taskboard", "uptime", "kuma", "forgejo", "traefik", "nginx",
        "docker", "chromadb", "typedb", "nats", "kafka", "pinecone", "odoo",
        "mondo", "gate", "vainplex", "openclaw", "telegram", "discord", "matrix",
        "opus", "sonnet", "haiku", "claude", "gemini", "ollama", "mona", "vera",
        "stella", "viola", "hetzner", "proxmox", "debian", "linux", "python",
        "api", "cli", "dns", "ssl", "tls", "ssh", "http", "https", "sepa",
        "bafin", "iso", "iban", "postgres", "sqlite", "redis", "github",
        # Common German capitalized nouns that aren't people
        "aufgabe", "zugang", "status", "server", "konto", "liste", "daten",
        "problem", "fehler", "lösung", "version", "projekt", "system", "email",
        "rechnung", "zahlung", "vertrag", "termin", "meeting", "deploy",
        "update", "config", "setup", "deployment", "monitoring", "backup",
        "migration", "integration", "infrastruktur", "netzwerk", "sicherheit",
    }
    words = query.split()
    if len(words) >= 2:
        # Check ALL words for name-like capitalization (including first word)
        caps = [w for w in words if w[0].isupper() and len(w) > 2
                and not w.isupper() and w.lower() not in _NON_PERSON_CAPS]
        if len(caps) >= 2:
            # Two+ unknown capitalized words strongly suggest names (e.g. "Sebastian Baier")
            scores["WHO"] += 0.8 * len(caps)
            signals["WHO"].append(f"multi_caps:{','.join(caps[:3])}")
        elif caps:
            # Single unknown cap word — weak signal in German
            scores["WHO"] += 0.3
            signals["WHO"].append(f"caps:{caps[0]}")

    # Date-like tokens suggest WHEN
    if re.search(r'\b\d{4}[-/]\d{2}', query) or re.search(r'\b(?:jan|feb|mar|apr|may|jun|jul|aug|sep|oct|nov|dec|januar|februar|märz)\b', query_lower):
        scores["WHEN"] += 1.5
        signals["WHEN"].append("date_token")

    # Question words at start — strongest single signal (3.0).
    if query_lower.startswith(("warum ", "why ", "wieso ", "weshalb ")):
        scores["WHY"] += 3.0
        signals["WHY"].append("start_why")
    elif query_lower.startswith(("wer ", "who ")):
        scores["WHO"] += 3.0
        signals["WHO"].append("start_who")
    elif query_lower.startswith(("wann ", "when ")):
        scores["WHEN"] += 3.0
        signals["WHEN"].append("start_when")

    # Pick winner (ties resolve in WHO/WHEN/WHY/WHAT dict order).
    best_intent = max(scores, key=scores.get)
    total = sum(scores.values())
    confidence = scores[best_intent] / total if total > 0 else 0.25

    # If no strong signal, default to WHAT
    if scores[best_intent] < 0.5:
        best_intent = "WHAT"
        confidence = 0.3

    # Get weight adjustments
    adjustments = cfg.get(best_intent, {}).get("weight_adjustments", {})

    elapsed = (time.perf_counter() - start) * 1000
    return IntentResult(
        intent=best_intent,
        confidence=round(confidence, 3),
        weight_adjustments=adjustments,
        matched_signals=signals[best_intent],
        classification_ms=round(elapsed, 3),
    )
|
||||||
|
|
||||||
|
|
||||||
|
def reset_cache():
    """Clear the memoized config and compiled-pattern caches (test helper)."""
    global _config_cache, _compiled_patterns
    _compiled_patterns = {}
    _config_cache = None
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == "__main__":
    # Ad-hoc smoke run: classify CLI args, or a built-in bilingual sample set.
    import sys
    queries = sys.argv[1:] or [
        "Albert Hild contact",
        "when did we fix the gateway",
        "why did we choose NATS over Kafka",
        "Mondo Gate regulatory status",
        "wer ist Sebastian Baier",
        "wann wurde TypeDB eingerichtet",
        "warum ChromaDB statt Pinecone",
    ]
    for q in queries:
        r = classify(q)
        print(f"  [{r.intent}] ({r.confidence:.2f}, {r.classification_ms:.2f}ms) {q}")
        if r.matched_signals:
            print(f"      signals: {r.matched_signals}")
|
||||||
453
cortex/memory_hygiene.py
Normal file
453
cortex/memory_hygiene.py
Normal file
|
|
@ -0,0 +1,453 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""Memory Hygiene Tools — find duplicates, stale content, orphans, stats, archive."""
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import hashlib
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import re
|
||||||
|
import shutil
|
||||||
|
import sys
|
||||||
|
from collections import defaultdict
|
||||||
|
from datetime import datetime, timedelta
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
MEMORY_DIR = Path.home() / "clawd" / "memory"
ARCHIVE_DIR = MEMORY_DIR / "archive"
CONFIG_PATH = Path(__file__).parent / "config.json"

# Files that must never be archived or reported as orphans.
PERMANENT_FILES = {
    "MEMORY.md", "WORKING.md", "growth-log.md", "BOOT_CONTEXT.md",
    "README.md", "active-context.json", "network-map.md",
    "learned-context.md", "email-contacts.json",
}

# Daily note filenames: YYYY-MM-DD.md with an optional "-suffix".
DAILY_NOTE_RE = re.compile(r"^\d{4}-\d{2}-\d{2}(?:-.+)?\.md$")
# ISO dates in the 2000s, used both in filenames and body text.
DATE_RE = re.compile(r"\b(20\d{2})-(\d{2})-(\d{2})\b")
TODO_RE = re.compile(r"(?:TODO|FIXME|HACK|XXX)\b", re.IGNORECASE)
# Matches "status: in progress" / "in-progress" / "in_progress".
IN_PROGRESS_RE = re.compile(r"status:\s*in.?progress", re.IGNORECASE)
# Markdown links: [text](target)
LINK_RE = re.compile(r"\[([^\]]*)\]\(([^)]+)\)")
EMAIL_RE = re.compile(r"[\w.+-]+@[\w-]+\.[\w.-]+")
PHONE_RE = re.compile(r"(?:\+\d[\d\s\-]{7,}|\(\d+\)\s*[\d\s\-]{5,})")
|
||||||
|
|
||||||
|
|
||||||
|
def load_config():
    """Parse config.json if present; otherwise return an empty dict."""
    if not CONFIG_PATH.exists():
        return {}
    return json.loads(CONFIG_PATH.read_text())
|
||||||
|
|
||||||
|
|
||||||
|
def get_md_files(base: Path | None = None, recursive: bool = True) -> list[Path]:
|
||||||
|
if base is None:
|
||||||
|
base = MEMORY_DIR
|
||||||
|
if recursive:
|
||||||
|
return sorted(base.rglob("*.md"))
|
||||||
|
return sorted(base.glob("*.md"))
|
||||||
|
|
||||||
|
|
||||||
|
def _normalize(text: str) -> str:
    """Lower-case *text* and collapse every whitespace run to a single space."""
    collapsed = re.sub(r"\s+", " ", text.lower().strip())
    return collapsed


def _para_hash(para: str) -> str:
    """Stable fingerprint of a paragraph, insensitive to case and whitespace."""
    digest = hashlib.md5(_normalize(para).encode())
    return digest.hexdigest()
|
||||||
|
|
||||||
|
|
||||||
|
# --- Duplicates ---

def find_duplicates(min_length: int = 50, threshold: float = 0.8) -> list[dict]:
    """Find near-duplicate paragraphs across memory files.

    Args:
        min_length: Paragraphs shorter than this (after stripping) are ignored.
        threshold: NOTE(review): currently unused — matching is exact on the
            normalized hash, not fuzzy; kept for API compatibility.

    Returns:
        List of {"hash", "locations"} dicts; each location carries the file,
        1-based line number, and a 100-char preview.
    """
    # Collect paragraphs with their fingerprints
    para_index: dict[str, list[dict]] = defaultdict(list)

    for fp in get_md_files():
        try:
            text = fp.read_text(errors="replace")
        except Exception:
            continue
        paragraphs = re.split(r"\n\s*\n", text)
        line = 1  # running 1-based line number of the current paragraph
        for para in paragraphs:
            stripped = para.strip()
            if len(stripped) < min_length:
                line += para.count("\n") + 1
                continue
            h = _para_hash(stripped)
            para_index[h].append({
                "file": str(fp.relative_to(MEMORY_DIR)),
                "line": line,
                "preview": stripped[:100],
            })
            line += para.count("\n") + 1

    dupes = []
    for h, locations in para_index.items():
        if len(locations) > 1:
            # Deduplicate by file (same file same hash = skip)
            seen = set()
            unique = []
            for loc in locations:
                key = (loc["file"], loc["line"])
                if key not in seen:
                    seen.add(key)
                    unique.append(loc)
            if len(unique) > 1:
                dupes.append({"hash": h, "locations": unique})

    return dupes
|
||||||
|
|
||||||
|
|
||||||
|
# --- Staleness ---

def find_stale(now: datetime | None = None) -> list[dict]:
    """Find potentially stale content.

    Scans every markdown file for old dates, lingering TODOs, stuck
    "in_progress" markers, and aging contact info. Day thresholds come from
    the "staleness" section of config.json, with built-in defaults.

    Args:
        now: Reference time; defaults to datetime.now() (injectable for tests).

    Returns:
        List of {"file", "line", "reason", "severity"} dicts.
    """
    if now is None:
        now = datetime.now()
    cfg = load_config()
    stale_cfg = cfg.get("staleness", {})
    date_days = stale_cfg.get("date_days", 90)
    todo_days = stale_cfg.get("todo_days", 30)
    progress_days = stale_cfg.get("in_progress_days", 14)
    contact_days = stale_cfg.get("contact_days", 180)

    results = []

    for fp in get_md_files():
        try:
            text = fp.read_text(errors="replace")
            mtime = datetime.fromtimestamp(fp.stat().st_mtime)
        except Exception:
            continue

        rel = str(fp.relative_to(MEMORY_DIR))
        lines = text.split("\n")
        # File age drives the TODO/in_progress/contact checks below.
        file_age = (now - mtime).days

        for i, line in enumerate(lines, 1):
            # Old dates in non-historical context
            for m in DATE_RE.finditer(line):
                try:
                    d = datetime(int(m.group(1)), int(m.group(2)), int(m.group(3)))
                    age = (now - d).days
                    if age > date_days and "history" not in rel.lower() and "archive" not in rel.lower():
                        results.append({
                            "file": rel, "line": i,
                            "reason": f"Date {m.group(0)} is {age} days old",
                            "severity": "info",
                        })
                except ValueError:
                    pass  # impossible calendar date (e.g. 2024-13-40)

            # Old TODOs
            if TODO_RE.search(line) and file_age > todo_days:
                results.append({
                    "file": rel, "line": i,
                    "reason": f"TODO in file not modified for {file_age} days",
                    "severity": "warning",
                })

            # Stale in_progress
            if IN_PROGRESS_RE.search(line) and file_age > progress_days:
                results.append({
                    "file": rel, "line": i,
                    "reason": f"in_progress status, file not updated for {file_age} days",
                    "severity": "warning",
                })

            # Contact info staleness
            if (EMAIL_RE.search(line) or PHONE_RE.search(line)) and file_age > contact_days:
                results.append({
                    "file": rel, "line": i,
                    "reason": f"Contact info in file not updated for {file_age} days",
                    "severity": "info",
                })

    return results
|
||||||
|
|
||||||
|
|
||||||
|
# --- Orphans ---

def find_orphans() -> dict:
    """Find orphaned files and broken links.

    Returns:
        Dict with:
        - "orphaned_files": files never referenced by a markdown link
          (permanent files and archive/ are exempt)
        - "broken_links": markdown links whose local target does not exist
        - "empty_files": files smaller than 10 bytes
    """
    all_files = set()
    for fp in MEMORY_DIR.rglob("*"):
        if fp.is_file():
            all_files.add(str(fp.relative_to(MEMORY_DIR)))

    # Collect all references
    referenced = set()
    broken_links = []

    for fp in get_md_files():
        try:
            text = fp.read_text(errors="replace")
        except Exception:
            continue
        rel = str(fp.relative_to(MEMORY_DIR))

        for m in LINK_RE.finditer(text):
            target = m.group(2)
            if target.startswith("http://") or target.startswith("https://"):
                continue  # external links are not validated
            # Resolve relative to file's directory
            target_clean = target.split("#")[0].split("?")[0]  # strip anchor/query
            if not target_clean:
                continue  # pure in-page anchor like (#section)
            resolved = (fp.parent / target_clean).resolve()
            try:
                ref_rel = str(resolved.relative_to(MEMORY_DIR))
                referenced.add(ref_rel)
            except ValueError:
                pass  # link points outside MEMORY_DIR — not tracked here
            if not resolved.exists():
                broken_links.append({
                    "file": rel,
                    "link_text": m.group(1),
                    "target": target,
                })

    # Orphaned files (never referenced, not permanent)
    orphaned = []
    for f in sorted(all_files):
        name = Path(f).name
        if name in PERMANENT_FILES:
            continue
        if f.startswith("archive/"):
            continue
        if f not in referenced:
            orphaned.append(f)

    # Empty/near-empty files
    empty = []
    for fp in MEMORY_DIR.rglob("*"):
        if fp.is_file() and fp.stat().st_size < 10:
            empty.append(str(fp.relative_to(MEMORY_DIR)))

    return {
        "orphaned_files": orphaned,
        "broken_links": broken_links,
        "empty_files": sorted(empty),
    }
|
||||||
|
|
||||||
|
|
||||||
|
# --- Stats ---

def gather_stats() -> dict:
    """Gather statistics about the memory directory.

    Returns counts, total size, extension histogram, oldest/newest files,
    cumulative change counts (24h/7d/30d), and the top-10 markdown files by
    word count.
    """
    now = datetime.now()
    files = list(MEMORY_DIR.rglob("*"))
    file_list = [f for f in files if f.is_file()]

    total_size = sum(f.stat().st_size for f in file_list)
    by_ext: dict[str, int] = defaultdict(int)
    mtimes = []  # (relative path, mtime) pairs
    sizes = []  # (relative path, size in bytes) pairs
    word_counts = []
    changed_24h = changed_7d = changed_30d = 0

    for f in file_list:
        ext = f.suffix or "(none)"
        by_ext[ext] += 1
        st = f.stat()
        mt = datetime.fromtimestamp(st.st_mtime)
        mtimes.append((str(f.relative_to(MEMORY_DIR)), mt))
        sizes.append((str(f.relative_to(MEMORY_DIR)), st.st_size))
        age = (now - mt).days
        # Buckets are cumulative: a file changed today counts in all three.
        if age < 1:
            changed_24h += 1
        if age < 7:
            changed_7d += 1
        if age < 30:
            changed_30d += 1

        if f.suffix == ".md":
            try:
                words = len(f.read_text(errors="replace").split())
                word_counts.append((str(f.relative_to(MEMORY_DIR)), words))
            except Exception:
                pass  # unreadable file — skip its word count only

    mtimes.sort(key=lambda x: x[1])
    sizes.sort(key=lambda x: x[1], reverse=True)

    return {
        "total_files": len(file_list),
        "total_size_bytes": total_size,
        "total_size_human": f"{total_size / 1024:.1f} KB",
        "files_by_extension": dict(sorted(by_ext.items())),
        "oldest": {"file": mtimes[0][0], "date": mtimes[0][1].isoformat()} if mtimes else None,
        "newest": {"file": mtimes[-1][0], "date": mtimes[-1][1].isoformat()} if mtimes else None,
        "largest_files": [{"file": f, "bytes": s} for f, s in sizes[:10]],
        "changed_24h": changed_24h,
        "changed_7d": changed_7d,
        "changed_30d": changed_30d,
        "word_count_top10": sorted(word_counts, key=lambda x: x[1], reverse=True)[:10],
    }
|
||||||
|
|
||||||
|
|
||||||
|
# --- Archive ---

def archive_old_notes(older_than_days: int = 90, execute: bool = False, now: datetime | None = None) -> dict:
    """Archive old daily notes.

    Moves daily notes (YYYY-MM-DD*.md) older than *older_than_days* into
    archive/<year>/ and writes a JSON manifest. With execute=False (the
    default) this is a dry run that only reports what would move.

    Args:
        older_than_days: Age threshold, judged by the date in the filename.
        execute: Actually move files and write the manifest.
        now: Reference time; defaults to datetime.now() (injectable for tests).

    Returns:
        Manifest dict (archived_at, dry_run, files, count, and — after a real
        run — manifest_path).
    """
    if now is None:
        now = datetime.now()
    cutoff = now - timedelta(days=older_than_days)
    to_move = []

    for fp in MEMORY_DIR.glob("*.md"):
        name = fp.name
        if name in PERMANENT_FILES:
            continue
        if not DAILY_NOTE_RE.match(name):
            continue
        # Extract date from filename
        m = DATE_RE.match(name)
        if not m:
            continue
        try:
            file_date = datetime(int(m.group(1)), int(m.group(2)), int(m.group(3)))
        except ValueError:
            continue  # impossible date encoded in the filename
        if file_date < cutoff:
            year = m.group(1)
            dest_dir = ARCHIVE_DIR / year
            to_move.append({
                "source": str(fp.relative_to(MEMORY_DIR)),
                "dest": str(dest_dir.relative_to(MEMORY_DIR) / name),
                "date": file_date.isoformat(),
            })

    manifest = {
        "archived_at": now.isoformat(),
        "older_than_days": older_than_days,
        "dry_run": not execute,
        "files": to_move,
        "count": len(to_move),
    }

    if execute and to_move:
        for item in to_move:
            src = MEMORY_DIR / item["source"]
            dst = MEMORY_DIR / item["dest"]
            dst.parent.mkdir(parents=True, exist_ok=True)
            shutil.move(str(src), str(dst))
        # Write manifest
        manifest_path = ARCHIVE_DIR / f"manifest-{now.strftime('%Y%m%d-%H%M%S')}.json"
        manifest_path.parent.mkdir(parents=True, exist_ok=True)
        manifest_path.write_text(json.dumps(manifest, indent=2))
        manifest["manifest_path"] = str(manifest_path.relative_to(MEMORY_DIR))

    return manifest
|
||||||
|
|
||||||
|
|
||||||
|
# --- Report ---

def generate_report() -> tuple[str, bool]:
    """Generate combined markdown report. Returns (report_text, has_critical).

    has_critical is True when there are staleness warnings or broken links,
    letting the CLI exit non-zero.
    """
    lines = ["# Memory Hygiene Report", f"Generated: {datetime.now().isoformat()}", ""]
    has_critical = False

    # Stats
    stats = gather_stats()
    lines.append("## Stats")
    lines.append(f"- **Files:** {stats['total_files']} ({stats['total_size_human']})")
    lines.append(f"- **Changed 24h/7d/30d:** {stats['changed_24h']}/{stats['changed_7d']}/{stats['changed_30d']}")
    lines.append("")

    # Duplicates (top 10 groups only)
    dupes = find_duplicates()
    lines.append(f"## Duplicates ({len(dupes)} found)")
    for d in dupes[:10]:
        locs = ", ".join(f"`{l['file']}:{l['line']}`" for l in d["locations"])
        lines.append(f"- {locs}: {d['locations'][0]['preview'][:60]}...")
    lines.append("")

    # Staleness
    stale = find_stale()
    warnings = [s for s in stale if s["severity"] == "warning"]
    lines.append(f"## Stale Items ({len(stale)} total, {len(warnings)} warnings)")
    if warnings:
        has_critical = True
    for s in stale[:20]:
        icon = "⚠️" if s["severity"] == "warning" else "ℹ️"
        lines.append(f"- {icon} `{s['file']}:{s['line']}` — {s['reason']}")
    lines.append("")

    # Orphans
    orph = find_orphans()
    bl = orph["broken_links"]
    lines.append(f"## Orphans")
    lines.append(f"- **Orphaned files:** {len(orph['orphaned_files'])}")
    lines.append(f"- **Broken links:** {len(bl)}")
    lines.append(f"- **Empty files:** {len(orph['empty_files'])}")
    if bl:
        has_critical = True
        for b in bl[:10]:
            lines.append(f"  - `{b['file']}` → `{b['target']}` (broken)")
    lines.append("")

    # Archive candidates (dry-run preview)
    archive = archive_old_notes(older_than_days=90, execute=False)
    lines.append(f"## Archive Candidates ({archive['count']} files older than 90 days)")
    for f in archive["files"][:10]:
        lines.append(f"- `{f['source']}` → `{f['dest']}`")
    lines.append("")

    return "\n".join(lines), has_critical
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """CLI dispatcher for the hygiene subcommands."""
    parser = argparse.ArgumentParser(description="Memory Hygiene Tools")
    sub = parser.add_subparsers(dest="command")

    sub.add_parser("dupes", help="Find duplicate content")
    sub.add_parser("stale", help="Find stale content")
    sub.add_parser("orphans", help="Find orphaned files and broken links")
    sub.add_parser("stats", help="Memory statistics")

    arc = sub.add_parser("archive", help="Archive old daily notes")
    arc.add_argument("--older-than", default="90d", help="Age threshold (e.g., 90d)")
    arc.add_argument("--execute", action="store_true", help="Actually move files (default: dry-run)")

    sub.add_parser("report", help="Full hygiene report")

    args = parser.parse_args()

    if not args.command:
        parser.print_help()
        sys.exit(1)

    if args.command == "dupes":
        dupes = find_duplicates()
        print(json.dumps(dupes, indent=2, ensure_ascii=False))
        # Human-readable summary goes to stderr so stdout stays pure JSON.
        print(f"\n{len(dupes)} duplicate groups found.", file=sys.stderr)

    elif args.command == "stale":
        stale = find_stale()
        print(json.dumps(stale, indent=2, ensure_ascii=False))
        print(f"\n{len(stale)} stale items found.", file=sys.stderr)

    elif args.command == "orphans":
        orph = find_orphans()
        print(json.dumps(orph, indent=2, ensure_ascii=False))

    elif args.command == "stats":
        stats = gather_stats()
        print(json.dumps(stats, indent=2, ensure_ascii=False))

    elif args.command == "archive":
        # "--older-than 90d" -> 90; a plain "90" also works via rstrip.
        days = int(args.older_than.rstrip("d"))
        result = archive_old_notes(older_than_days=days, execute=args.execute)
        print(json.dumps(result, indent=2, ensure_ascii=False))
        if not args.execute and result["count"] > 0:
            print(f"\nDry run: {result['count']} files would be archived. Use --execute to proceed.", file=sys.stderr)

    elif args.command == "report":
        report, has_critical = generate_report()
        print(report)
        if has_critical:
            sys.exit(1)
|
||||||
|
|
||||||
|
|
||||||
|
# Script entry point (also exposed as a cortex CLI subcommand).
if __name__ == "__main__":
    main()
|
||||||
338
cortex/roadmap.py
Normal file
338
cortex/roadmap.py
Normal file
|
|
@ -0,0 +1,338 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""Roadmap Manager — track tasks, deadlines, dependencies, generate reports.
|
||||||
|
|
||||||
|
Usage:
|
||||||
|
python3 roadmap.py list [--status open] [--priority P0,P1] [--tag security]
|
||||||
|
python3 roadmap.py add "title" --priority P1 --deadline 2026-02-19 --tag infra
|
||||||
|
python3 roadmap.py update <id> --status done
|
||||||
|
python3 roadmap.py overdue
|
||||||
|
python3 roadmap.py upcoming [--days 7]
|
||||||
|
python3 roadmap.py report
|
||||||
|
python3 roadmap.py check-deps
|
||||||
|
"""
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import json
|
||||||
|
import sys
|
||||||
|
import uuid
|
||||||
|
from datetime import datetime, timedelta
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Any
|
||||||
|
|
||||||
|
ROADMAP_FILE = Path.home() / "clawd" / "memory" / "roadmap.json"
|
||||||
|
VALID_STATUSES = {"open", "in_progress", "blocked", "done"}
|
||||||
|
VALID_PRIORITIES = {"P0", "P1", "P2", "P3"}
|
||||||
|
|
||||||
|
|
||||||
|
def load_roadmap(path: Path | None = None) -> dict:
|
||||||
|
p = path or ROADMAP_FILE
|
||||||
|
if p.exists():
|
||||||
|
return json.loads(p.read_text())
|
||||||
|
return {"items": []}
|
||||||
|
|
||||||
|
|
||||||
|
def save_roadmap(data: dict, path: Path | None = None):
|
||||||
|
p = path or ROADMAP_FILE
|
||||||
|
p.parent.mkdir(parents=True, exist_ok=True)
|
||||||
|
p.write_text(json.dumps(data, indent=2, ensure_ascii=False))
|
||||||
|
|
||||||
|
|
||||||
|
def find_item(data: dict, item_id: str) -> dict | None:
|
||||||
|
for item in data["items"]:
|
||||||
|
if item["id"] == item_id or item["id"].startswith(item_id):
|
||||||
|
return item
|
||||||
|
return None
|
||||||
|
|
||||||
|
|
||||||
|
def now_iso() -> str:
    """Current local time as an ISO-8601 string, truncated to whole seconds."""
    stamp = datetime.now()
    return stamp.isoformat(timespec="seconds")
|
||||||
|
|
||||||
|
|
||||||
|
def parse_date(s: str | None) -> datetime | None:
|
||||||
|
if not s:
|
||||||
|
return None
|
||||||
|
for fmt in ["%Y-%m-%dT%H:%M:%S", "%Y-%m-%d %H:%M", "%Y-%m-%d"]:
|
||||||
|
try:
|
||||||
|
return datetime.strptime(s, fmt)
|
||||||
|
except ValueError:
|
||||||
|
continue
|
||||||
|
return None
|
||||||
|
|
||||||
|
|
||||||
|
# --- Commands ---
|
||||||
|
|
||||||
|
def cmd_list(args, data: dict):
    """Print items, optionally filtered by status/priority/tag.

    Output is sorted by priority (P0 first), then by deadline.
    """
    selected = data["items"]
    if args.status:
        wanted = set(args.status.split(","))
        selected = [it for it in selected if it["status"] in wanted]
    if args.priority:
        wanted = set(args.priority.split(","))
        selected = [it for it in selected if it["priority"] in wanted]
    if args.tag:
        wanted = set(args.tag.split(","))
        selected = [it for it in selected if wanted & set(it.get("tags", []))]

    if not selected:
        print("No items found.")
        return

    # P0 sorts first; missing deadlines sort last via the "9999" sentinel.
    prio_rank = {"P0": 0, "P1": 1, "P2": 2, "P3": 3}
    selected.sort(key=lambda it: (prio_rank.get(it["priority"], 9),
                                  it.get("deadline") or "9999"))

    icons = {"open": "⬚", "in_progress": "🔄", "blocked": "🚫", "done": "✅"}
    for it in selected:
        deadline = it.get("deadline", "")
        dl_str = f" ⏰ {deadline}" if deadline else ""
        status_icon = icons.get(it["status"], "?")
        tags = " ".join(f"#{t}" for t in it.get("tags", []))
        print(f" {status_icon} [{it['priority']}] {it['title']}{dl_str} {tags}")
        print(f" id: {it['id'][:8]}")
|
||||||
|
|
||||||
|
|
||||||
|
def cmd_add(args, data: dict):
    """Create a new roadmap item from CLI args, validate its priority, persist.

    Exits non-zero without saving when the priority is not one of
    VALID_PRIORITIES.
    """
    item = dict(
        id=str(uuid.uuid4()),
        title=args.title,
        status="open",
        priority=args.priority or "P2",
        deadline=args.deadline,
        depends_on=[],
        tags=args.tag.split(",") if args.tag else [],
        created=now_iso(),
        updated=now_iso(),
        notes=args.notes or "",
    )
    if item["priority"] not in VALID_PRIORITIES:
        print(f"Invalid priority: {item['priority']}")
        sys.exit(1)
    data["items"].append(item)
    save_roadmap(data)
    print(f"Added: {item['title']} (id: {item['id'][:8]})")
|
||||||
|
|
||||||
|
|
||||||
|
def cmd_update(args, data: dict):
    """Apply any provided field changes to an existing item and persist.

    Exits non-zero when the id is unknown or the new status is invalid.
    """
    item = find_item(data, args.id)
    if item is None:
        print(f"Item not found: {args.id}")
        sys.exit(1)
    if args.status:
        if args.status not in VALID_STATUSES:
            print(f"Invalid status: {args.status}")
            sys.exit(1)
        item["status"] = args.status
    # Scalar fields copied straight through when supplied.
    for field_name in ("priority", "deadline", "notes"):
        value = getattr(args, field_name)
        if value:
            item[field_name] = value
    if args.tag:
        item["tags"] = args.tag.split(",")
    item["updated"] = now_iso()
    save_roadmap(data)
    print(f"Updated: {item['title']}")
|
||||||
|
|
||||||
|
|
||||||
|
def cmd_overdue(args, data: dict):
    """List unfinished items whose deadline has passed.

    Exits non-zero when any overdue item is P0/P1 so cron jobs can alert.
    """
    current = datetime.now()
    late = []
    for item in data["items"]:
        if item["status"] == "done":
            continue
        due = parse_date(item.get("deadline"))
        if due is not None and due < current:
            late.append(item)

    if not late:
        print("No overdue items. ✅")
        return

    rank = {"P0": 0, "P1": 1, "P2": 2, "P3": 3}
    late.sort(key=lambda it: rank.get(it["priority"], 9))

    print(f"🚨 {len(late)} overdue item(s):")
    for it in late:
        print(f" [{it['priority']}] {it['title']} — due {it['deadline']}")

    if any(it["priority"] in ("P0", "P1") for it in late):
        sys.exit(1)
|
||||||
|
|
||||||
|
|
||||||
|
def cmd_upcoming(args, data: dict):
    """List unfinished items due within the next N days (default 7)."""
    current = datetime.now()
    window = args.days or 7
    horizon = current + timedelta(days=window)
    due_soon = []
    for item in data["items"]:
        if item["status"] == "done":
            continue
        due = parse_date(item.get("deadline"))
        if due is not None and current <= due <= horizon:
            due_soon.append(item)

    if not due_soon:
        print(f"No items due in the next {window} days.")
        return

    due_soon.sort(key=lambda it: it.get("deadline", ""))
    print(f"📅 {len(due_soon)} item(s) due in the next {window} days:")
    for it in due_soon:
        print(f" [{it['priority']}] {it['title']} — due {it['deadline']}")
|
||||||
|
|
||||||
|
|
||||||
|
def cmd_report(args, data: dict):
    """Print a Markdown status report.

    Sections: summary counts by status, overdue items, items due within
    7 days, stale in_progress items (>7 days without update), and the
    current in_progress list. Read-only: nothing is persisted.
    """
    now = datetime.now()
    lines = [
        "# Roadmap Status Report",
        f"*Generated: {now.strftime('%Y-%m-%d %H:%M')}*",
        "",
    ]

    # Summary: bucket items by status.
    by_status = {}
    for item in data["items"]:
        by_status.setdefault(item["status"], []).append(item)

    lines.append("## Summary")
    for status in ["open", "in_progress", "blocked", "done"]:
        count = len(by_status.get(status, []))
        icon = {"open": "⬚", "in_progress": "🔄", "blocked": "🚫", "done": "✅"}[status]
        lines.append(f"- {icon} {status}: {count}")
    lines.append("")

    # Parse each unfinished item's deadline exactly once (the original
    # called parse_date twice per item in both comprehensions below).
    pending = [(i, parse_date(i.get("deadline")))
               for i in data["items"] if i["status"] != "done"]

    # Overdue
    overdue = [i for i, dl in pending if dl and dl < now]
    if overdue:
        lines.append("## 🚨 Overdue")
        for i in overdue:
            lines.append(f"- **[{i['priority']}]** {i['title']} — due {i['deadline']}")
        lines.append("")

    # Upcoming (7 days)
    cutoff = now + timedelta(days=7)
    upcoming = [i for i, dl in pending if dl and now <= dl <= cutoff]
    if upcoming:
        lines.append("## 📅 Upcoming (7 days)")
        for i in sorted(upcoming, key=lambda x: x["deadline"]):
            lines.append(f"- **[{i['priority']}]** {i['title']} — due {i['deadline']}")
        lines.append("")

    # Stale items (in_progress > 7 days without update)
    stale = []
    for item in data["items"]:
        if item["status"] == "in_progress":
            updated = parse_date(item.get("updated"))
            if updated and (now - updated).days > 7:
                stale.append(item)
    if stale:
        lines.append("## ⏳ Stale (in_progress >7 days)")
        for i in stale:
            lines.append(f"- **[{i['priority']}]** {i['title']} — last updated {i['updated']}")
        lines.append("")

    # Active work
    active = by_status.get("in_progress", [])
    if active:
        lines.append("## 🔄 In Progress")
        for i in active:
            dl = f" (due {i['deadline']})" if i.get("deadline") else ""
            lines.append(f"- **[{i['priority']}]** {i['title']}{dl}")
        lines.append("")

    print("\n".join(lines))
|
||||||
|
|
||||||
|
|
||||||
|
def cmd_check_deps(args, data: dict):
    """Report dependencies of unfinished items that are missing or not done."""
    by_id = {it["id"]: it for it in data["items"]}
    problems = []
    for it in data["items"]:
        if it["status"] == "done":
            continue
        for dep_id in it.get("depends_on", []):
            dep = by_id.get(dep_id)
            if dep is None:
                problems.append((it, dep_id, "missing"))
            elif dep["status"] != "done":
                problems.append((it, dep_id, dep["status"]))

    if not problems:
        print("No dependency issues. ✅")
        return

    print(f"⚠️ {len(problems)} dependency issue(s):")
    for it, dep_id, status in problems:
        if status == "missing":
            print(f" [{it['priority']}] {it['title']} → depends on unknown {dep_id[:8]}")
        else:
            dep = by_id[dep_id]
            print(f" [{it['priority']}] {it['title']} → blocked by '{dep['title']}' ({status})")
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """CLI entry point: build the argparse subcommand tree and dispatch.

    Loads the roadmap once, then hands (args, data) to the matching
    cmd_* handler; handlers persist changes themselves.
    """
    parser = argparse.ArgumentParser(description="Roadmap Manager")
    sub = parser.add_subparsers(dest="command")

    # list: filters are comma-separated strings, parsed by cmd_list
    p_list = sub.add_parser("list")
    p_list.add_argument("--status", type=str)
    p_list.add_argument("--priority", type=str)
    p_list.add_argument("--tag", type=str)

    # add
    p_add = sub.add_parser("add")
    p_add.add_argument("title", type=str)
    p_add.add_argument("--priority", type=str, default="P2")
    p_add.add_argument("--deadline", type=str)
    p_add.add_argument("--tag", type=str)
    p_add.add_argument("--notes", type=str)

    # update: id may be a prefix (see find_item)
    p_upd = sub.add_parser("update")
    p_upd.add_argument("id", type=str)
    p_upd.add_argument("--status", type=str)
    p_upd.add_argument("--priority", type=str)
    p_upd.add_argument("--deadline", type=str)
    p_upd.add_argument("--tag", type=str)
    p_upd.add_argument("--notes", type=str)

    # overdue
    sub.add_parser("overdue")

    # upcoming
    p_up = sub.add_parser("upcoming")
    p_up.add_argument("--days", type=int, default=7)

    # report
    sub.add_parser("report")

    # check-deps
    sub.add_parser("check-deps")

    args = parser.parse_args()
    if not args.command:
        # No subcommand given: show usage and exit non-zero.
        parser.print_help()
        sys.exit(1)

    data = load_roadmap()

    # Dispatch table: subcommand name -> handler(args, data).
    cmd_map = {
        "list": cmd_list,
        "add": cmd_add,
        "update": cmd_update,
        "overdue": cmd_overdue,
        "upcoming": cmd_upcoming,
        "report": cmd_report,
        "check-deps": cmd_check_deps,
    }
    cmd_map[args.command](args, data)
|
||||||
|
|
||||||
|
|
||||||
|
# Allow running this module directly as a script.
if __name__ == "__main__":
    main()
|
||||||
214
cortex/triage.py
Normal file
214
cortex/triage.py
Normal file
|
|
@ -0,0 +1,214 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""Priority Triage System — score and rank tasks by urgency, importance, effort, readiness."""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import re
|
||||||
|
import sys
|
||||||
|
from dataclasses import dataclass, asdict
|
||||||
|
|
||||||
|
# --- Keyword banks (DE + EN) ---
|
||||||
|
|
||||||
|
URGENCY_KEYWORDS = {
|
||||||
|
# word -> weight (0.0-1.0 contribution)
|
||||||
|
"jetzt": 0.9, "sofort": 0.9, "asap": 0.8, "urgent": 0.8, "dringend": 0.8,
|
||||||
|
"notfall": 1.0, "emergency": 1.0, "down": 0.9, "broken": 0.7, "kaputt": 0.7,
|
||||||
|
"fehler": 0.6, "error": 0.6, "critical": 0.9, "alarm": 0.8, "outage": 0.9,
|
||||||
|
"crash": 0.8, "timeout": 0.5, "offline": 0.7, "immediately": 0.8,
|
||||||
|
"deadline": 0.7, "frist": 0.7, "heute": 0.5, "today": 0.5,
|
||||||
|
"blocker": 0.8, "p0": 1.0, "p1": 0.8, "sev1": 0.9, "sev2": 0.7,
|
||||||
|
"morgen": 0.6, "tomorrow": 0.6, "nächste woche": 0.5, "next week": 0.5,
|
||||||
|
"fällig": 0.7, "overdue": 0.8, "überfällig": 0.8,
|
||||||
|
"beschwer": 0.6, "complaint": 0.6, "problem": 0.4,
|
||||||
|
}
|
||||||
|
|
||||||
|
IMPORTANCE_KEYWORDS = {
|
||||||
|
"production": 0.9, "prod": 0.9, "security": 0.9, "sicherheit": 0.9,
|
||||||
|
"geld": 0.8, "money": 0.8, "finance": 0.8, "finanzen": 0.8,
|
||||||
|
"kunde": 0.7, "customer": 0.7, "kunden": 0.7, "bafin": 1.0,
|
||||||
|
"regulatory": 0.9, "compliance": 0.9, "gateway": 0.7, "dns": 0.7,
|
||||||
|
"albert": 0.6, "chef": 0.6, "boss": 0.6,
|
||||||
|
"database": 0.6, "datenbank": 0.6, "backup": 0.7,
|
||||||
|
"ssl": 0.7, "certificate": 0.7, "zertifikat": 0.7,
|
||||||
|
"auth": 0.7, "login": 0.6, "password": 0.7, "passwort": 0.7,
|
||||||
|
"data loss": 1.0, "datenverlust": 1.0,
|
||||||
|
# Security keywords
|
||||||
|
"breach": 0.95, "compromised": 0.9, "hacked": 0.95, "vulnerability": 0.8,
|
||||||
|
"exploit": 0.9, "unauthorized": 0.85, "ssh keys": 0.85,
|
||||||
|
# Compliance keywords
|
||||||
|
"audit": 0.8, "iso": 0.7, "compliance": 0.9, "regulatory": 0.9,
|
||||||
|
"certification": 0.7, "zertifizierung": 0.7,
|
||||||
|
# Business keywords
|
||||||
|
"revenue": 0.8, "umsatz": 0.8, "zahlung": 0.7, "payment": 0.7,
|
||||||
|
"beschwer": 0.7,
|
||||||
|
}
|
||||||
|
|
||||||
|
LOW_EFFORT_KEYWORDS = {
|
||||||
|
"quick": 0.8, "schnell": 0.8, "einfach": 0.8, "simple": 0.8,
|
||||||
|
"typo": 0.9, "tippfehler": 0.9, "config": 0.6, "toggle": 0.9,
|
||||||
|
"restart": 0.7, "neustart": 0.7, "one-liner": 0.9, "fix": 0.5,
|
||||||
|
}
|
||||||
|
|
||||||
|
HIGH_EFFORT_KEYWORDS = {
|
||||||
|
"komplett": 0.8, "refactor": 0.9, "migration": 0.9, "redesign": 0.9,
|
||||||
|
"rewrite": 0.9, "umschreiben": 0.9, "architecture": 0.8, "architektur": 0.8,
|
||||||
|
"von grund auf": 0.9, "from scratch": 0.9, "multi-step": 0.6,
|
||||||
|
"complex": 0.7, "komplex": 0.7, "projekt": 0.5, "project": 0.5,
|
||||||
|
}
|
||||||
|
|
||||||
|
NOT_READY_KEYWORDS = {
|
||||||
|
"blocked": 0.9, "blockiert": 0.9, "warte auf": 0.8, "waiting for": 0.8,
|
||||||
|
"depends on": 0.8, "abhängig von": 0.8, "brauche erst": 0.8, "need first": 0.8,
|
||||||
|
"pending": 0.6, "ausstehend": 0.6, "not yet": 0.5, "noch nicht": 0.5,
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
def _scan_keywords(text: str, keywords: dict[str, float]) -> float:
|
||||||
|
"""Scan text for keywords, return max-based score with diminishing boost."""
|
||||||
|
t = text.lower()
|
||||||
|
hits = []
|
||||||
|
for kw, weight in keywords.items():
|
||||||
|
if kw in t:
|
||||||
|
hits.append(weight)
|
||||||
|
if not hits:
|
||||||
|
return 0.0
|
||||||
|
hits.sort(reverse=True)
|
||||||
|
score = hits[0]
|
||||||
|
for h in hits[1:]:
|
||||||
|
score = min(1.0, score + h * 0.15) # diminishing returns
|
||||||
|
return round(min(1.0, score), 3)
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
class TriageScore:
    """Result of scoring one task: four component signals plus combined priority."""

    text: str  # the raw task/message that was scored
    urgency: float  # 0.0-1.0, keyword-derived
    importance: float  # 0.0-1.0, keyword-derived
    effort: float  # 0=trivial, 1=massive
    readiness: float  # 1=ready, 0=blocked
    priority: float  # weighted combination of the four signals

    def to_dict(self) -> dict:
        """Return the score as a plain dict with priority rounded to 3 decimals."""
        d = asdict(self)
        d["priority"] = round(d["priority"], 3)
        return d
|
||||||
|
|
||||||
|
|
||||||
|
def score_task(text: str) -> TriageScore:
    """Score a single task/message."""
    urgency = _scan_keywords(text, URGENCY_KEYWORDS)
    importance = _scan_keywords(text, IMPORTANCE_KEYWORDS)

    # Effort starts at 0.5 (medium) and is pushed down/up by whichever
    # effort signal (low vs high) is stronger; clamped to [0.1, 1.0].
    low_signal = _scan_keywords(text, LOW_EFFORT_KEYWORDS)
    high_signal = _scan_keywords(text, HIGH_EFFORT_KEYWORDS)
    effort = 0.5
    if low_signal > high_signal:
        effort = max(0.1, 0.5 - low_signal * 0.4)
    elif high_signal > low_signal:
        effort = min(1.0, 0.5 + high_signal * 0.4)

    blocked = _scan_keywords(text, NOT_READY_KEYWORDS)
    readiness = round(1.0 - blocked, 3)

    # Low effort should raise priority, so invert effort before weighting.
    inverted_effort = round(1.0 - effort, 3)
    weighted = (urgency * 0.4) + (importance * 0.35) + (inverted_effort * 0.15) + (readiness * 0.1)

    return TriageScore(
        text=text,
        urgency=round(urgency, 3),
        importance=round(importance, 3),
        effort=round(effort, 3),
        readiness=readiness,
        priority=round(weighted, 3),
    )
|
||||||
|
|
||||||
|
|
||||||
|
def rank_tasks(texts: list[str]) -> list[TriageScore]:
    """Score and rank multiple tasks by priority (highest first)."""
    return sorted((score_task(t) for t in texts),
                  key=lambda s: s.priority, reverse=True)
|
||||||
|
|
||||||
|
|
||||||
|
def analyze_message(text: str) -> dict:
    """Deep analysis of a message — return signals found."""
    score = score_task(text)
    lowered = text.lower()

    # Collect every keyword that actually occurs, bucketed by signal type.
    # The suffix annotates effort direction / readiness blockers.
    signals = {"urgency": [], "importance": [], "effort": [], "readiness": []}
    scan_plan = [
        (URGENCY_KEYWORDS, "urgency", ""),
        (IMPORTANCE_KEYWORDS, "importance", ""),
        (LOW_EFFORT_KEYWORDS, "effort", " (low)"),
        (HIGH_EFFORT_KEYWORDS, "effort", " (high)"),
        (NOT_READY_KEYWORDS, "readiness", " (blocker)"),
    ]
    for bank, bucket, suffix in scan_plan:
        for kw in bank:
            if kw in lowered:
                signals[bucket].append(kw + suffix)

    # Map the combined priority onto a coarse action bucket.
    thresholds = [
        (0.8, "🔴 CRITICAL — handle immediately"),
        (0.6, "🟠 HIGH — handle soon"),
        (0.4, "🟡 MEDIUM — schedule"),
        (0.2, "🔵 LOW — backlog"),
    ]
    classification = "⚪ MINIMAL — ignore"
    for floor, label in thresholds:
        if score.priority >= floor:
            classification = label
            break

    return {
        "score": score.to_dict(),
        "signals": signals,
        "classification": classification,
    }
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """CLI entry point: score | rank | analyze, operating on argv text.

    Prints JSON to stdout; exits non-zero on missing arguments or an
    unknown command.
    """
    if len(sys.argv) < 2:
        print("Usage: python3 triage.py <score|rank|analyze> <text...>")
        sys.exit(1)

    cmd = sys.argv[1]

    if cmd == "score":
        # Score one task description.
        if len(sys.argv) < 3:
            print("Usage: python3 triage.py score \"task description\"")
            sys.exit(1)
        result = score_task(sys.argv[2])
        print(json.dumps(result.to_dict(), indent=2, ensure_ascii=False))

    elif cmd == "rank":
        # Score several tasks and emit them highest-priority first.
        if len(sys.argv) < 3:
            print("Usage: python3 triage.py rank \"task1\" \"task2\" ...")
            sys.exit(1)
        tasks = sys.argv[2:]
        ranked = rank_tasks(tasks)
        output = [{"rank": i + 1, **s.to_dict()} for i, s in enumerate(ranked)]
        print(json.dumps(output, indent=2, ensure_ascii=False))

    elif cmd == "analyze":
        # Full signal breakdown plus classification for one message.
        if len(sys.argv) < 3:
            print("Usage: python3 triage.py analyze \"message\"")
            sys.exit(1)
        result = analyze_message(sys.argv[2])
        print(json.dumps(result, indent=2, ensure_ascii=False))

    else:
        print(f"Unknown command: {cmd}")
        sys.exit(1)
|
||||||
|
|
||||||
|
|
||||||
|
# Allow running this module directly as a script.
if __name__ == "__main__":
    main()
|
||||||
363
cortex/validate_output.py
Normal file
363
cortex/validate_output.py
Normal file
|
|
@ -0,0 +1,363 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""Sub-Agent Output Validator — post-completion validation of sub-agent work.
|
||||||
|
|
||||||
|
Validates that spawned tasks actually produced what was requested:
|
||||||
|
files created, non-empty, syntax-valid, tests passed, errors addressed.
|
||||||
|
|
||||||
|
Usage:
|
||||||
|
python3 validate_output.py --transcript /path/to/session.jsonl --task "description"
|
||||||
|
python3 validate_output.py --session-key "agent:main:subagent:xxx"
|
||||||
|
"""
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import ast
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import re
|
||||||
|
import subprocess
|
||||||
|
import sys
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Any
|
||||||
|
|
||||||
|
DEFAULT_SESSIONS_DIR = Path(os.path.expanduser("~/.openclaw/agents/main/sessions"))
|
||||||
|
|
||||||
|
|
||||||
|
def parse_jsonl(path: Path) -> list[dict]:
    """Parse a JSONL file into a list of dicts.

    Blank lines and lines that are not valid JSON are silently skipped —
    transcripts may contain partial/corrupt trailing lines.
    """
    entries = []
    # JSONL is defined as UTF-8; don't depend on the platform locale
    # (the original used the default encoding, which breaks e.g. on Windows).
    with open(path, encoding="utf-8") as f:
        for line in f:
            line = line.strip()
            if not line:
                continue
            try:
                entries.append(json.loads(line))
            except json.JSONDecodeError:
                pass
    return entries
|
||||||
|
|
||||||
|
|
||||||
|
def find_session_by_key(session_key: str) -> Path | None:
    """Find a session JSONL by its session key (searches session headers)."""
    sessions_dir = DEFAULT_SESSIONS_DIR
    if not sessions_dir.exists():
        return None
    # session key format: agent:main:subagent:UUID — extract UUID
    uuid_part = session_key.rsplit(":", 1)[-1]
    direct = sessions_dir / f"{uuid_part}.jsonl"
    if direct.exists():
        return direct
    # Fall back to scanning every session file's header line for a match.
    for candidate in sessions_dir.glob("*.jsonl"):
        try:
            with open(candidate) as fh:
                head = fh.readline().strip()
            if not head:
                continue
            header = json.loads(head)
            if header.get("id") == uuid_part or session_key in json.dumps(header):
                return candidate
        except (json.JSONDecodeError, OSError):
            pass
    return None
|
||||||
|
|
||||||
|
|
||||||
|
def extract_mentioned_files(task: str) -> list[str]:
|
||||||
|
"""Extract file paths/names mentioned in a task description."""
|
||||||
|
patterns = [
|
||||||
|
r'`([^`]+\.\w{1,5})`', # `filename.ext`
|
||||||
|
r'(\S+\.(?:py|ts|js|json|md|yaml|yml|toml|sh))', # bare filenames
|
||||||
|
]
|
||||||
|
files = set()
|
||||||
|
for pat in patterns:
|
||||||
|
for m in re.finditer(pat, task):
|
||||||
|
f = m.group(1)
|
||||||
|
if "/" not in f and not f.startswith("."):
|
||||||
|
files.add(f)
|
||||||
|
elif f.startswith("~/") or f.startswith("./") or f.startswith("/"):
|
||||||
|
files.add(f)
|
||||||
|
return list(files)
|
||||||
|
|
||||||
|
|
||||||
|
def _decode_tool_args(raw):
    """Normalize a toolCall 'arguments' field: JSON-decode strings, {} on failure."""
    if isinstance(raw, str):
        try:
            return json.loads(raw)
        except json.JSONDecodeError:
            return {}
    return raw


def extract_created_files_from_transcript(entries: list[dict]) -> list[str]:
    """Extract files that were written/created during the session.

    Sources: write/edit tool calls (file_path/path argument) and exec
    commands containing shell redirection or `tee`. The original iterated
    each entry's content twice with duplicated argument decoding; this is
    a single pass with identical results.
    """
    files = set()
    for entry in entries:
        content = entry.get("message", {}).get("content", [])
        if not isinstance(content, list):
            continue
        for item in content:
            if not isinstance(item, dict) or item.get("type") != "toolCall":
                continue
            name = item.get("name", "")
            args = _decode_tool_args(item.get("arguments", {}))
            if name in ("write", "Write", "edit", "Edit"):
                fp = args.get("file_path") or args.get("path", "")
                if fp:
                    files.add(fp)
            elif name in ("exec", "Exec"):
                cmd = args.get("command", "")
                # Detect files produced via redirection or tee.
                for m in re.finditer(r'(?:tee|>)\s+(\S+)', cmd):
                    files.add(m.group(1))
    return list(files)
|
||||||
|
|
||||||
|
|
||||||
|
def extract_transcript_errors(entries: list[dict]) -> list[str]:
    """Extract unaddressed error messages from transcript."""
    errors = []
    for entry in entries:
        msg = entry.get("message", {})
        if not msg.get("isError"):
            continue
        content = msg.get("content", [])
        if isinstance(content, str):
            # Plain-string error payload; truncate to keep reports short.
            errors.append(content[:200])
        elif isinstance(content, list):
            for item in content:
                if isinstance(item, dict):
                    errors.append(item.get("text", "unknown error")[:200])
    return errors
|
||||||
|
|
||||||
|
|
||||||
|
def check_test_results(entries: list[dict]) -> dict:
    """Scan transcript for test execution results."""
    outcome = {"tests_found": False, "tests_passed": None, "details": ""}
    for entry in entries:
        content = entry.get("message", {}).get("content", [])
        if not isinstance(content, list):
            continue
        for item in content:
            text = item.get("text", "") if isinstance(item, dict) else ""
            if not text:
                continue
            # pytest summary line, e.g. "3 passed" / "3 passed, 1 failed"
            if re.search(r'\d+ passed', text):
                outcome["tests_found"] = True
                outcome["tests_passed"] = "failed" not in text.lower()
                outcome["details"] = text[:200]
            # unittest success marker ("OK" at end of output)
            if re.search(r'OK\s*$', text.strip()):
                outcome["tests_found"] = True
                outcome["tests_passed"] = True
            # explicit failure marker takes precedence
            if re.search(r'FAILED', text):
                outcome["tests_found"] = True
                outcome["tests_passed"] = False
                outcome["details"] = text[:200]
    return outcome
|
||||||
|
|
||||||
|
|
||||||
|
class ValidationReport:
    """Accumulates named pass/fail/warn checks and renders them as JSON or text."""

    def __init__(self):
        self.checks: list[dict] = []
        self.passed = 0
        self.failed = 0
        self.warnings = 0

    def add(self, name: str, status: str, detail: str = ""):
        """Record one check result; status is 'pass', 'fail' or 'warn'."""
        self.checks.append({"name": name, "status": status, "detail": detail})
        if status == "pass":
            self.passed += 1
        elif status == "fail":
            self.failed += 1
        else:
            self.warnings += 1

    @property
    def ok(self) -> bool:
        """True when no check failed (warnings don't count against ok)."""
        return not self.failed

    def to_json(self) -> dict:
        """Summary counts plus the full check list, suitable for json.dumps."""
        return {
            "passed": self.passed,
            "failed": self.failed,
            "warnings": self.warnings,
            "ok": self.ok,
            "checks": self.checks,
        }

    def to_human(self) -> str:
        """Multi-line human-readable rendering with status icons."""
        verdict = "✅ PASS" if self.ok else "❌ FAIL"
        out = [
            f"Validation Report: {verdict}",
            f" {self.passed} passed, {self.failed} failed, {self.warnings} warnings",
            "",
        ]
        icons = {"pass": "✅", "fail": "❌", "warn": "⚠️"}
        for check in self.checks:
            row = f" {icons.get(check['status'], '?')} {check['name']}"
            if check["detail"]:
                row += f" — {check['detail']}"
            out.append(row)
        return "\n".join(out)
|
||||||
|
|
||||||
|
|
||||||
|
def validate_file_exists(path: str) -> tuple[bool, str]:
    """Check that *path* exists and is non-empty.

    Returns (ok, detail). ~ is expanded so transcript paths like
    ~/staging/x.py resolve.
    """
    p = Path(os.path.expanduser(path))
    if not p.exists():
        return False, f"File not found: {path}"
    # Stat once — the original called p.stat() twice (redundant syscall
    # plus a race window between the two calls).
    size = p.stat().st_size
    if size == 0:
        return False, f"File is empty: {path}"
    return True, f"Exists, {size} bytes"
|
||||||
|
|
||||||
|
|
||||||
|
def validate_python_syntax(path: str) -> tuple[bool, str]:
    """Check Python file for syntax errors."""
    target = Path(os.path.expanduser(path))
    if not target.exists():
        return False, "File not found"
    try:
        # compile() performs a full parse without executing the module.
        compile(target.read_text(), str(target), "exec")
    except SyntaxError as e:
        return False, f"Syntax error: {e}"
    return True, "Syntax OK"
|
||||||
|
|
||||||
|
|
||||||
|
def validate_typescript_structure(path: str) -> tuple[bool, str]:
    """Basic TypeScript validation — check for exports, no excessive 'any'."""
    target = Path(os.path.expanduser(path))
    if not target.exists():
        return False, "File not found"
    source = target.read_text()
    issues = []
    any_uses = len(re.findall(r'\bany\b', source))
    if any_uses > 10:
        issues.append(f"Excessive 'any' usage ({any_uses} occurrences)")
    if re.search(r'\bexport\b', source) is None:
        issues.append("No exports found")
    return (False, "; ".join(issues)) if issues else (True, "Structure OK")
|
||||||
|
|
||||||
|
|
||||||
|
def validate_staging_location(files: list[str], staging_dir: str = "staging") -> list[tuple[str, bool, str]]:
    """Check if files are in the staging directory."""
    checked = []
    for original in files:
        # Substring match on the expanded path, mirroring the caller's checks.
        hit = staging_dir in os.path.expanduser(original)
        note = "In staging" if hit else "Not in staging dir"
        checked.append((original, hit, note))
    return checked
|
||||||
|
|
||||||
|
|
||||||
|
def run_validation(transcript_path: Path, task: str) -> ValidationReport:
    """Main validation logic.

    Cross-checks the sub-agent transcript against the original task:
    transcript readability, existence of mentioned/created files,
    language-specific syntax checks, staging location, test outcomes,
    and leftover transcript errors. Each check appends one entry to the
    returned ValidationReport; entry order is fixed and part of the output.
    """
    report = ValidationReport()
    entries = parse_jsonl(transcript_path)

    # An empty/unreadable transcript short-circuits every other check.
    if not entries:
        report.add("Transcript readable", "fail", "No entries found")
        return report
    report.add("Transcript readable", "pass", f"{len(entries)} entries")

    # Check mentioned files exist
    mentioned = extract_mentioned_files(task)
    created = extract_created_files_from_transcript(entries)
    # De-duplicate; set() means the per-file check order is unspecified.
    all_files = list(set(mentioned + created))

    for f in all_files:
        exists, detail = validate_file_exists(f)
        report.add(f"File exists: {Path(f).name}", "pass" if exists else "fail", detail)

    # Syntax check Python files
    for f in all_files:
        if f.endswith(".py"):
            ok, detail = validate_python_syntax(f)
            report.add(f"Python syntax: {Path(f).name}", "pass" if ok else "fail", detail)

    # Syntax check TypeScript files
    for f in all_files:
        if f.endswith(".ts") or f.endswith(".tsx"):
            ok, detail = validate_typescript_structure(f)
            report.add(f"TS structure: {Path(f).name}", "pass" if ok else "fail", detail)

    # Check staging location if mentioned in task
    if "staging" in task.lower():
        for f in all_files:
            expanded = os.path.expanduser(f)
            # NOTE(review): substring match — a path like "restaging/x.py"
            # would also count as staged; confirm whether component-level
            # matching (Path(...).parts) is intended here.
            in_staging = "staging" in expanded
            report.add(f"In staging: {Path(f).name}",
                       "pass" if in_staging else "warn",
                       "In staging dir" if in_staging else "Not in staging dir")

    # Check test results if tests were requested
    if any(w in task.lower() for w in ["test", "tests", "pytest", "unittest"]):
        test_results = check_test_results(entries)
        if test_results["tests_found"]:
            if test_results["tests_passed"]:
                report.add("Tests passed", "pass", test_results["details"][:100])
            else:
                report.add("Tests passed", "fail", test_results["details"][:100])
        else:
            # Tests were requested but the transcript shows no test run.
            report.add("Tests executed", "warn", "No test output found in transcript")

    # Check for unaddressed errors
    errors = extract_transcript_errors(entries)
    if errors:
        report.add("Unaddressed errors", "warn", f"{len(errors)} error(s) in transcript")
    else:
        report.add("No unaddressed errors", "pass")

    return report
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """CLI entry point: resolve the transcript, run validation, report, exit."""
    parser = argparse.ArgumentParser(description="Sub-Agent Output Validator")
    parser.add_argument("--transcript", help="Path to session JSONL file")
    parser.add_argument("--session-key", help="Session key (e.g. agent:main:subagent:xxx)")
    parser.add_argument("--task", default="", help="Original task description")
    parser.add_argument("--json", action="store_true", help="Output JSON only")
    args = parser.parse_args()

    if not args.transcript and not args.session_key:
        parser.error("Either --transcript or --session-key is required")

    # Resolve the transcript path from whichever selector was supplied;
    # --session-key takes precedence when both are given.
    if args.session_key:
        path = find_session_by_key(args.session_key)
        if not path:
            print(f"Session not found: {args.session_key}", file=sys.stderr)
            sys.exit(1)
    else:
        path = Path(args.transcript)
        if not path.exists():
            print(f"File not found: {args.transcript}", file=sys.stderr)
            sys.exit(1)

    report = run_validation(path, args.task)

    payload = json.dumps(report.to_json(), indent=2)
    if args.json:
        print(payload)
    else:
        # Human-readable summary first, then the machine-readable payload.
        print(report.to_human())
        print()
        print(payload)

    # Exit code mirrors the overall verdict for shell/CI consumers.
    sys.exit(0 if report.ok else 1)
|
||||||
23
pyproject.toml
Normal file
23
pyproject.toml
Normal file
|
|
@ -0,0 +1,23 @@
|
||||||
|
[build-system]
|
||||||
|
requires = ["setuptools>=68.0", "wheel"]
|
||||||
|
build-backend = "setuptools.build_meta"
|
||||||
|
|
||||||
|
[project]
|
||||||
|
name = "cortex"
|
||||||
|
version = "0.1.0"
|
||||||
|
description = "Intelligence layer for OpenClaw — triage, health, feedback, memory hygiene, roadmap, validation"
|
||||||
|
readme = "README.md"
|
||||||
|
requires-python = ">=3.11"
|
||||||
|
license = {text = "MIT"}
|
||||||
|
authors = [
|
||||||
|
{name = "Claudia & Albert", email = "hildalbert@gmail.com"},
|
||||||
|
]
|
||||||
|
|
||||||
|
[project.scripts]
|
||||||
|
cortex = "cortex.cli:main"
|
||||||
|
|
||||||
|
[tool.setuptools.packages.find]
|
||||||
|
include = ["cortex*"]
|
||||||
|
|
||||||
|
[tool.pytest.ini_options]
|
||||||
|
testpaths = ["tests"]
|
||||||
303
tests/test_enhancements.py
Executable file
303
tests/test_enhancements.py
Executable file
|
|
@ -0,0 +1,303 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
Tests for memory enhancement components.
|
||||||
|
Run: python3 -m pytest test_enhancements.py -v
|
||||||
|
or: python3 test_enhancements.py
|
||||||
|
"""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import sys
|
||||||
|
import time
|
||||||
|
import unittest
|
||||||
|
from datetime import date, timedelta
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
# Ensure our modules are importable
|
||||||
|
sys.path.insert(0, str(Path(__file__).parent))
|
||||||
|
|
||||||
|
from cortex.composite_scorer import (
|
||||||
|
SearchResult, extract_date, recency_score, source_weight,
|
||||||
|
multi_term_confidence, score_results,
|
||||||
|
)
|
||||||
|
from cortex.intent_classifier import classify, reset_cache, IntentResult
|
||||||
|
from cortex.auto_handoff import extract_markers, format_handoff, generate_handoff
|
||||||
|
|
||||||
|
|
||||||
|
class TestCompositeScorer(unittest.TestCase):
    """Tests for composite_scorer.py"""

    # --- extract_date: pulls an ISO date from the path or the text ---

    def test_extract_date_from_path(self):
        r = SearchResult(text="test", source_path="memory/2026-02-07.md")
        self.assertEqual(extract_date(r), date(2026, 2, 7))

    def test_extract_date_from_content(self):
        r = SearchResult(text="On 2026-01-15 we decided to...", source_path="MEMORY.md")
        self.assertEqual(extract_date(r), date(2026, 1, 15))

    def test_extract_date_none(self):
        # No date anywhere -> None rather than a guess.
        r = SearchResult(text="no date here", source_path="README.md")
        self.assertIsNone(extract_date(r))

    # --- recency_score: decay with a configurable half-life ---

    def test_recency_today(self):
        today = date.today()
        score = recency_score(today, today)
        self.assertAlmostEqual(score, 1.0, places=2)

    def test_recency_half_life(self):
        # At exactly one half-life the score should have decayed to 0.5.
        today = date.today()
        half_life = 14
        old = today - timedelta(days=half_life)
        score = recency_score(old, today, half_life)
        self.assertAlmostEqual(score, 0.5, places=2)

    def test_recency_very_old(self):
        today = date.today()
        old = today - timedelta(days=365)
        score = recency_score(old, today, 14)
        self.assertLess(score, 0.01)

    def test_recency_no_date(self):
        # Undated results get a fixed neutral score of 0.3.
        score = recency_score(None)
        self.assertEqual(score, 0.3)

    # --- source_weight: per-source multipliers with a "default" fallback ---

    def test_source_weight_memory_md(self):
        w = source_weight("MEMORY.md", {"MEMORY.md": 1.0, "default": 0.4})
        self.assertEqual(w, 1.0)

    def test_source_weight_daily_note(self):
        # A directory-prefix key ("memory/") applies to files beneath it.
        weights = {"memory/": 0.7, "default": 0.4}
        w = source_weight("memory/2026-02-07.md", weights)
        self.assertEqual(w, 0.7)

    def test_source_weight_default(self):
        w = source_weight("random/file.txt", {"MEMORY.md": 1.0, "default": 0.4})
        self.assertEqual(w, 0.4)

    # --- multi_term_confidence: fraction of query terms found in the text ---

    def test_multi_term_all_match(self):
        score = multi_term_confidence("gateway fix watchdog", "The gateway fix for watchdog issue")
        self.assertAlmostEqual(score, 1.0)

    def test_multi_term_partial(self):
        # 1 of 3 query terms present -> ~1/3.
        score = multi_term_confidence("gateway fix watchdog", "The gateway is running fine")
        self.assertAlmostEqual(score, 1/3, places=2)

    def test_multi_term_none(self):
        score = multi_term_confidence("gateway fix", "completely unrelated text")
        self.assertEqual(score, 0.0)

    def test_multi_term_empty_query(self):
        # An empty query is treated as neutral (0.5), not zero.
        score = multi_term_confidence("", "some text")
        self.assertEqual(score, 0.5)

    # --- score_results: composite of search score, recency and source ---

    def test_score_results_ordering(self):
        """Recent high-source results should rank above old high-search-score results."""
        today = date.today()
        recent_date = today.strftime("%Y-%m-%d")
        old_date = (today - timedelta(days=90)).strftime("%Y-%m-%d")

        results = [
            SearchResult(text="old but high match", source_path=f"memory/{old_date}.md", original_score=0.95),
            SearchResult(text="recent in MEMORY", source_path="MEMORY.md", original_score=0.7,
                         metadata={"date": recent_date}),
        ]
        scored = score_results(results, query="test query", reference_date=today)
        # MEMORY.md with recent date should rank higher due to source + recency
        self.assertEqual(scored[0].source_path, "MEMORY.md")

    def test_score_results_empty(self):
        self.assertEqual(score_results([], query="test"), [])

    def test_scoring_performance(self):
        """Composite scoring should be <10ms for 50 results."""
        results = [
            SearchResult(text=f"Result {i} about gateway and NATS",
                         source_path=f"memory/2026-01-{i%28+1:02d}.md",
                         original_score=0.5 + (i % 10) / 20)
            for i in range(50)
        ]
        start = time.perf_counter()
        score_results(results, query="gateway NATS")
        elapsed_ms = (time.perf_counter() - start) * 1000
        self.assertLess(elapsed_ms, 10, f"Scoring took {elapsed_ms:.1f}ms, should be <10ms")
|
||||||
|
|
||||||
|
|
||||||
|
class TestIntentClassifier(unittest.TestCase):
    """Tests for intent_classifier.py"""

    def setUp(self):
        # The classifier caches; reset so each test observes a cold run
        # (also keeps the per-query timing assertions honest).
        reset_cache()

    # --- intent detection across English and German queries ---

    def test_who_query_english(self):
        r = classify("Albert Hild contact")
        self.assertEqual(r.intent, "WHO")

    def test_who_query_german(self):
        r = classify("wer ist Sebastian Baier")
        self.assertEqual(r.intent, "WHO")

    def test_when_query(self):
        r = classify("when did we fix the gateway")
        self.assertEqual(r.intent, "WHEN")

    def test_when_query_german(self):
        r = classify("wann wurde TypeDB eingerichtet")
        self.assertEqual(r.intent, "WHEN")

    def test_why_query(self):
        r = classify("why did we choose NATS over Kafka")
        self.assertEqual(r.intent, "WHY")

    def test_why_query_german(self):
        r = classify("warum ChromaDB statt Pinecone")
        self.assertEqual(r.intent, "WHY")

    def test_what_query(self):
        r = classify("Mondo Gate regulatory status")
        self.assertEqual(r.intent, "WHAT")

    def test_empty_query(self):
        # Empty input falls back to WHAT with low confidence.
        r = classify("")
        self.assertEqual(r.intent, "WHAT")
        self.assertLess(r.confidence, 0.5)

    def test_mixed_language(self):
        # English keyword + German noun in one query still classifies.
        r = classify("who is the Ansprechpartner for Mondo Gate")
        self.assertEqual(r.intent, "WHO")

    def test_classification_speed(self):
        """Intent classification must be <5ms."""
        queries = [
            "Albert Hild contact", "when did we fix the gateway",
            "why NATS over Kafka", "infrastructure status",
            "wer ist bei Vainplex", "wann Viola fix",
        ]
        for q in queries:
            r = classify(q)
            self.assertLess(r.classification_ms, 5.0,
                            f"Classification of '{q}' took {r.classification_ms:.2f}ms")

    def test_capitalized_names_boost_who(self):
        # Proper-noun tokens alone should be enough to tip toward WHO.
        r = classify("Sebastian Baier Mondo Gate")
        self.assertEqual(r.intent, "WHO")

    def test_date_tokens_boost_when(self):
        # A month name should tip an otherwise-WHAT query toward WHEN.
        r = classify("watchdog incident February")
        self.assertEqual(r.intent, "WHEN")

    def test_returns_weight_adjustments(self):
        r = classify("warum ChromaDB statt Pinecone")
        self.assertEqual(r.intent, "WHY")
        # WHY should have weight adjustments for MEMORY.md boost
        self.assertIsInstance(r.weight_adjustments, dict)
|
||||||
|
|
||||||
|
|
||||||
|
class TestAutoHandoff(unittest.TestCase):
    """Tests for auto_handoff.py"""

    # Fixture note: covers DECISION/TODO/BLOCKED/QUESTION markers both in
    # bullets and at top level, plus "- [ ]" checkboxes and "##" headings.
    SAMPLE_CONTENT = """# Session 2026-02-07

## Infrastructure Work
- Fixed gateway watchdog issue
- DECISION: Use NATS instead of Kafka for event streaming
- TODO: Set up monitoring for new NATS cluster
- BLOCKED: Waiting for DNS propagation for new domain

## Open Items
- QUESTION: Should we migrate old events to new format?
- [ ] Update documentation
- [ ] Run integration tests

DECISION: Switch Mona to Opus model for better reasoning
TODO: Benchmark Opus vs Sonnet for our workload
"""

    def test_extract_decisions(self):
        result = extract_markers(self.SAMPLE_CONTENT)
        self.assertGreaterEqual(len(result["decisions"]), 2)
        self.assertTrue(any("NATS" in d for d in result["decisions"]))

    def test_extract_todos(self):
        result = extract_markers(self.SAMPLE_CONTENT)
        self.assertGreaterEqual(len(result["todos"]), 3)  # 2 explicit + 2 checkboxes

    def test_extract_blocked(self):
        result = extract_markers(self.SAMPLE_CONTENT)
        self.assertGreaterEqual(len(result["blocked"]), 1)
        self.assertTrue(any("DNS" in b for b in result["blocked"]))

    def test_extract_questions(self):
        result = extract_markers(self.SAMPLE_CONTENT)
        self.assertGreaterEqual(len(result["questions"]), 1)

    def test_extract_headings(self):
        # Markdown section headings land in "key_context".
        result = extract_markers(self.SAMPLE_CONTENT)
        self.assertGreaterEqual(len(result.get("key_context", [])), 1)

    def test_format_handoff(self):
        extracted = {
            "decisions": ["Use NATS"],
            "todos": ["Set up monitoring"],
            "blocked": ["DNS propagation"],
            "questions": ["Migrate events?"],
        }
        md = format_handoff(extracted, title="Test Handoff")
        self.assertIn("# Test Handoff", md)
        self.assertIn("✅ Decisions", md)
        self.assertIn("Use NATS", md)
        self.assertIn("📋 Next Steps", md)

    def test_format_empty(self):
        # No markers -> still a well-formed handoff with the default title.
        md = format_handoff({})
        self.assertIn("Session Handoff", md)

    def test_generate_handoff_regex(self):
        result = generate_handoff(self.SAMPLE_CONTENT, source="test.md")
        self.assertIn("NATS", result)
        self.assertIn("DNS", result)

    def test_real_daily_note(self):
        """Test with a real daily note if available."""
        # Environment-dependent: silently a no-op when the note is absent.
        note_path = Path.home() / "clawd" / "memory" / "2026-02-08.md"
        if note_path.exists():
            content = note_path.read_text()
            result = extract_markers(content)
            # Should at least extract headings
            self.assertIsInstance(result, dict)
            self.assertIn("key_context", result)
|
||||||
|
|
||||||
|
|
||||||
|
class TestIntegration(unittest.TestCase):
    """Integration tests for the full pipeline."""

    # NOTE(review): these tests import cortex.enhanced_search lazily and hit
    # the real memory/ directory — results depend on the local environment.

    def test_file_search_finds_results(self):
        """File search should find results in memory/."""
        from cortex.enhanced_search import search_files
        results = search_files("gateway")
        # Should find at least something in memory files
        self.assertIsInstance(results, list)

    def test_enhanced_search_pipeline(self):
        """Full pipeline should run without errors."""
        from cortex.enhanced_search import enhanced_search
        result = enhanced_search("gateway", use_unified=False, max_results=5)
        # Response contract: four top-level keys plus the classified intent.
        self.assertIn("query", result)
        self.assertIn("intent", result)
        self.assertIn("results", result)
        self.assertIn("timing", result)
        self.assertEqual(result["intent"]["type"], "WHAT")

    def test_pipeline_who_query(self):
        from cortex.enhanced_search import enhanced_search
        result = enhanced_search("Albert Hild contact", use_unified=False, max_results=5)
        self.assertEqual(result["intent"]["type"], "WHO")

    def test_pipeline_timing(self):
        """Full pipeline without unified should be fast."""
        from cortex.enhanced_search import enhanced_search
        result = enhanced_search("test query", use_unified=False, max_results=5)
        # Should complete in reasonable time (< 2 seconds for file search)
        self.assertLess(result["timing"]["total_ms"], 2000)
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == "__main__":
|
||||||
|
unittest.main(verbosity=2)
|
||||||
341
tests/test_intelligence.py
Normal file
341
tests/test_intelligence.py
Normal file
|
|
@ -0,0 +1,341 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""Tests for triage.py and memory_hygiene.py — 35+ tests."""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import shutil
|
||||||
|
import sys
|
||||||
|
import tempfile
|
||||||
|
import unittest
|
||||||
|
from datetime import datetime, timedelta
|
||||||
|
from pathlib import Path
|
||||||
|
from unittest.mock import patch
|
||||||
|
|
||||||
|
sys.path.insert(0, os.path.dirname(__file__))
|
||||||
|
from cortex.triage import score_task, rank_tasks, analyze_message, TriageScore
|
||||||
|
import cortex.memory_hygiene as mh
|
||||||
|
|
||||||
|
|
||||||
|
class TestTriageUrgency(unittest.TestCase):
    """Test urgency scoring dimension."""

    # Thresholds (0.7 / 0.8 / 0.5 / 0.3) pin the scoring bands; German and
    # English trigger words are exercised separately.

    def test_high_urgency_german(self):
        s = score_task("Das muss JETZT sofort gefixt werden!")
        self.assertGreater(s.urgency, 0.7)

    def test_high_urgency_english(self):
        s = score_task("URGENT: system is down, critical error!")
        self.assertGreater(s.urgency, 0.7)

    def test_low_urgency(self):
        s = score_task("Update the documentation when you have time")
        self.assertLess(s.urgency, 0.3)

    def test_emergency(self):
        s = score_task("Notfall! Alles kaputt!")
        self.assertGreater(s.urgency, 0.8)

    def test_deadline_urgency(self):
        s = score_task("Deadline today, needs to be done ASAP")
        self.assertGreater(s.urgency, 0.5)

    def test_no_urgency(self):
        # Text with no urgency signals at all scores exactly zero.
        s = score_task("Nice to have feature for later")
        self.assertEqual(s.urgency, 0.0)
|
||||||
|
|
||||||
|
|
||||||
|
class TestTriageImportance(unittest.TestCase):
    """Test importance scoring dimension."""

    def test_production_security(self):
        s = score_task("Production security breach detected")
        self.assertGreater(s.importance, 0.7)

    def test_customer_money(self):
        # German phrasing of a revenue-impacting customer issue.
        s = score_task("Kunde verliert Geld wegen Fehler")
        self.assertGreater(s.importance, 0.6)

    def test_regulatory(self):
        # Regulatory/compliance keywords score highest of all.
        s = score_task("BaFin compliance audit next week")
        self.assertGreater(s.importance, 0.8)

    def test_low_importance(self):
        s = score_task("Change button color on internal tool")
        self.assertLess(s.importance, 0.3)

    def test_gateway_dns(self):
        # Infrastructure keywords (gateway/DNS) carry medium-high weight.
        s = score_task("Gateway DNS resolution failing")
        self.assertGreater(s.importance, 0.5)

    def test_albert_request(self):
        # A direct request from the principal bumps importance.
        s = score_task("Albert wants this done")
        self.assertGreater(s.importance, 0.4)
|
||||||
|
|
||||||
|
|
||||||
|
class TestTriageEffort(unittest.TestCase):
    """Test effort estimation."""

    def test_quick_fix(self):
        s = score_task("Quick fix: change config value")
        self.assertLess(s.effort, 0.4)

    def test_major_refactor(self):
        s = score_task("Complete refactor of the migration system")
        self.assertGreater(s.effort, 0.6)

    def test_simple_german(self):
        s = score_task("Einfach schnell den Typo fixen")
        self.assertLess(s.effort, 0.3)

    def test_default_effort(self):
        # Without any effort signals the estimate sits at the 0.5 midpoint.
        s = score_task("Do something")
        self.assertAlmostEqual(s.effort, 0.5, places=1)
|
||||||
|
|
||||||
|
|
||||||
|
class TestTriageReadiness(unittest.TestCase):
    """Test readiness/dependency detection."""

    def test_blocked(self):
        s = score_task("Blocked: waiting for API key from vendor")
        self.assertLess(s.readiness, 0.5)

    def test_german_blocked(self):
        # German blockers ("brauche erst", "warte auf") count too.
        s = score_task("Brauche erst die Credentials, warte auf Albert")
        self.assertLess(s.readiness, 0.5)

    def test_ready(self):
        # No dependency signals -> fully ready (exactly 1.0).
        s = score_task("Fix the login page CSS")
        self.assertEqual(s.readiness, 1.0)

    def test_depends_on(self):
        s = score_task("Depends on database migration finishing first")
        self.assertLess(s.readiness, 0.5)
|
||||||
|
|
||||||
|
|
||||||
|
class TestTriagePriority(unittest.TestCase):
    """Test overall priority scoring."""

    def test_critical_scores_high(self):
        s = score_task("URGENT: Production is down! Critical security breach!")
        self.assertGreater(s.priority, 0.6)

    def test_blocked_lowers_priority(self):
        # Same task text; the blocked variant must rank strictly lower.
        ready = score_task("Fix production error")
        blocked = score_task("Fix production error, blocked by vendor")
        self.assertGreater(ready.priority, blocked.priority)

    def test_easy_beats_hard_all_else_equal(self):
        easy = score_task("Quick config fix for gateway")
        hard = score_task("Complete refactor redesign for gateway")
        # Both have gateway importance, but effort differs
        self.assertGreater(easy.priority, hard.priority)
|
||||||
|
|
||||||
|
|
||||||
|
class TestTriageRanking(unittest.TestCase):
    """Test ranking multiple tasks."""

    def test_rank_order(self):
        ranked = rank_tasks([
            "Write docs",
            "URGENT: Production down!",
            "Update OpenClaw config",
        ])
        # The urgent task must come out on top; nothing is dropped.
        self.assertEqual(ranked[0].text, "URGENT: Production down!")
        self.assertEqual(len(ranked), 3)

    def test_rank_preserves_all(self):
        tasks = ["a", "b", "c", "d"]
        ranked = rank_tasks(tasks)
        self.assertEqual(len(ranked), 4)

    def test_rank_descending(self):
        # Output is sorted by priority, highest first (non-increasing).
        ranked = rank_tasks(["Fix docs", "CRITICAL production down", "Nice to have"])
        for i in range(len(ranked) - 1):
            self.assertGreaterEqual(ranked[i].priority, ranked[i + 1].priority)
|
||||||
|
|
||||||
|
|
||||||
|
class TestTriageAnalyze(unittest.TestCase):
    """Test message analysis."""

    def test_analyze_returns_signals(self):
        # Matched trigger words are reported lowercased per dimension.
        r = analyze_message("JETZT sofort Production fixen!")
        self.assertIn("jetzt", r["signals"]["urgency"])
        self.assertIn("sofort", r["signals"]["urgency"])
        self.assertIn("production", r["signals"]["importance"])

    def test_analyze_classification_critical(self):
        r = analyze_message("URGENT critical production security down!")
        self.assertIn("CRITICAL", r["classification"])

    def test_analyze_classification_low(self):
        r = analyze_message("Maybe someday update the readme")
        self.assertIn("LOW", r["classification"])
|
||||||
|
|
||||||
|
|
||||||
|
class TestMemoryDuplicates(unittest.TestCase):
    """Test duplicate detection."""

    def setUp(self):
        # Point the module-level MEMORY_DIR at a throwaway sandbox so the
        # tests never touch the real memory directory.
        self.tmpdir = Path(tempfile.mkdtemp())
        self.orig_dir = mh.MEMORY_DIR
        mh.MEMORY_DIR = self.tmpdir

    def tearDown(self):
        # Restore the global before deleting the sandbox.
        mh.MEMORY_DIR = self.orig_dir
        shutil.rmtree(self.tmpdir)

    def test_finds_exact_duplicates(self):
        para = "This is a sufficiently long paragraph that should be detected as duplicate content across files."
        (self.tmpdir / "a.md").write_text(f"# A\n\n{para}\n\nOther stuff.")
        (self.tmpdir / "b.md").write_text(f"# B\n\n{para}\n\nDifferent stuff.")
        dupes = mh.find_duplicates(min_length=20)
        self.assertGreater(len(dupes), 0)

    def test_no_false_positives(self):
        (self.tmpdir / "a.md").write_text("# Unique content A\n\nCompletely different paragraph about apples.")
        (self.tmpdir / "b.md").write_text("# Unique content B\n\nTotally unrelated text about oranges.")
        dupes = mh.find_duplicates(min_length=20)
        self.assertEqual(len(dupes), 0)

    def test_short_paragraphs_ignored(self):
        # Identical content below min_length must not be reported.
        (self.tmpdir / "a.md").write_text("Hi\n\nHi")
        (self.tmpdir / "b.md").write_text("Hi\n\nHi")
        dupes = mh.find_duplicates(min_length=50)
        self.assertEqual(len(dupes), 0)
|
||||||
|
|
||||||
|
|
||||||
|
class TestMemoryStaleness(unittest.TestCase):
    """Test staleness detection."""

    def setUp(self):
        # Sandbox the module-level MEMORY_DIR (see TestMemoryDuplicates).
        self.tmpdir = Path(tempfile.mkdtemp())
        self.orig_dir = mh.MEMORY_DIR
        mh.MEMORY_DIR = self.tmpdir

    def tearDown(self):
        mh.MEMORY_DIR = self.orig_dir
        shutil.rmtree(self.tmpdir)

    def test_old_todo(self):
        f = self.tmpdir / "notes.md"
        f.write_text("# Notes\n\nTODO: fix this thing\n")
        # Set mtime to 60 days ago
        old = (datetime.now() - timedelta(days=60)).timestamp()
        os.utime(f, (old, old))
        stale = mh.find_stale()
        reasons = [s["reason"] for s in stale]
        self.assertTrue(any("TODO" in r for r in reasons))

    def test_old_date(self):
        # An in-content date ~120 days back should flag the file as stale.
        f = self.tmpdir / "info.md"
        old_date = (datetime.now() - timedelta(days=120)).strftime("%Y-%m-%d")
        f.write_text(f"Meeting on {old_date} decided X.\n")
        stale = mh.find_stale()
        self.assertGreater(len(stale), 0)

    def test_fresh_content_ok(self):
        f = self.tmpdir / "fresh.md"
        today = datetime.now().strftime("%Y-%m-%d")
        f.write_text(f"Updated {today}: everything is fine.\n")
        stale = mh.find_stale()
        # Only filter date-based findings; other reasons are irrelevant here.
        date_stale = [s for s in stale if "days old" in s.get("reason", "")]
        self.assertEqual(len(date_stale), 0)
|
||||||
|
|
||||||
|
|
||||||
|
class TestMemoryOrphans(unittest.TestCase):
    """Test orphan detection."""

    def setUp(self):
        # Sandbox the module-level MEMORY_DIR (see TestMemoryDuplicates).
        self.tmpdir = Path(tempfile.mkdtemp())
        self.orig_dir = mh.MEMORY_DIR
        mh.MEMORY_DIR = self.tmpdir

    def tearDown(self):
        mh.MEMORY_DIR = self.orig_dir
        shutil.rmtree(self.tmpdir)

    def test_finds_orphaned_files(self):
        # A file no other file links to is an orphan.
        (self.tmpdir / "orphan.md").write_text("Nobody links to me")
        (self.tmpdir / "main.md").write_text("# Main\nSome text.")
        orph = mh.find_orphans()
        self.assertIn("orphan.md", orph["orphaned_files"])

    def test_finds_broken_links(self):
        # A markdown link to a nonexistent target is reported.
        (self.tmpdir / "a.md").write_text("[click](nonexistent.md)")
        orph = mh.find_orphans()
        self.assertGreater(len(orph["broken_links"]), 0)

    def test_finds_empty_files(self):
        (self.tmpdir / "empty.md").write_text("")
        orph = mh.find_orphans()
        self.assertIn("empty.md", orph["empty_files"])

    def test_permanent_files_not_orphaned(self):
        # Well-known permanent files (e.g. WORKING.md) are exempt.
        (self.tmpdir / "WORKING.md").write_text("Current work")
        orph = mh.find_orphans()
        self.assertNotIn("WORKING.md", orph["orphaned_files"])
|
||||||
|
|
||||||
|
|
||||||
|
class TestMemoryStats(unittest.TestCase):
    """Test stats generation."""

    def setUp(self):
        # Sandbox the module-level MEMORY_DIR (see TestMemoryDuplicates).
        self.tmpdir = Path(tempfile.mkdtemp())
        self.orig_dir = mh.MEMORY_DIR
        mh.MEMORY_DIR = self.tmpdir

    def tearDown(self):
        mh.MEMORY_DIR = self.orig_dir
        shutil.rmtree(self.tmpdir)

    def test_stats_structure(self):
        # Stats break down by extension and track oldest/newest files.
        (self.tmpdir / "a.md").write_text("Hello world")
        (self.tmpdir / "b.json").write_text("{}")
        stats = mh.gather_stats()
        self.assertEqual(stats["total_files"], 2)
        self.assertIn(".md", stats["files_by_extension"])
        self.assertIn(".json", stats["files_by_extension"])
        self.assertIsNotNone(stats["oldest"])
        self.assertIsNotNone(stats["newest"])

    def test_empty_dir(self):
        # An empty memory dir must not crash stats gathering.
        stats = mh.gather_stats()
        self.assertEqual(stats["total_files"], 0)
|
||||||
|
|
||||||
|
|
||||||
|
class TestMemoryArchive(unittest.TestCase):
    """Test archive functionality."""

    def setUp(self):
        # Redirect both module-level directory globals into a temp sandbox.
        self.tmpdir = Path(tempfile.mkdtemp())
        self.orig_dir = mh.MEMORY_DIR
        self.orig_archive = mh.ARCHIVE_DIR
        mh.MEMORY_DIR = self.tmpdir
        mh.ARCHIVE_DIR = self.tmpdir / "archive"

    def tearDown(self):
        # Restore both globals before removing the sandbox.
        mh.MEMORY_DIR = self.orig_dir
        mh.ARCHIVE_DIR = self.orig_archive
        shutil.rmtree(self.tmpdir)

    def test_dry_run_doesnt_move(self):
        # execute=False reports what would move but leaves files in place.
        (self.tmpdir / "2025-01-01.md").write_text("Old note")
        result = mh.archive_old_notes(older_than_days=30, execute=False)
        self.assertTrue(result["dry_run"])
        self.assertEqual(result["count"], 1)
        self.assertTrue((self.tmpdir / "2025-01-01.md").exists())

    def test_execute_moves_files(self):
        # Archived notes are filed under archive/<year>/.
        (self.tmpdir / "2025-01-01.md").write_text("Old note")
        result = mh.archive_old_notes(older_than_days=30, execute=True)
        self.assertFalse((self.tmpdir / "2025-01-01.md").exists())
        self.assertTrue((self.tmpdir / "archive" / "2025" / "2025-01-01.md").exists())

    def test_permanent_files_kept(self):
        # Permanent files (e.g. WORKING.md) survive even aggressive cutoffs.
        (self.tmpdir / "WORKING.md").write_text("Keep me")
        result = mh.archive_old_notes(older_than_days=1, execute=True)
        self.assertTrue((self.tmpdir / "WORKING.md").exists())
|
||||||
|
|
||||||
|
|
||||||
|
# Allow running this test module directly (outside a test runner).
if __name__ == "__main__":
    unittest.main()
346
tests/test_proactive.py
Normal file
346
tests/test_proactive.py
Normal file
|
|
@ -0,0 +1,346 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""Tests for health_scanner.py and roadmap.py — 30+ tests."""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
import tempfile
|
||||||
|
import unittest
|
||||||
|
from datetime import datetime, timedelta
|
||||||
|
from pathlib import Path
|
||||||
|
from unittest.mock import patch, MagicMock
|
||||||
|
|
||||||
|
# Add parent to path
|
||||||
|
sys.path.insert(0, str(Path(__file__).parent))
|
||||||
|
|
||||||
|
from cortex.health_scanner import HealthScanner, Finding, _severity_rank, format_human, DEPRECATED_MODELS
|
||||||
|
import cortex.roadmap as roadmap
|
||||||
|
|
||||||
|
|
||||||
|
class TestSeverityRank(unittest.TestCase):
    """Severity labels must rank strictly INFO < WARN < CRITICAL."""

    def test_ordering(self):
        ladder = ["INFO", "WARN", "CRITICAL"]
        for lower, higher in zip(ladder, ladder[1:]):
            self.assertLess(_severity_rank(lower), _severity_rank(higher))

    def test_unknown(self):
        # Unrecognized labels sort below everything else.
        self.assertEqual(_severity_rank("UNKNOWN"), -1)
class TestFinding(unittest.TestCase):
    """Finding.to_dict serialization."""

    def test_to_dict(self):
        serialized = Finding("agents", "WARN", "test title", "detail").to_dict()
        expectations = (
            ("section", "agents"),
            ("severity", "WARN"),
            ("title", "test title"),
        )
        for key, expected in expectations:
            self.assertEqual(serialized[key], expected)

    def test_to_dict_no_detail(self):
        # An omitted detail serializes as an empty string.
        serialized = Finding("deps", "INFO", "ok").to_dict()
        self.assertEqual(serialized["detail"], "")
class TestHealthScanner(unittest.TestCase):
    """HealthScanner checks, exercised with injected configs and mocked I/O."""

    def _make_scanner(self, config=None):
        # Patch _load_config so constructing HealthScanner does not read
        # the real config file; then inject the test config directly.
        with patch.object(HealthScanner, '_load_config') as mock_load:
            scanner = HealthScanner()
            scanner.config = config or {"agents": {"list": [], "defaults": {}}}
            scanner.findings = []
            return scanner

    def test_no_agents(self):
        scanner = self._make_scanner({"agents": {"list": []}})
        scanner.check_agents()
        self.assertTrue(any("No agents" in f.title for f in scanner.findings))

    def test_missing_workspace(self):
        scanner = self._make_scanner({"agents": {"list": [
            {"id": "test", "workspace": "/nonexistent/path/xyz", "model": {"primary": "anthropic/test"}}
        ]}})
        scanner.check_agents()
        self.assertTrue(any("missing" in f.title.lower() for f in scanner.findings))

    def test_valid_workspace(self):
        with tempfile.TemporaryDirectory() as td:
            scanner = self._make_scanner({"agents": {"list": [
                {"id": "test", "workspace": td, "model": {"primary": "anthropic/test"}}
            ]}})
            scanner.check_agents()
            self.assertTrue(any("OK" in f.title for f in scanner.findings))

    @patch('cortex.health_scanner.urllib.request.urlopen')
    def test_ollama_check_reachable(self, mock_urlopen):
        # Fake a successful /api/tags response that lists the model; the
        # mock must also behave as a context manager.
        mock_resp = MagicMock()
        mock_resp.read.return_value = json.dumps({"models": [{"name": "mymodel:latest"}]}).encode()
        mock_resp.__enter__ = lambda s: s
        mock_resp.__exit__ = MagicMock(return_value=False)
        mock_urlopen.return_value = mock_resp

        scanner = self._make_scanner()
        scanner._check_ollama_model("test", "ollama-desktop/mymodel:latest")
        self.assertTrue(any("available" in f.title for f in scanner.findings))

    @patch('cortex.health_scanner.urllib.request.urlopen')
    def test_ollama_check_unreachable(self, mock_urlopen):
        mock_urlopen.side_effect = Exception("connection refused")
        scanner = self._make_scanner()
        scanner._check_ollama_model("test", "ollama-desktop/model:latest")
        self.assertTrue(any("unreachable" in f.title.lower() for f in scanner.findings))

    def test_memory_check(self):
        # Runs against the real host; only asserts that a finding is emitted.
        scanner = self._make_scanner()
        scanner._check_memory()
        self.assertTrue(any("Memory" in f.title for f in scanner.findings))

    def test_disk_check(self):
        # Runs against the real host; only asserts that a finding is emitted.
        scanner = self._make_scanner()
        scanner._check_disk()
        self.assertTrue(any("Disk" in f.title for f in scanner.findings))

    @patch('cortex.health_scanner.subprocess.run')
    def test_nats_active(self, mock_run):
        mock_run.return_value = MagicMock(returncode=0, stdout="active")
        scanner = self._make_scanner()
        scanner._check_nats()
        self.assertTrue(any("NATS" in f.title and f.severity == "INFO" for f in scanner.findings))

    @patch('cortex.health_scanner.subprocess.run')
    def test_nats_inactive(self, mock_run):
        mock_run.return_value = MagicMock(returncode=3, stdout="inactive")
        scanner = self._make_scanner()
        scanner._check_nats()
        self.assertTrue(any("NATS" in f.title and f.severity == "CRITICAL" for f in scanner.findings))

    def test_deprecated_model_detection(self):
        scanner = self._make_scanner({"agents": {
            "list": [{"id": "test", "model": {"primary": "anthropic/claude-3-5-haiku-latest", "fallbacks": []}}],
            "defaults": {"model": {}, "models": {}, "heartbeat": {}}
        }})
        scanner.check_config()
        self.assertTrue(any("EOL" in f.title for f in scanner.findings))

    def test_run_all_sections(self):
        scanner = self._make_scanner({"agents": {"list": [], "defaults": {"model": {}, "models": {}, "heartbeat": {}}}})
        report = scanner.run()
        self.assertIn("timestamp", report)
        self.assertIn("overall", report)
        self.assertIn("findings", report)

    def test_run_single_section(self):
        # Restricting run() to one section must filter findings accordingly.
        scanner = self._make_scanner({"agents": {"list": []}})
        report = scanner.run(["agents"])
        self.assertTrue(all(f["section"] == "agents" for f in report["findings"]))

    def test_format_human(self):
        report = {
            "timestamp": "2026-02-08T20:00:00",
            "overall": "WARN",
            "findings_count": {"INFO": 1, "WARN": 1, "CRITICAL": 0},
            "findings": [
                {"section": "agents", "severity": "WARN", "title": "test warn", "detail": ""},
                {"section": "deps", "severity": "INFO", "title": "test info", "detail": ""},
            ]
        }
        output = format_human(report)
        self.assertIn("WARN", output)
        self.assertIn("test warn", output)
class TestRoadmap(unittest.TestCase):
    """Roadmap persistence, item lookup, date parsing, and status queries.

    setUp seeds four items covering the interesting states: overdue
    (item-001), upcoming with an incomplete dependency (item-002), done
    (item-003), and stale with a missing dependency (item-004).
    """

    def setUp(self):
        self.tmpdir = tempfile.mkdtemp()
        self.roadmap_file = Path(self.tmpdir) / "roadmap.json"
        self.seed_data = {
            "items": [
                {
                    "id": "item-001",
                    "title": "Test task 1",
                    "status": "open",
                    "priority": "P0",
                    # One day in the past -> always overdue.
                    "deadline": (datetime.now() - timedelta(days=1)).strftime("%Y-%m-%d"),
                    "depends_on": [],
                    "tags": ["infra"],
                    "created": "2026-01-01T00:00:00",
                    "updated": "2026-01-01T00:00:00",
                    "notes": ""
                },
                {
                    "id": "item-002",
                    "title": "Test task 2",
                    "status": "in_progress",
                    "priority": "P1",
                    # Three days out -> inside the 7-day upcoming window.
                    "deadline": (datetime.now() + timedelta(days=3)).strftime("%Y-%m-%d"),
                    "depends_on": ["item-001"],
                    "tags": ["business"],
                    "created": "2026-01-01T00:00:00",
                    "updated": "2026-01-01T00:00:00",
                    "notes": ""
                },
                {
                    "id": "item-003",
                    "title": "Done task",
                    "status": "done",
                    "priority": "P2",
                    "deadline": "2026-01-01",
                    "depends_on": [],
                    "tags": ["infra"],
                    "created": "2026-01-01T00:00:00",
                    "updated": "2026-01-01T00:00:00",
                    "notes": ""
                },
                {
                    "id": "item-004",
                    "title": "Stale task",
                    "status": "in_progress",
                    "priority": "P2",
                    # Fixed: was the confusing no-op "null if False else None"
                    # (it always evaluated to None; `null` is not a Python name).
                    "deadline": None,
                    # item-999 does not exist -> exercises missing-dep checks.
                    "depends_on": ["item-999"],
                    "tags": [],
                    "created": "2026-01-01T00:00:00",
                    # Updated 10 days ago -> past the 7-day staleness threshold.
                    "updated": (datetime.now() - timedelta(days=10)).strftime("%Y-%m-%dT%H:%M:%S"),
                    "notes": ""
                }
            ]
        }
        self.roadmap_file.write_text(json.dumps(self.seed_data))

    def tearDown(self):
        # Local import: shutil is not used anywhere else in this module.
        import shutil
        shutil.rmtree(self.tmpdir)

    def test_load(self):
        data = roadmap.load_roadmap(self.roadmap_file)
        self.assertEqual(len(data["items"]), 4)

    def test_load_nonexistent(self):
        # Missing file -> empty roadmap skeleton, not an error.
        data = roadmap.load_roadmap(Path(self.tmpdir) / "nope.json")
        self.assertEqual(data, {"items": []})

    def test_save_and_reload(self):
        data = roadmap.load_roadmap(self.roadmap_file)
        data["items"].append({"id": "new", "title": "new"})
        roadmap.save_roadmap(data, self.roadmap_file)
        reloaded = roadmap.load_roadmap(self.roadmap_file)
        self.assertEqual(len(reloaded["items"]), 5)

    def test_find_item_full_id(self):
        data = roadmap.load_roadmap(self.roadmap_file)
        item = roadmap.find_item(data, "item-001")
        self.assertIsNotNone(item)
        self.assertEqual(item["title"], "Test task 1")

    def test_find_item_prefix(self):
        # Prefix lookup is supported (an ambiguous prefix still matches).
        data = roadmap.load_roadmap(self.roadmap_file)
        item = roadmap.find_item(data, "item-00")
        self.assertIsNotNone(item)

    def test_find_item_missing(self):
        data = roadmap.load_roadmap(self.roadmap_file)
        self.assertIsNone(roadmap.find_item(data, "nonexistent"))

    def test_parse_date_iso(self):
        d = roadmap.parse_date("2026-02-08")
        self.assertEqual(d.year, 2026)
        self.assertEqual(d.month, 2)

    def test_parse_date_with_time(self):
        d = roadmap.parse_date("2026-02-08 09:00")
        self.assertEqual(d.hour, 9)

    def test_parse_date_none(self):
        # parse_date is lenient: None in -> None out; garbage in -> None out.
        self.assertIsNone(roadmap.parse_date(None))
        self.assertIsNone(roadmap.parse_date("not-a-date"))

    def test_overdue_detection(self):
        """Item-001 has deadline in the past → overdue."""
        data = roadmap.load_roadmap(self.roadmap_file)
        now = datetime.now()
        overdue = [i for i in data["items"] if i["status"] != "done"
                   and roadmap.parse_date(i.get("deadline"))
                   and roadmap.parse_date(i["deadline"]) < now]
        self.assertEqual(len(overdue), 1)
        self.assertEqual(overdue[0]["id"], "item-001")

    def test_upcoming_detection(self):
        data = roadmap.load_roadmap(self.roadmap_file)
        now = datetime.now()
        cutoff = now + timedelta(days=7)
        upcoming = [i for i in data["items"] if i["status"] != "done"
                    and roadmap.parse_date(i.get("deadline"))
                    and now <= roadmap.parse_date(i["deadline"]) <= cutoff]
        self.assertEqual(len(upcoming), 1)
        self.assertEqual(upcoming[0]["id"], "item-002")

    def test_dep_check_missing(self):
        data = roadmap.load_roadmap(self.roadmap_file)
        id_map = {i["id"]: i for i in data["items"]}
        # item-004 depends on item-999 which doesn't exist
        item = id_map["item-004"]
        for dep_id in item["depends_on"]:
            self.assertNotIn(dep_id, id_map)

    def test_dep_check_incomplete(self):
        data = roadmap.load_roadmap(self.roadmap_file)
        id_map = {i["id"]: i for i in data["items"]}
        # item-002 depends on item-001 which is not done
        item = id_map["item-002"]
        for dep_id in item["depends_on"]:
            dep = id_map.get(dep_id)
            self.assertIsNotNone(dep)
            self.assertNotEqual(dep["status"], "done")

    def test_stale_detection(self):
        data = roadmap.load_roadmap(self.roadmap_file)
        now = datetime.now()
        stale = [i for i in data["items"]
                 if i["status"] == "in_progress"
                 and roadmap.parse_date(i.get("updated"))
                 and (now - roadmap.parse_date(i["updated"])).days > 7]
        self.assertTrue(len(stale) >= 1)
        stale_ids = [s["id"] for s in stale]
        self.assertIn("item-004", stale_ids)

    def test_valid_statuses(self):
        for s in ["open", "in_progress", "blocked", "done"]:
            self.assertIn(s, roadmap.VALID_STATUSES)

    def test_valid_priorities(self):
        for p in ["P0", "P1", "P2", "P3"]:
            self.assertIn(p, roadmap.VALID_PRIORITIES)

    def test_now_iso(self):
        ts = roadmap.now_iso()
        # Should be parseable
        dt = datetime.fromisoformat(ts)
        self.assertIsInstance(dt, datetime)
class TestReportGeneration(unittest.TestCase):
    """cmd_report output structure, captured from stdout."""

    def test_report_contains_sections(self):
        """Capture report output and verify structure."""
        import io
        from contextlib import redirect_stdout

        # One clearly-overdue item and one active item with a near deadline.
        data = {
            "items": [
                {"id": "r1", "title": "Overdue thing", "status": "open", "priority": "P0",
                 "deadline": "2020-01-01", "depends_on": [], "tags": [], "created": "2020-01-01T00:00:00",
                 "updated": "2020-01-01T00:00:00", "notes": ""},
                {"id": "r2", "title": "Active thing", "status": "in_progress", "priority": "P1",
                 "deadline": (datetime.now() + timedelta(days=2)).strftime("%Y-%m-%d"),
                 "depends_on": [], "tags": [], "created": "2020-01-01T00:00:00",
                 "updated": "2020-01-01T00:00:00", "notes": ""},
            ]
        }

        f = io.StringIO()
        # cmd_report takes an argparse-style namespace; an empty stub suffices.
        args = type('Args', (), {})()
        with redirect_stdout(f):
            roadmap.cmd_report(args, data)
        output = f.getvalue()
        self.assertIn("Roadmap Status Report", output)
        self.assertIn("Overdue", output)
        self.assertIn("Overdue thing", output)
# Allow running this test module directly (outside a test runner).
if __name__ == "__main__":
    unittest.main()
425
tests/test_selfheal.py
Normal file
425
tests/test_selfheal.py
Normal file
|
|
@ -0,0 +1,425 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
"""Tests for feedback_loop.py and validate_output.py — 30+ tests."""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
import tempfile
|
||||||
|
import unittest
|
||||||
|
from pathlib import Path
|
||||||
|
from datetime import datetime, timedelta, timezone
|
||||||
|
|
||||||
|
sys.path.insert(0, str(Path(__file__).parent))
|
||||||
|
|
||||||
|
from cortex.feedback_loop import (
|
||||||
|
parse_since, parse_jsonl, get_text_content, get_tool_name,
|
||||||
|
detect_corrections, detect_retries, detect_tool_failures,
|
||||||
|
detect_self_errors, detect_knowledge_gaps, analyze_session,
|
||||||
|
finding_to_markdown, deduplicate_findings, load_config,
|
||||||
|
get_session_timestamp, Finding, append_to_growth_log,
|
||||||
|
)
|
||||||
|
from cortex.validate_output import (
|
||||||
|
extract_mentioned_files, extract_created_files_from_transcript,
|
||||||
|
extract_transcript_errors, check_test_results, validate_file_exists,
|
||||||
|
validate_python_syntax, validate_typescript_structure, run_validation,
|
||||||
|
ValidationReport, parse_jsonl as v_parse_jsonl,
|
||||||
|
)
|
||||||
|
|
||||||
|
# Loaded once at import time and shared by every detector test below.
DEFAULT_CONFIG = load_config()
def make_entry(role="user", text="hello", entry_type="message", **kwargs):
    """Helper to create a transcript entry.

    Extra keyword arguments are merged into the top-level entry dict.
    """
    message = {"role": role, "content": [{"type": "text", "text": text}]}
    entry = {"type": entry_type, "message": message}
    entry.update(kwargs)
    return entry
def make_tool_call(name="exec", args=None):
    """Build an assistant message entry holding a single toolCall item."""
    call_item = {"type": "toolCall", "name": name, "arguments": args or {}}
    payload = {"role": "assistant", "content": [call_item]}
    return {"type": "message", "message": payload}
def make_tool_result(text="ok", is_error=False):
    """Build a toolResult message entry with one text item and an error flag."""
    body = {
        "role": "toolResult",
        "content": [{"type": "text", "text": text}],
        "isError": is_error,
    }
    return {"type": "message", "message": body}
def write_jsonl(path, entries):
    """Write *entries* to *path* as JSON Lines, one object per line.

    Uses an explicit UTF-8 encoding so the output does not depend on the
    platform's locale default (the original relied on the default).
    """
    with open(path, "w", encoding="utf-8") as f:
        for entry in entries:
            f.write(json.dumps(entry) + "\n")
# === Feedback Loop Tests ===
|
||||||
|
|
||||||
|
class TestParseSince(unittest.TestCase):
    """parse_since turns '<N>h/d/m' into a UTC datetime that far in the past."""

    def test_hours(self):
        result = parse_since("24h")
        # 24h -> ~86400 seconds ago; 5s slack absorbs test runtime.
        self.assertAlmostEqual(
            (datetime.now(timezone.utc) - result).total_seconds(), 86400, delta=5)

    def test_days(self):
        result = parse_since("7d")
        self.assertAlmostEqual(
            (datetime.now(timezone.utc) - result).total_seconds(), 604800, delta=5)

    def test_minutes(self):
        result = parse_since("30m")
        self.assertAlmostEqual(
            (datetime.now(timezone.utc) - result).total_seconds(), 1800, delta=5)

    def test_invalid(self):
        with self.assertRaises(ValueError):
            parse_since("abc")
class TestGetTextContent(unittest.TestCase):
    """get_text_content handles list-of-items, plain-string, and empty content."""

    def test_list_content(self):
        entry = make_entry(text="hello world")
        self.assertEqual(get_text_content(entry), "hello world")

    def test_string_content(self):
        # Content may also be a bare string rather than a list of items.
        entry = {"message": {"content": "plain string"}}
        self.assertEqual(get_text_content(entry), "plain string")

    def test_empty(self):
        entry = {"message": {}}
        self.assertEqual(get_text_content(entry), "")
class TestGetToolName(unittest.TestCase):
    """get_tool_name extracts the tool name from a toolCall entry."""

    def test_tool_call(self):
        self.assertEqual(get_tool_name(make_tool_call("read")), "read")

    def test_no_tool(self):
        # A plain text entry carries no tool call.
        self.assertIsNone(get_tool_name(make_entry()))
class TestDetectCorrections(unittest.TestCase):
    """detect_corrections fires on user push-back following an assistant turn."""

    def test_detects_nein(self):
        # German push-back ("nein ... falsch") right after an assistant turn.
        entries = [
            make_entry("assistant", "Here is the result"),
            make_entry("user", "nein, das ist falsch"),
        ]
        findings = detect_corrections(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertTrue(len(findings) >= 1)
        self.assertEqual(findings[0].category, "correction")

    def test_detects_wrong(self):
        entries = [
            make_entry("assistant", "Done!"),
            make_entry("user", "That's wrong"),
        ]
        findings = detect_corrections(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertTrue(len(findings) >= 1)

    def test_no_false_positive(self):
        # Praise must not register as a correction.
        entries = [
            make_entry("assistant", "Here you go"),
            make_entry("user", "Thanks, great job!"),
        ]
        findings = detect_corrections(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 0)

    def test_requires_assistant_before(self):
        # A correction only counts as a reaction to a preceding assistant turn.
        entries = [
            make_entry("user", "nein"),
        ]
        findings = detect_corrections(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 0)
class TestDetectRetries(unittest.TestCase):
    """detect_retries flags the same tool invoked repeatedly in a row."""

    def test_detects_3_retries(self):
        # Four consecutive calls to the same tool exceed the threshold.
        entries = [make_tool_call("exec") for _ in range(4)]
        findings = detect_retries(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 1)
        self.assertIn("4 times", findings[0].trigger)

    def test_no_retry_under_threshold(self):
        entries = [make_tool_call("exec") for _ in range(2)]
        findings = detect_retries(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 0)

    def test_different_tools_no_retry(self):
        # A mixed sequence of distinct tools is not a retry run.
        entries = [make_tool_call("exec"), make_tool_call("read"), make_tool_call("write")]
        findings = detect_retries(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 0)
class TestDetectToolFailures(unittest.TestCase):
    """detect_tool_failures reacts to isError flags and error-looking text."""

    def test_detects_is_error(self):
        entries = [make_tool_result("something failed", is_error=True)]
        findings = detect_tool_failures(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertTrue(len(findings) >= 1)

    def test_detects_error_text(self):
        entries = [make_tool_result("Error: command not found")]
        # toolResult role needed
        # NOTE(review): make_tool_result already sets role="toolResult",
        # so this reassignment looks redundant — confirm and drop.
        entries[0]["message"]["role"] = "toolResult"
        findings = detect_tool_failures(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertTrue(len(findings) >= 1)

    def test_no_error(self):
        entries = [make_tool_result("All good")]
        entries[0]["message"]["role"] = "toolResult"
        findings = detect_tool_failures(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 0)
class TestDetectSelfErrors(unittest.TestCase):
    """detect_self_errors spots the assistant apologising for a mistake."""

    def test_detects_sorry(self):
        entries = [make_entry("assistant", "Sorry, I made a mistake there")]
        findings = detect_self_errors(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 1)

    def test_detects_entschuldigung(self):
        # German apologies are matched too.
        entries = [make_entry("assistant", "Entschuldigung, das war falsch")]
        findings = detect_self_errors(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 1)

    def test_no_apology(self):
        entries = [make_entry("assistant", "Here is your answer")]
        findings = detect_self_errors(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 0)
class TestDetectKnowledgeGaps(unittest.TestCase):
    """detect_knowledge_gaps pairs an "I couldn't find" reply with a substantive user answer."""

    def test_detects_gap(self):
        entries = [
            make_entry("assistant", "I couldn't find that information"),
            make_entry("user", "The answer is actually in the config file at /etc/app/config.yaml"),
        ]
        findings = detect_knowledge_gaps(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 1)

    def test_no_gap_short_reply(self):
        # A terse follow-up carries no corrective information -> no gap.
        entries = [
            make_entry("assistant", "I couldn't find it"),
            make_entry("user", "ok"),
        ]
        findings = detect_knowledge_gaps(entries, DEFAULT_CONFIG, "test.jsonl")
        self.assertEqual(len(findings), 0)
class TestFindingToMarkdown(unittest.TestCase):
    """finding_to_markdown renders category label, trigger text, and line span."""

    def test_format(self):
        f = Finding("correction", "User said 'nein'", (10, 12), "test.jsonl")
        md = finding_to_markdown(f, DEFAULT_CONFIG)
        self.assertIn("Auto-detected: User Correction", md)
        self.assertIn("User said 'nein'", md)
        self.assertIn("lines 10-12", md)
class TestDeduplicate(unittest.TestCase):
    """deduplicate_findings collapses findings with identical triggers."""

    def test_removes_dupes(self):
        trigger = "User said nein after agent response"
        duplicates = [
            Finding("correction", trigger, (1, 2), "a.jsonl"),
            Finding("correction", trigger, (5, 6), "a.jsonl"),
        ]
        self.assertEqual(len(deduplicate_findings(duplicates)), 1)
class TestParseJsonl(unittest.TestCase):
    """parse_jsonl reads JSON Lines and silently skips unparseable lines."""

    def _write(self, text):
        """Write *text* to a temp .jsonl file and schedule its removal."""
        with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as f:
            f.write(text)
            f.flush()
        # addCleanup runs even when an assertion fails, so the temp file no
        # longer leaks on failure (the old inline os.unlink only ran on success).
        self.addCleanup(os.unlink, f.name)
        return Path(f.name)

    def test_parses_valid(self):
        result = parse_jsonl(self._write('{"a":1}\n{"b":2}\n'))
        self.assertEqual(len(result), 2)

    def test_skips_bad_lines(self):
        # The malformed middle line is dropped, not fatal.
        result = parse_jsonl(self._write('{"a":1}\nBAD LINE\n{"b":2}\n'))
        self.assertEqual(len(result), 2)
# === Validator Tests ===
|
||||||
|
|
||||||
|
class TestExtractMentionedFiles(unittest.TestCase):
    """extract_mentioned_files finds filenames in backticks and bare mentions."""

    def test_backtick_files(self):
        task = "Create `feedback_loop.py` and `config.json`"
        files = extract_mentioned_files(task)
        self.assertIn("feedback_loop.py", files)
        self.assertIn("config.json", files)

    def test_bare_files(self):
        # Filenames without backticks are picked up as well.
        task = "Write test_selfheal.py with 25 tests"
        files = extract_mentioned_files(task)
        self.assertIn("test_selfheal.py", files)
class TestExtractCreatedFiles(unittest.TestCase):
    """extract_created_files_from_transcript collects paths from Write tool calls."""

    def test_write_calls(self):
        entries = [{"type": "message", "message": {"role": "assistant", "content": [
            {"type": "toolCall", "name": "Write", "arguments": {"path": "/tmp/test.py"}}
        ]}}]
        files = extract_created_files_from_transcript(entries)
        self.assertIn("/tmp/test.py", files)
class TestValidateFileExists(unittest.TestCase):
    """validate_file_exists: present and non-empty passes; missing or empty fails."""

    def test_existing_file(self):
        with tempfile.NamedTemporaryFile(mode="w", delete=False, suffix=".py") as f:
            f.write("print('hi')")
            f.flush()
            ok, detail = validate_file_exists(f.name)
            self.assertTrue(ok)
            os.unlink(f.name)

    def test_missing_file(self):
        ok, _ = validate_file_exists("/tmp/nonexistent_xyz_abc.py")
        self.assertFalse(ok)

    def test_empty_file(self):
        # Nothing written -> zero-byte file must be rejected as "empty".
        with tempfile.NamedTemporaryFile(mode="w", delete=False) as f:
            f.flush()
            ok, detail = validate_file_exists(f.name)
            self.assertFalse(ok)
            self.assertIn("empty", detail)
            os.unlink(f.name)
class TestValidatePythonSyntax(unittest.TestCase):
    """validate_python_syntax accepts valid files and reports syntax errors."""

    def test_valid_python(self):
        with tempfile.NamedTemporaryFile(mode="w", suffix=".py", delete=False) as f:
            f.write("def hello():\n return 42\n")
            f.flush()
            ok, _ = validate_python_syntax(f.name)
            self.assertTrue(ok)
            os.unlink(f.name)

    def test_invalid_python(self):
        # Unclosed paren -> syntax error expected in the detail message.
        with tempfile.NamedTemporaryFile(mode="w", suffix=".py", delete=False) as f:
            f.write("def hello(\n")
            f.flush()
            ok, detail = validate_python_syntax(f.name)
            self.assertFalse(ok)
            self.assertIn("Syntax error", detail)
            os.unlink(f.name)
class TestValidateTypescript(unittest.TestCase):
    """validate_typescript_structure: structural sanity plus an `any`-overuse check."""

    def test_valid_ts(self):
        with tempfile.NamedTemporaryFile(mode="w", suffix=".ts", delete=False) as f:
            f.write("export function hello(): string { return 'hi'; }\n")
            f.flush()
            ok, _ = validate_typescript_structure(f.name)
            self.assertTrue(ok)
            os.unlink(f.name)

    def test_excessive_any(self):
        # 15 `any` annotations should trip the excessive-`any` check.
        with tempfile.NamedTemporaryFile(mode="w", suffix=".ts", delete=False) as f:
            f.write("export " + "const x: any = 1;\n" * 15)
            f.flush()
            ok, detail = validate_typescript_structure(f.name)
            self.assertFalse(ok)
            self.assertIn("any", detail)
            os.unlink(f.name)
class TestCheckTestResults(unittest.TestCase):
    """check_test_results parses pytest summary lines out of tool results."""

    def test_pytest_pass(self):
        entries = [make_tool_result("10 passed in 0.5s")]
        entries[0]["message"]["role"] = "toolResult"
        result = check_test_results(entries)
        self.assertTrue(result["tests_found"])
        self.assertTrue(result["tests_passed"])

    def test_pytest_fail(self):
        # Any failures -> tests_found but not tests_passed.
        entries = [make_tool_result("3 failed, 7 passed")]
        entries[0]["message"]["role"] = "toolResult"
        result = check_test_results(entries)
        self.assertTrue(result["tests_found"])
        self.assertFalse(result["tests_passed"])
class TestValidationReport(unittest.TestCase):
    """ValidationReport pass/fail accounting and JSON export."""

    def test_report_pass(self):
        report = ValidationReport()
        report.add("check1", "pass")
        self.assertTrue(report.ok)
        self.assertEqual(report.passed, 1)

    def test_report_fail(self):
        report = ValidationReport()
        report.add("check1", "fail", "broken")
        self.assertFalse(report.ok)

    def test_to_json(self):
        report = ValidationReport()
        report.add("check1", "pass")
        payload = report.to_json()
        self.assertIn("checks", payload)
        self.assertTrue(payload["ok"])
class TestIntegration(unittest.TestCase):
    """Integration test with a mock session."""

    def test_full_feedback_loop(self):
        # One transcript that should trip every detector category at once:
        # correction, retry (4x exec), self_error (apology), tool_failure.
        entries = [
            {"type": "session", "id": "test-123", "timestamp": "2026-02-08T10:00:00Z"},
            make_entry("assistant", "Here is the file"),
            make_entry("user", "nein, das ist falsch"),
            make_tool_call("exec"),
            make_tool_call("exec"),
            make_tool_call("exec"),
            make_tool_call("exec"),
            make_entry("assistant", "Sorry, I made an error"),
            make_tool_result("Error: permission denied", is_error=True),
        ]
        with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as f:
            write_jsonl(f.name, entries)
            findings = analyze_session(parse_jsonl(Path(f.name)), DEFAULT_CONFIG, f.name)
            os.unlink(f.name)
        categories = {f.category for f in findings}
        self.assertIn("correction", categories)
        self.assertIn("retry", categories)
        self.assertIn("self_error", categories)
        self.assertIn("tool_failure", categories)

    def test_full_validation(self):
        # Create a real file to validate
        with tempfile.NamedTemporaryFile(mode="w", suffix=".py", delete=False) as pyf:
            pyf.write("print('hello')\n")
            pyf.flush()
            py_path = pyf.name

        # Transcript claims the file was written and tests passed.
        entries = [
            {"type": "session", "id": "val-test", "timestamp": "2026-02-08T10:00:00Z"},
            {"type": "message", "message": {"role": "assistant", "content": [
                {"type": "toolCall", "name": "Write", "arguments": {"path": py_path}}
            ]}},
            make_tool_result("25 passed in 1.2s"),
        ]
        with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as f:
            write_jsonl(f.name, entries)
            report = run_validation(Path(f.name), f"Create {py_path} with tests")
            os.unlink(f.name)
            os.unlink(py_path)
        self.assertIsInstance(report, ValidationReport)
        self.assertTrue(report.passed > 0)
class TestAppendToGrowthLog(unittest.TestCase):
    """append_to_growth_log dry-run rendering."""

    def test_dry_run(self):
        finding = Finding("correction", "test trigger", (1, 2), "test.jsonl")
        rendered = append_to_growth_log([finding], DEFAULT_CONFIG, dry_run=True)
        self.assertIn("Auto-detected", rendered)

    def test_empty_findings(self):
        # Nothing to log -> empty string, no output produced.
        self.assertEqual(append_to_growth_log([], DEFAULT_CONFIG, dry_run=True), "")
# Allow running this test module directly (outside a test runner).
if __name__ == "__main__":
    unittest.main()
Loading…
Reference in a new issue