Initial implementation of CheddahBot personal AI assistant
Multi-model AI assistant with Gradio UI, persistent memory, 15+ tools, and meta-tools for runtime tool creation. Routes Claude models through Claude Code SDK (Max subscription), cloud models through OpenRouter, and local models through Ollama/LM Studio. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
commit
1b73cf2e5d
|
|
@ -0,0 +1,10 @@
|
||||||
|
.env
|
||||||
|
__pycache__/
|
||||||
|
*.pyc
|
||||||
|
data/
|
||||||
|
memory/embeddings.db
|
||||||
|
memory/*.md
|
||||||
|
*.egg-info/
|
||||||
|
dist/
|
||||||
|
build/
|
||||||
|
.venv/
|
||||||
|
|
@ -0,0 +1,3 @@
|
||||||
|
"""CheddahBot - Personal AI assistant."""
|
||||||
|
|
||||||
|
__version__ = "0.1.0"
|
||||||
|
|
@ -0,0 +1,77 @@
|
||||||
|
"""Entry point: python -m cheddahbot"""
|
||||||
|
|
||||||
|
import logging
|
||||||
|
import sys
|
||||||
|
|
||||||
|
from .config import load_config
|
||||||
|
from .db import Database
|
||||||
|
from .llm import LLMAdapter
|
||||||
|
from .agent import Agent
|
||||||
|
from .ui import create_ui
|
||||||
|
|
||||||
|
# Configure root logging once for the whole process.
logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s [%(name)s] %(levelname)s: %(message)s",
    datefmt="%H:%M:%S",
)
log = logging.getLogger("cheddahbot")


def main():
    """Boot sequence: config → db → LLM adapter → agent → optional subsystems → UI.

    The memory, tool, and scheduler subsystems are each optional: if their
    import or construction fails, the app still launches with a warning.
    """
    log.info("Loading configuration...")
    config = load_config()

    log.info("Initializing database...")
    db = Database(config.db_path)

    log.info("Initializing LLM adapter (default model: %s)...", config.default_model)
    llm = LLMAdapter(
        default_model=config.default_model,
        openrouter_key=config.openrouter_api_key,
        ollama_url=config.ollama_url,
        lmstudio_url=config.lmstudio_url,
    )

    log.info("Creating agent...")
    agent = Agent(config, db, llm)

    # Phase 2+: memory system (best-effort — degrade gracefully if unavailable).
    try:
        from .memory import MemorySystem
        log.info("Initializing memory system...")
        memory = MemorySystem(config, db)
        agent.set_memory(memory)
    except Exception as e:
        log.warning("Memory system not available: %s", e)

    # Phase 3+: tool system (best-effort).
    try:
        from .tools import ToolRegistry
        log.info("Initializing tool system...")
        tools = ToolRegistry(config, db, agent)
        agent.set_tools(tools)
    except Exception as e:
        log.warning("Tool system not available: %s", e)

    # Phase 3+: scheduler (best-effort). Reference kept alive for its thread.
    try:
        from .scheduler import Scheduler
        log.info("Starting scheduler...")
        scheduler = Scheduler(config, db, agent)
        scheduler.start()
    except Exception as e:
        log.warning("Scheduler not available: %s", e)

    log.info("Launching Gradio UI on %s:%s...", config.host, config.port)
    app, css = create_ui(agent, config, llm)
    app.launch(
        server_name=config.host,
        server_port=config.port,
        pwa=True,
        show_error=True,
        css=css,
    )


if __name__ == "__main__":
    main()
|
||||||
|
|
@ -0,0 +1,134 @@
|
||||||
|
"""Core agent loop - the brain of CheddahBot."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import json
|
||||||
|
import logging
|
||||||
|
import uuid
|
||||||
|
from typing import Generator
|
||||||
|
|
||||||
|
from .config import Config
|
||||||
|
from .db import Database
|
||||||
|
from .llm import LLMAdapter
|
||||||
|
from .router import build_system_prompt, format_messages_for_llm
|
||||||
|
|
||||||
|
log = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
# Hard cap on LLM→tool→LLM round trips per user turn, to prevent runaway loops.
MAX_TOOL_ITERATIONS = 10


class Agent:
    """Core agent loop: persists messages, builds prompts, streams LLM output,
    and dispatches tool calls back into the model until it stops asking."""

    def __init__(self, config: Config, db: Database, llm: LLMAdapter):
        self.config = config
        self.db = db
        self.llm = llm
        self.conv_id: str | None = None   # current conversation id (lazy)
        self._memory = None  # set by app after memory system init
        self._tools = None   # set by app after tool system init

    def set_memory(self, memory):
        """Attach the (optional) memory subsystem after construction."""
        self._memory = memory

    def set_tools(self, tools):
        """Attach the (optional) tool registry after construction."""
        self._tools = tools

    def ensure_conversation(self) -> str:
        """Return the active conversation id, creating one on first use."""
        if not self.conv_id:
            self.conv_id = uuid.uuid4().hex[:12]
            self.db.create_conversation(self.conv_id)
        return self.conv_id

    def new_conversation(self) -> str:
        """Start (and persist) a fresh conversation, replacing the active one."""
        self.conv_id = uuid.uuid4().hex[:12]
        self.db.create_conversation(self.conv_id)
        return self.conv_id

    def respond(self, user_input: str, files: list | None = None) -> Generator[str, None, None]:
        """Process user input and yield streaming response text."""
        conv_id = self.ensure_conversation()

        # Persist the user's turn before doing anything else.
        self.db.add_message(conv_id, "user", user_input)

        # Gather optional context for the system prompt.
        memory_context = ""
        if self._memory:
            memory_context = self._memory.get_context(user_input)

        tools_schema = []
        tools_description = ""
        if self._tools:
            tools_schema = self._tools.get_tools_schema()
            tools_description = self._tools.get_tools_description()

        system_prompt = build_system_prompt(
            identity_dir=self.config.identity_dir,
            memory_context=memory_context,
            tools_description=tools_description,
        )

        # Rehydrate conversation history into LLM message format.
        history = self.db.get_messages(conv_id, limit=self.config.memory.max_context_messages)
        messages = format_messages_for_llm(system_prompt, history, self.config.memory.max_context_messages)

        # Agent loop: LLM call → tool execution → repeat, bounded by MAX_TOOL_ITERATIONS.
        for _turn in range(MAX_TOOL_ITERATIONS):
            reply_text = ""
            pending_calls = []

            for chunk in self.llm.chat(messages, tools=tools_schema or None, stream=True):
                if chunk["type"] == "text":
                    reply_text += chunk["content"]
                    yield chunk["content"]
                elif chunk["type"] == "tool_use":
                    pending_calls.append(chunk)

            # No tool requests → the model is done; persist and stop.
            if not pending_calls:
                if reply_text:
                    self.db.add_message(conv_id, "assistant", reply_text, model=self.llm.current_model)
                break

            # Persist the assistant turn together with its requested tool calls.
            self.db.add_message(
                conv_id, "assistant", reply_text,
                tool_calls=[{"name": tc["name"], "input": tc["input"]} for tc in pending_calls],
                model=self.llm.current_model,
            )

            if self._tools:
                messages.append({"role": "assistant", "content": reply_text or "I'll use some tools to help with that."})

                for tc in pending_calls:
                    yield f"\n\n🔧 **Using tool: {tc['name']}**\n"
                    try:
                        result = self._tools.execute(tc["name"], tc.get("input", {}))
                    except Exception as e:
                        result = f"Tool error: {e}"
                    # Echo a truncated result preview into the stream.
                    yield f"```\n{result[:2000]}\n```\n\n"

                    self.db.add_message(conv_id, "tool", result, tool_result=tc["name"])
                    messages.append({"role": "user", "content": f'[Tool "{tc["name"]}" result]\n{result}'})
            else:
                # No tool system configured - just mention tool was requested
                if reply_text:
                    self.db.add_message(conv_id, "assistant", reply_text, model=self.llm.current_model)
                for tc in pending_calls:
                    yield f"\n(Tool requested: {tc['name']} - tool system not yet initialized)\n"
                break
        else:
            yield "\n(Reached maximum tool iterations)"

        # Let the memory subsystem compact long conversations.
        if self._memory:
            msg_count = self.db.count_messages(conv_id)
            if msg_count > self.config.memory.flush_threshold:
                self._memory.auto_flush(conv_id)

    def respond_to_prompt(self, prompt: str) -> str:
        """Non-streaming response for scheduled tasks / internal use."""
        return "".join(self.respond(prompt))
|
||||||
|
|
@ -0,0 +1,98 @@
|
||||||
|
"""Configuration loader: env vars → config.yaml → defaults."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import os
|
||||||
|
from dataclasses import dataclass, field
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
import yaml
|
||||||
|
from dotenv import load_dotenv
|
||||||
|
|
||||||
|
ROOT_DIR = Path(__file__).resolve().parent.parent
|
||||||
|
load_dotenv(ROOT_DIR / ".env")
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class MemoryConfig:
    """Tuning knobs for the conversation-memory subsystem."""

    max_context_messages: int = 50           # history window handed to the LLM
    flush_threshold: int = 40                # message count that triggers auto-flush
    embedding_model: str = "all-MiniLM-L6-v2"  # sentence-transformers model name
    search_top_k: int = 5                    # results returned by semantic search
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class SchedulerConfig:
    """Timing configuration for the background scheduler."""

    heartbeat_interval_minutes: int = 30  # periodic self-check cadence
    poll_interval_seconds: int = 60       # how often to look for due tasks
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class ShellConfig:
    """Safety settings for the shell-execution tool."""

    # Substring denylist for obviously destructive commands (incl. a fork bomb).
    blocked_commands: list[str] = field(default_factory=lambda: ["rm -rf /", "format", ":(){:|:&};:"])
    require_approval: bool = False  # if True, every command needs user sign-off
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class Config:
    """Top-level application configuration with sane defaults.

    Populated by :func:`load_config` from config.yaml and environment
    variables; path fields are derived from the package ROOT_DIR.
    """

    default_model: str = "claude-sonnet-4-20250514"
    host: str = "0.0.0.0"
    port: int = 7860
    ollama_url: str = "http://localhost:11434"
    lmstudio_url: str = "http://localhost:1234"
    openrouter_api_key: str = ""
    memory: MemoryConfig = field(default_factory=MemoryConfig)
    scheduler: SchedulerConfig = field(default_factory=SchedulerConfig)
    shell: ShellConfig = field(default_factory=ShellConfig)

    # Derived paths (all anchored at the repository root)
    root_dir: Path = field(default_factory=lambda: ROOT_DIR)
    data_dir: Path = field(default_factory=lambda: ROOT_DIR / "data")
    identity_dir: Path = field(default_factory=lambda: ROOT_DIR / "identity")
    memory_dir: Path = field(default_factory=lambda: ROOT_DIR / "memory")
    skills_dir: Path = field(default_factory=lambda: ROOT_DIR / "skills")
    db_path: Path = field(default_factory=lambda: ROOT_DIR / "data" / "cheddahbot.db")
|
||||||
|
|
||||||
|
|
||||||
|
def load_config() -> Config:
    """Load config from env vars → config.yaml → defaults."""
    cfg = Config()

    # Layer 1: optional YAML file at the repo root.
    yaml_path = ROOT_DIR / "config.yaml"
    if yaml_path.exists():
        with open(yaml_path) as f:
            data = yaml.safe_load(f) or {}
        # Scalar top-level overrides.
        for key in ("default_model", "host", "port", "ollama_url", "lmstudio_url"):
            if key in data:
                setattr(cfg, key, data[key])
        # Nested sections map 1:1 onto the sub-config dataclasses;
        # unknown keys are silently ignored via hasattr.
        for section, target in (
            ("memory", cfg.memory),
            ("scheduler", cfg.scheduler),
            ("shell", cfg.shell),
        ):
            block = data.get(section)
            if isinstance(block, dict):
                for k, v in block.items():
                    if hasattr(target, k):
                        setattr(target, k, v)

    # Layer 2: environment variables (CHEDDAH_ prefix) win over YAML.
    cfg.openrouter_api_key = os.getenv("OPENROUTER_API_KEY", "")
    if m := os.getenv("CHEDDAH_DEFAULT_MODEL"):
        cfg.default_model = m
    if h := os.getenv("CHEDDAH_HOST"):
        cfg.host = h
    if p := os.getenv("CHEDDAH_PORT"):
        cfg.port = int(p)

    # Ensure data directories exist before anything tries to write to them.
    cfg.data_dir.mkdir(parents=True, exist_ok=True)
    (cfg.data_dir / "uploads").mkdir(exist_ok=True)
    (cfg.data_dir / "generated").mkdir(exist_ok=True)
    cfg.memory_dir.mkdir(parents=True, exist_ok=True)
    cfg.skills_dir.mkdir(parents=True, exist_ok=True)

    return cfg
|
||||||
|
|
@ -0,0 +1,187 @@
|
||||||
|
"""SQLite persistence layer."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import json
|
||||||
|
import sqlite3
|
||||||
|
import threading
|
||||||
|
from datetime import datetime, timezone
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
|
||||||
|
class Database:
|
||||||
|
def __init__(self, db_path: Path):
|
||||||
|
self._path = db_path
|
||||||
|
self._local = threading.local()
|
||||||
|
self._init_schema()
|
||||||
|
|
||||||
|
@property
|
||||||
|
def _conn(self) -> sqlite3.Connection:
|
||||||
|
if not hasattr(self._local, "conn"):
|
||||||
|
self._local.conn = sqlite3.connect(str(self._path))
|
||||||
|
self._local.conn.row_factory = sqlite3.Row
|
||||||
|
self._local.conn.execute("PRAGMA journal_mode=WAL")
|
||||||
|
self._local.conn.execute("PRAGMA foreign_keys=ON")
|
||||||
|
return self._local.conn
|
||||||
|
|
||||||
|
def _init_schema(self):
|
||||||
|
self._conn.executescript("""
|
||||||
|
CREATE TABLE IF NOT EXISTS conversations (
|
||||||
|
id TEXT PRIMARY KEY,
|
||||||
|
title TEXT,
|
||||||
|
created_at TEXT NOT NULL,
|
||||||
|
updated_at TEXT NOT NULL
|
||||||
|
);
|
||||||
|
CREATE TABLE IF NOT EXISTS messages (
|
||||||
|
id INTEGER PRIMARY KEY AUTOINCREMENT,
|
||||||
|
conv_id TEXT NOT NULL REFERENCES conversations(id),
|
||||||
|
role TEXT NOT NULL,
|
||||||
|
content TEXT NOT NULL,
|
||||||
|
tool_calls TEXT,
|
||||||
|
tool_result TEXT,
|
||||||
|
model TEXT,
|
||||||
|
created_at TEXT NOT NULL
|
||||||
|
);
|
||||||
|
CREATE INDEX IF NOT EXISTS idx_messages_conv ON messages(conv_id, created_at);
|
||||||
|
|
||||||
|
CREATE TABLE IF NOT EXISTS scheduled_tasks (
|
||||||
|
id INTEGER PRIMARY KEY AUTOINCREMENT,
|
||||||
|
name TEXT NOT NULL,
|
||||||
|
prompt TEXT NOT NULL,
|
||||||
|
schedule TEXT NOT NULL,
|
||||||
|
enabled INTEGER NOT NULL DEFAULT 1,
|
||||||
|
next_run TEXT,
|
||||||
|
created_at TEXT NOT NULL
|
||||||
|
);
|
||||||
|
CREATE TABLE IF NOT EXISTS task_run_logs (
|
||||||
|
id INTEGER PRIMARY KEY AUTOINCREMENT,
|
||||||
|
task_id INTEGER NOT NULL REFERENCES scheduled_tasks(id),
|
||||||
|
started_at TEXT NOT NULL,
|
||||||
|
finished_at TEXT,
|
||||||
|
result TEXT,
|
||||||
|
error TEXT
|
||||||
|
);
|
||||||
|
CREATE TABLE IF NOT EXISTS kv_store (
|
||||||
|
key TEXT PRIMARY KEY,
|
||||||
|
value TEXT NOT NULL
|
||||||
|
);
|
||||||
|
""")
|
||||||
|
self._conn.commit()
|
||||||
|
|
||||||
|
# -- Conversations --
|
||||||
|
|
||||||
|
def create_conversation(self, conv_id: str, title: str = "New Chat") -> str:
|
||||||
|
now = _now()
|
||||||
|
self._conn.execute(
|
||||||
|
"INSERT INTO conversations (id, title, created_at, updated_at) VALUES (?, ?, ?, ?)",
|
||||||
|
(conv_id, title, now, now),
|
||||||
|
)
|
||||||
|
self._conn.commit()
|
||||||
|
return conv_id
|
||||||
|
|
||||||
|
def list_conversations(self, limit: int = 50) -> list[dict]:
|
||||||
|
rows = self._conn.execute(
|
||||||
|
"SELECT id, title, updated_at FROM conversations ORDER BY updated_at DESC LIMIT ?",
|
||||||
|
(limit,),
|
||||||
|
).fetchall()
|
||||||
|
return [dict(r) for r in rows]
|
||||||
|
|
||||||
|
# -- Messages --
|
||||||
|
|
||||||
|
def add_message(
|
||||||
|
self,
|
||||||
|
conv_id: str,
|
||||||
|
role: str,
|
||||||
|
content: str,
|
||||||
|
tool_calls: list | None = None,
|
||||||
|
tool_result: str | None = None,
|
||||||
|
model: str | None = None,
|
||||||
|
) -> int:
|
||||||
|
now = _now()
|
||||||
|
cur = self._conn.execute(
|
||||||
|
"""INSERT INTO messages (conv_id, role, content, tool_calls, tool_result, model, created_at)
|
||||||
|
VALUES (?, ?, ?, ?, ?, ?, ?)""",
|
||||||
|
(
|
||||||
|
conv_id,
|
||||||
|
role,
|
||||||
|
content,
|
||||||
|
json.dumps(tool_calls) if tool_calls else None,
|
||||||
|
tool_result,
|
||||||
|
model,
|
||||||
|
now,
|
||||||
|
),
|
||||||
|
)
|
||||||
|
self._conn.execute(
|
||||||
|
"UPDATE conversations SET updated_at = ? WHERE id = ?", (now, conv_id)
|
||||||
|
)
|
||||||
|
self._conn.commit()
|
||||||
|
return cur.lastrowid
|
||||||
|
|
||||||
|
def get_messages(self, conv_id: str, limit: int = 100) -> list[dict]:
|
||||||
|
rows = self._conn.execute(
|
||||||
|
"""SELECT role, content, tool_calls, tool_result, model, created_at
|
||||||
|
FROM messages WHERE conv_id = ? ORDER BY created_at ASC LIMIT ?""",
|
||||||
|
(conv_id, limit),
|
||||||
|
).fetchall()
|
||||||
|
result = []
|
||||||
|
for r in rows:
|
||||||
|
msg = dict(r)
|
||||||
|
if msg["tool_calls"]:
|
||||||
|
msg["tool_calls"] = json.loads(msg["tool_calls"])
|
||||||
|
result.append(msg)
|
||||||
|
return result
|
||||||
|
|
||||||
|
def count_messages(self, conv_id: str) -> int:
|
||||||
|
row = self._conn.execute(
|
||||||
|
"SELECT COUNT(*) as cnt FROM messages WHERE conv_id = ?", (conv_id,)
|
||||||
|
).fetchone()
|
||||||
|
return row["cnt"]
|
||||||
|
|
||||||
|
# -- Scheduled Tasks --
|
||||||
|
|
||||||
|
def add_scheduled_task(self, name: str, prompt: str, schedule: str) -> int:
|
||||||
|
now = _now()
|
||||||
|
cur = self._conn.execute(
|
||||||
|
"INSERT INTO scheduled_tasks (name, prompt, schedule, created_at) VALUES (?, ?, ?, ?)",
|
||||||
|
(name, prompt, schedule, now),
|
||||||
|
)
|
||||||
|
self._conn.commit()
|
||||||
|
return cur.lastrowid
|
||||||
|
|
||||||
|
def get_due_tasks(self) -> list[dict]:
|
||||||
|
now = _now()
|
||||||
|
rows = self._conn.execute(
|
||||||
|
"SELECT * FROM scheduled_tasks WHERE enabled = 1 AND (next_run IS NULL OR next_run <= ?)",
|
||||||
|
(now,),
|
||||||
|
).fetchall()
|
||||||
|
return [dict(r) for r in rows]
|
||||||
|
|
||||||
|
def update_task_next_run(self, task_id: int, next_run: str):
|
||||||
|
self._conn.execute(
|
||||||
|
"UPDATE scheduled_tasks SET next_run = ? WHERE id = ?", (next_run, task_id)
|
||||||
|
)
|
||||||
|
self._conn.commit()
|
||||||
|
|
||||||
|
def log_task_run(self, task_id: int, result: str | None = None, error: str | None = None):
|
||||||
|
now = _now()
|
||||||
|
self._conn.execute(
|
||||||
|
"INSERT INTO task_run_logs (task_id, started_at, finished_at, result, error) VALUES (?, ?, ?, ?, ?)",
|
||||||
|
(task_id, now, now, result, error),
|
||||||
|
)
|
||||||
|
self._conn.commit()
|
||||||
|
|
||||||
|
# -- Key-Value Store --
|
||||||
|
|
||||||
|
def kv_set(self, key: str, value: str):
|
||||||
|
self._conn.execute(
|
||||||
|
"INSERT OR REPLACE INTO kv_store (key, value) VALUES (?, ?)", (key, value)
|
||||||
|
)
|
||||||
|
self._conn.commit()
|
||||||
|
|
||||||
|
def kv_get(self, key: str) -> str | None:
|
||||||
|
row = self._conn.execute("SELECT value FROM kv_store WHERE key = ?", (key,)).fetchone()
|
||||||
|
return row["value"] if row else None
|
||||||
|
|
||||||
|
|
||||||
|
def _now() -> str:
|
||||||
|
return datetime.now(timezone.utc).isoformat()
|
||||||
|
|
@ -0,0 +1,334 @@
|
||||||
|
"""Model-agnostic LLM adapter.
|
||||||
|
|
||||||
|
Routing:
|
||||||
|
- Claude models → Claude Code SDK (subprocess, uses Max subscription)
|
||||||
|
- Cloud models → OpenRouter (single API key, OpenAI-compatible)
|
||||||
|
- Local models → direct HTTP (Ollama / LM Studio, OpenAI-compatible)
|
||||||
|
"""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import json
|
||||||
|
import logging
|
||||||
|
import os
|
||||||
|
import shutil
|
||||||
|
import subprocess
|
||||||
|
import sys
|
||||||
|
from dataclasses import dataclass
|
||||||
|
from typing import Generator
|
||||||
|
|
||||||
|
import httpx
|
||||||
|
|
||||||
|
log = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class ModelInfo:
|
||||||
|
id: str
|
||||||
|
name: str
|
||||||
|
provider: str # "claude" | "openrouter" | "ollama" | "lmstudio"
|
||||||
|
context_length: int | None = None
|
||||||
|
|
||||||
|
|
||||||
|
# Well-known Claude models that route through the SDK
|
||||||
|
CLAUDE_MODELS = {
|
||||||
|
"claude-sonnet-4-20250514",
|
||||||
|
"claude-opus-4-20250514",
|
||||||
|
"claude-haiku-4-20250514",
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
def _is_claude_model(model_id: str) -> bool:
|
||||||
|
return model_id in CLAUDE_MODELS or model_id.startswith("claude-")
|
||||||
|
|
||||||
|
|
||||||
|
def _provider_for(model_id: str, openrouter_key: str, ollama_url: str, lmstudio_url: str) -> str:
|
||||||
|
if _is_claude_model(model_id):
|
||||||
|
return "claude"
|
||||||
|
if model_id.startswith("local/ollama/"):
|
||||||
|
return "ollama"
|
||||||
|
if model_id.startswith("local/lmstudio/"):
|
||||||
|
return "lmstudio"
|
||||||
|
if openrouter_key:
|
||||||
|
return "openrouter"
|
||||||
|
return "openrouter"
|
||||||
|
|
||||||
|
|
||||||
|
class LLMAdapter:
|
||||||
|
def __init__(
|
||||||
|
self,
|
||||||
|
default_model: str = "claude-sonnet-4-20250514",
|
||||||
|
openrouter_key: str = "",
|
||||||
|
ollama_url: str = "http://localhost:11434",
|
||||||
|
lmstudio_url: str = "http://localhost:1234",
|
||||||
|
):
|
||||||
|
self.current_model = default_model
|
||||||
|
self.openrouter_key = openrouter_key
|
||||||
|
self.ollama_url = ollama_url.rstrip("/")
|
||||||
|
self.lmstudio_url = lmstudio_url.rstrip("/")
|
||||||
|
self._openai_mod = None # lazy import
|
||||||
|
|
||||||
|
@property
|
||||||
|
def provider(self) -> str:
|
||||||
|
return _provider_for(self.current_model, self.openrouter_key, self.ollama_url, self.lmstudio_url)
|
||||||
|
|
||||||
|
def switch_model(self, model_id: str):
|
||||||
|
self.current_model = model_id
|
||||||
|
log.info("Switched to model: %s (provider: %s)", model_id, self.provider)
|
||||||
|
|
||||||
|
# ── Main entry point ──
|
||||||
|
|
||||||
|
def chat(
|
||||||
|
self,
|
||||||
|
messages: list[dict],
|
||||||
|
tools: list[dict] | None = None,
|
||||||
|
stream: bool = True,
|
||||||
|
) -> Generator[dict, None, None]:
|
||||||
|
"""Yield chunks: {"type": "text", "content": "..."} or {"type": "tool_use", ...}."""
|
||||||
|
provider = self.provider
|
||||||
|
if provider == "claude":
|
||||||
|
yield from self._chat_claude_sdk(messages, tools, stream)
|
||||||
|
else:
|
||||||
|
base_url, api_key = self._resolve_endpoint(provider)
|
||||||
|
model_id = self._resolve_model_id(provider)
|
||||||
|
yield from self._chat_openai_sdk(messages, tools, stream, base_url, api_key, model_id)
|
||||||
|
|
||||||
|
# ── Claude Code SDK (subprocess) ──
|
||||||
|
|
||||||
|
def _chat_claude_sdk(
|
||||||
|
self, messages: list[dict], tools: list[dict] | None, stream: bool
|
||||||
|
) -> Generator[dict, None, None]:
|
||||||
|
# Separate system prompt from user messages
|
||||||
|
system_prompt = ""
|
||||||
|
user_prompt_parts = []
|
||||||
|
for m in messages:
|
||||||
|
role = m.get("role", "user")
|
||||||
|
content = m.get("content", "")
|
||||||
|
if isinstance(content, list):
|
||||||
|
content = " ".join(c.get("text", "") for c in content if c.get("type") == "text")
|
||||||
|
if role == "system":
|
||||||
|
system_prompt += content + "\n"
|
||||||
|
elif role == "assistant":
|
||||||
|
user_prompt_parts.append(f"[Assistant]\n{content}")
|
||||||
|
else:
|
||||||
|
user_prompt_parts.append(content)
|
||||||
|
user_prompt = "\n\n".join(user_prompt_parts)
|
||||||
|
|
||||||
|
# Find claude CLI - on Windows needs .cmd extension for npm-installed binaries
|
||||||
|
claude_bin = shutil.which("claude")
|
||||||
|
if not claude_bin:
|
||||||
|
yield {"type": "text", "content": "Error: `claude` CLI not found in PATH. Install Claude Code: npm install -g @anthropic-ai/claude-code"}
|
||||||
|
return
|
||||||
|
|
||||||
|
cmd = [claude_bin, "-p", user_prompt, "--model", self.current_model,
|
||||||
|
"--output-format", "json", "--tools", ""]
|
||||||
|
if system_prompt.strip():
|
||||||
|
cmd.extend(["--system-prompt", system_prompt.strip()])
|
||||||
|
log.debug("Claude SDK using: %s", claude_bin)
|
||||||
|
|
||||||
|
# Strip CLAUDECODE env var so the subprocess doesn't think it's nested
|
||||||
|
env = {k: v for k, v in os.environ.items() if k != "CLAUDECODE"}
|
||||||
|
|
||||||
|
try:
|
||||||
|
proc = subprocess.Popen(
|
||||||
|
cmd,
|
||||||
|
stdout=subprocess.PIPE,
|
||||||
|
stderr=subprocess.PIPE,
|
||||||
|
text=True,
|
||||||
|
encoding="utf-8",
|
||||||
|
shell=(sys.platform == "win32"),
|
||||||
|
env=env,
|
||||||
|
)
|
||||||
|
except FileNotFoundError:
|
||||||
|
yield {"type": "text", "content": "Error: `claude` CLI not found. Install Claude Code: npm install -g @anthropic-ai/claude-code"}
|
||||||
|
return
|
||||||
|
|
||||||
|
stdout, stderr = proc.communicate(timeout=120)
|
||||||
|
|
||||||
|
if proc.returncode != 0:
|
||||||
|
yield {"type": "text", "content": f"Claude SDK error: {stderr or 'unknown error'}"}
|
||||||
|
return
|
||||||
|
|
||||||
|
# --output-format json returns a single JSON object
|
||||||
|
try:
|
||||||
|
result = json.loads(stdout)
|
||||||
|
text = result.get("result", "")
|
||||||
|
if text:
|
||||||
|
yield {"type": "text", "content": text}
|
||||||
|
elif result.get("is_error"):
|
||||||
|
yield {"type": "text", "content": f"Claude error: {result.get('result', 'unknown')}"}
|
||||||
|
return
|
||||||
|
except json.JSONDecodeError:
|
||||||
|
# Fallback: treat as plain text
|
||||||
|
if stdout.strip():
|
||||||
|
yield {"type": "text", "content": stdout.strip()}
|
||||||
|
|
||||||
|
# ── OpenAI-compatible SDK (OpenRouter / Ollama / LM Studio) ──
|
||||||
|
|
||||||
|
def _chat_openai_sdk(
|
||||||
|
self,
|
||||||
|
messages: list[dict],
|
||||||
|
tools: list[dict] | None,
|
||||||
|
stream: bool,
|
||||||
|
base_url: str,
|
||||||
|
api_key: str,
|
||||||
|
model_id: str,
|
||||||
|
) -> Generator[dict, None, None]:
|
||||||
|
openai = self._get_openai()
|
||||||
|
client = openai.OpenAI(base_url=base_url, api_key=api_key)
|
||||||
|
|
||||||
|
kwargs: dict = {
|
||||||
|
"model": model_id,
|
||||||
|
"messages": messages,
|
||||||
|
"stream": stream,
|
||||||
|
}
|
||||||
|
if tools:
|
||||||
|
kwargs["tools"] = tools
|
||||||
|
|
||||||
|
try:
|
||||||
|
if stream:
|
||||||
|
response = client.chat.completions.create(**kwargs)
|
||||||
|
tool_calls_accum: dict[int, dict] = {}
|
||||||
|
for chunk in response:
|
||||||
|
delta = chunk.choices[0].delta if chunk.choices else None
|
||||||
|
if not delta:
|
||||||
|
continue
|
||||||
|
if delta.content:
|
||||||
|
yield {"type": "text", "content": delta.content}
|
||||||
|
if delta.tool_calls:
|
||||||
|
for tc in delta.tool_calls:
|
||||||
|
idx = tc.index
|
||||||
|
if idx not in tool_calls_accum:
|
||||||
|
tool_calls_accum[idx] = {
|
||||||
|
"id": tc.id or "",
|
||||||
|
"name": tc.function.name if tc.function and tc.function.name else "",
|
||||||
|
"arguments": "",
|
||||||
|
}
|
||||||
|
if tc.function and tc.function.arguments:
|
||||||
|
tool_calls_accum[idx]["arguments"] += tc.function.arguments
|
||||||
|
if tc.id:
|
||||||
|
tool_calls_accum[idx]["id"] = tc.id
|
||||||
|
|
||||||
|
for _, tc in sorted(tool_calls_accum.items()):
|
||||||
|
try:
|
||||||
|
args = json.loads(tc["arguments"])
|
||||||
|
except json.JSONDecodeError:
|
||||||
|
args = {}
|
||||||
|
yield {
|
||||||
|
"type": "tool_use",
|
||||||
|
"id": tc["id"],
|
||||||
|
"name": tc["name"],
|
||||||
|
"input": args,
|
||||||
|
}
|
||||||
|
else:
|
||||||
|
response = client.chat.completions.create(**kwargs)
|
||||||
|
msg = response.choices[0].message
|
||||||
|
if msg.content:
|
||||||
|
yield {"type": "text", "content": msg.content}
|
||||||
|
if msg.tool_calls:
|
||||||
|
for tc in msg.tool_calls:
|
||||||
|
try:
|
||||||
|
args = json.loads(tc.function.arguments)
|
||||||
|
except json.JSONDecodeError:
|
||||||
|
args = {}
|
||||||
|
yield {
|
||||||
|
"type": "tool_use",
|
||||||
|
"id": tc.id,
|
||||||
|
"name": tc.function.name,
|
||||||
|
"input": args,
|
||||||
|
}
|
||||||
|
except Exception as e:
|
||||||
|
yield {"type": "text", "content": f"LLM error ({self.provider}): {e}"}
|
||||||
|
|
||||||
|
# ── Helpers ──
|
||||||
|
|
||||||
|
def _resolve_endpoint(self, provider: str) -> tuple[str, str]:
|
||||||
|
if provider == "openrouter":
|
||||||
|
return "https://openrouter.ai/api/v1", self.openrouter_key or "sk-placeholder"
|
||||||
|
elif provider == "ollama":
|
||||||
|
return f"{self.ollama_url}/v1", "ollama"
|
||||||
|
elif provider == "lmstudio":
|
||||||
|
return f"{self.lmstudio_url}/v1", "lm-studio"
|
||||||
|
return "https://openrouter.ai/api/v1", self.openrouter_key or "sk-placeholder"
|
||||||
|
|
||||||
|
def _resolve_model_id(self, provider: str) -> str:
|
||||||
|
model = self.current_model
|
||||||
|
if provider == "ollama" and model.startswith("local/ollama/"):
|
||||||
|
return model.removeprefix("local/ollama/")
|
||||||
|
if provider == "lmstudio" and model.startswith("local/lmstudio/"):
|
||||||
|
return model.removeprefix("local/lmstudio/")
|
||||||
|
return model
|
||||||
|
|
||||||
|
def _messages_to_prompt(self, messages: list[dict]) -> str:
|
||||||
|
"""Flatten messages into a single prompt string for Claude SDK -p flag."""
|
||||||
|
parts = []
|
||||||
|
for m in messages:
|
||||||
|
role = m.get("role", "user")
|
||||||
|
content = m.get("content", "")
|
||||||
|
if isinstance(content, list):
|
||||||
|
# multimodal - extract text parts
|
||||||
|
content = " ".join(
|
||||||
|
c.get("text", "") for c in content if c.get("type") == "text"
|
||||||
|
)
|
||||||
|
if role == "system":
|
||||||
|
parts.append(f"[System]\n{content}")
|
||||||
|
elif role == "assistant":
|
||||||
|
parts.append(f"[Assistant]\n{content}")
|
||||||
|
else:
|
||||||
|
parts.append(content)
|
||||||
|
return "\n\n".join(parts)
|
||||||
|
|
||||||
|
def _get_openai(self):
|
||||||
|
if self._openai_mod is None:
|
||||||
|
import openai
|
||||||
|
self._openai_mod = openai
|
||||||
|
return self._openai_mod
|
||||||
|
|
||||||
|
# ── Model Discovery ──
|
||||||
|
|
||||||
|
def discover_local_models(self) -> list[ModelInfo]:
|
||||||
|
models = []
|
||||||
|
# Ollama
|
||||||
|
try:
|
||||||
|
r = httpx.get(f"{self.ollama_url}/api/tags", timeout=3)
|
||||||
|
if r.status_code == 200:
|
||||||
|
for m in r.json().get("models", []):
|
||||||
|
models.append(ModelInfo(
|
||||||
|
id=f"local/ollama/{m['name']}",
|
||||||
|
name=f"[Ollama] {m['name']}",
|
||||||
|
provider="ollama",
|
||||||
|
))
|
||||||
|
except Exception:
|
||||||
|
pass
|
||||||
|
# LM Studio
|
||||||
|
try:
|
||||||
|
r = httpx.get(f"{self.lmstudio_url}/v1/models", timeout=3)
|
||||||
|
if r.status_code == 200:
|
||||||
|
for m in r.json().get("data", []):
|
||||||
|
models.append(ModelInfo(
|
||||||
|
id=f"local/lmstudio/{m['id']}",
|
||||||
|
name=f"[LM Studio] {m['id']}",
|
||||||
|
provider="lmstudio",
|
||||||
|
))
|
||||||
|
except Exception:
|
||||||
|
pass
|
||||||
|
return models
|
||||||
|
|
||||||
|
def list_available_models(self) -> list[ModelInfo]:
    """Return all available models across all providers."""
    # Claude models are always offered.
    models = [
        ModelInfo("claude-sonnet-4-20250514", "Claude Sonnet 4", "claude"),
        ModelInfo("claude-opus-4-20250514", "Claude Opus 4", "claude"),
        ModelInfo("claude-haiku-4-20250514", "Claude Haiku 4", "claude"),
    ]

    # Cloud models are only listed when an OpenRouter key is configured.
    if self.openrouter_key:
        cloud = [
            ("openai/gpt-4o", "GPT-4o"),
            ("openai/gpt-4o-mini", "GPT-4o Mini"),
            ("google/gemini-2.0-flash-001", "Gemini 2.0 Flash"),
            ("google/gemini-2.5-pro-preview", "Gemini 2.5 Pro"),
            ("mistralai/mistral-large", "Mistral Large"),
            ("meta-llama/llama-3.3-70b-instruct", "Llama 3.3 70B"),
        ]
        models.extend(ModelInfo(model_id, label, "openrouter") for model_id, label in cloud)

    # Whatever Ollama / LM Studio are currently serving.
    models.extend(self.discover_local_models())
    return models
|
||||||
|
|
@ -0,0 +1,115 @@
|
||||||
|
"""Audio/video processing: STT, TTS, video frame extraction."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import asyncio
|
||||||
|
import logging
|
||||||
|
import subprocess
|
||||||
|
import tempfile
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
log = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
|
||||||
|
# ── Speech-to-Text ──
|
||||||
|
|
||||||
|
def transcribe_audio(audio_path: str | Path) -> str:
    """Transcribe an audio file to text.

    Prefers a locally-installed whisper model (no API key needed), then falls
    back to the hosted OpenAI Whisper API, and finally to a placeholder
    message. A missing file yields "".
    """
    path = Path(audio_path)
    if not path.exists():
        return ""

    # Strategy 1: local whisper (no API key needed).
    try:
        return _transcribe_local(path)
    except ImportError:
        pass  # whisper not installed — fall through quietly
    except Exception as e:
        log.warning("Local whisper failed: %s", e)

    # Strategy 2: hosted Whisper API.
    try:
        return _transcribe_openai_api(path)
    except Exception as e:
        log.warning("OpenAI whisper API failed: %s", e)

    return f"(Could not transcribe audio from {path.name})"
|
||||||
|
|
||||||
|
|
||||||
|
def _transcribe_local(audio_path: Path) -> str:
    """Run OpenAI's local whisper model ("base") over the file and return text."""
    import whisper

    transcription = whisper.load_model("base").transcribe(str(audio_path))
    return transcription.get("text", "").strip()
|
||||||
|
|
||||||
|
|
||||||
|
def _transcribe_openai_api(audio_path: Path) -> str:
    """Send the file to the hosted Whisper API ("whisper-1") and return text.

    Raises ValueError when no API key is configured.
    """
    import os

    import openai

    # NOTE(review): OPENROUTER_API_KEY is accepted as a fallback here, but the
    # client targets the default OpenAI base URL — confirm this is intended.
    key = os.getenv("OPENAI_API_KEY") or os.getenv("OPENROUTER_API_KEY")
    if not key:
        raise ValueError("No API key for Whisper")

    client = openai.OpenAI(api_key=key)
    with open(audio_path, "rb") as audio_file:
        response = client.audio.transcriptions.create(model="whisper-1", file=audio_file)
    return response.text.strip()
|
||||||
|
|
||||||
|
|
||||||
|
# ── Text-to-Speech ──
|
||||||
|
|
||||||
|
def text_to_speech(text: str, output_path: str | Path | None = None, voice: str = "en-US-AriaNeural") -> Path:
    """Convert text to speech using edge-tts (free, no API key).

    Args:
        text: The text to speak.
        output_path: Destination file; a unique temp .mp3 is created when omitted.
        voice: edge-tts voice name.

    Returns:
        Path to the written file. If edge-tts is not installed, the file
        contains a plain-text placeholder instead of audio.
    """
    if output_path is None:
        # NamedTemporaryFile instead of the deprecated tempfile.mktemp():
        # mktemp only returns a name, which is race-prone (another process can
        # claim the path first); this creates the file atomically.
        tmp = tempfile.NamedTemporaryFile(suffix=".mp3", delete=False)
        tmp.close()
        output_path = Path(tmp.name)
    else:
        output_path = Path(output_path)

    try:
        import edge_tts

        async def _generate():
            communicate = edge_tts.Communicate(text, voice)
            await communicate.save(str(output_path))

        asyncio.run(_generate())
        return output_path
    except ImportError:
        log.warning("edge-tts not installed. Run: pip install edge-tts")
        # Write a placeholder so callers still get a readable file back.
        output_path.write_text("TTS not available", encoding="utf-8")
        return output_path
|
||||||
|
|
||||||
|
|
||||||
|
# ── Video Frame Extraction ──
|
||||||
|
|
||||||
|
def extract_video_frames(video_path: str | Path, max_frames: int = 5) -> list[Path]:
    """Sample up to *max_frames* evenly-spaced JPEG frames from a video with ffmpeg.

    Returns [] when the file is missing, ffmpeg/ffprobe are unavailable, or
    extraction fails for any other reason.
    """
    video_path = Path(video_path)
    if not video_path.exists():
        return []

    output_dir = Path(tempfile.mkdtemp(prefix="cheddah_frames_"))

    try:
        # Probe the duration so frames can be spread across the whole clip.
        probe = subprocess.run(
            ["ffprobe", "-v", "error", "-show_entries", "format=duration",
             "-of", "default=noprint_wrappers=1:nokey=1", str(video_path)],
            capture_output=True, text=True, timeout=10,
        )
        raw_duration = probe.stdout.strip()
        duration = float(raw_duration) if raw_duration else 10.0
        # At least 1s between frames; max_frames + 1 intervals spreads them out.
        interval = max(duration / (max_frames + 1), 1.0)

        subprocess.run(
            ["ffmpeg", "-i", str(video_path), "-vf", f"fps=1/{interval}",
             "-frames:v", str(max_frames), str(output_dir / "frame_%03d.jpg")],
            capture_output=True, timeout=30,
        )

        return sorted(output_dir.glob("frame_*.jpg"))
    except FileNotFoundError:
        log.warning("ffmpeg/ffprobe not found. Video analysis requires ffmpeg.")
        return []
    except Exception as e:
        log.warning("Video frame extraction failed: %s", e)
        return []
|
||||||
|
|
@ -0,0 +1,231 @@
|
||||||
|
"""4-layer memory system.
|
||||||
|
|
||||||
|
Layers:
|
||||||
|
1. Identity - SOUL.md + USER.md (handled by router.py)
|
||||||
|
2. Long-term - memory/MEMORY.md (learned facts, decisions)
|
||||||
|
3. Daily logs - memory/YYYY-MM-DD.md (timestamped entries)
|
||||||
|
4. Semantic - memory/embeddings.db (vector search over all memory)
|
||||||
|
"""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import logging
|
||||||
|
import sqlite3
|
||||||
|
import threading
|
||||||
|
from datetime import datetime, timezone
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
import numpy as np
|
||||||
|
|
||||||
|
from .config import Config
|
||||||
|
from .db import Database
|
||||||
|
|
||||||
|
log = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
|
||||||
|
class MemorySystem:
    """Layers 2-4 of the memory stack: long-term notes (MEMORY.md), daily
    logs (YYYY-MM-DD.md), and a semantic vector index (embeddings.db).

    Layer 1 (identity files SOUL.md/USER.md) is handled by router.py.
    """

    def __init__(self, config: Config, db: Database):
        self.config = config
        self.db = db
        self.memory_dir = config.memory_dir
        self._embedder = None  # lazily-loaded sentence-transformers model
        self._embed_lock = threading.Lock()
        self._embed_db_path = self.memory_dir / "embeddings.db"
        # The directory must exist before sqlite can create the DB file in it;
        # on a fresh install nothing guarantees it has been created yet.
        self.memory_dir.mkdir(parents=True, exist_ok=True)
        self._init_embed_db()

    # ── Public API ──

    def get_context(self, query: str) -> str:
        """Build the memory context string for the system prompt.

        Combines the long-term memory tail, today's log tail, and (when a
        query is given) semantic search hits. Empty sections are omitted.
        """
        parts = []

        # Long-term memory
        lt = self._read_long_term()
        if lt:
            parts.append(f"## Long-Term Memory\n{lt}")

        # Today's log
        today_log = self._read_daily_log()
        if today_log:
            parts.append(f"## Today's Log\n{today_log}")

        # Semantic search results
        if query:
            results = self.search(query, top_k=self.config.memory.search_top_k)
            if results:
                formatted = "\n".join(f"- {r['text']}" for r in results)
                parts.append(f"## Related Memories\n{formatted}")

        return "\n\n".join(parts) if parts else ""

    def remember(self, text: str):
        """Append a fact/instruction to MEMORY.md and index it for search."""
        memory_path = self.memory_dir / "MEMORY.md"
        timestamp = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M")
        entry = f"\n- [{timestamp}] {text}\n"

        if memory_path.exists():
            content = memory_path.read_text(encoding="utf-8")
        else:
            content = "# Long-Term Memory\n"

        content += entry
        memory_path.write_text(content, encoding="utf-8")
        self._index_text(text, f"memory:long_term:{timestamp}")
        log.info("Saved to long-term memory: %s", text[:80])

    def log_daily(self, text: str):
        """Append a timestamped entry to today's daily log and index it."""
        today = datetime.now(timezone.utc).strftime("%Y-%m-%d")
        log_path = self.memory_dir / f"{today}.md"
        timestamp = datetime.now(timezone.utc).strftime("%H:%M")

        if log_path.exists():
            content = log_path.read_text(encoding="utf-8")
        else:
            content = f"# Daily Log - {today}\n"

        content += f"\n- [{timestamp}] {text}\n"
        log_path.write_text(content, encoding="utf-8")
        self._index_text(text, f"daily:{today}:{timestamp}")

    def search(self, query: str, top_k: int = 5) -> list[dict]:
        """Semantic search over all indexed memory.

        Falls back to plain keyword search when no embedding model can be
        loaded. Returns dicts with keys "id", "text", "score".
        """
        embedder = self._get_embedder()
        if embedder is None:
            return self._fallback_search(query, top_k)

        query_vec = embedder.encode([query])[0]
        return self._vector_search(query_vec, top_k)

    def auto_flush(self, conv_id: str):
        """Summarize old conversation messages and move them to the daily log."""
        messages = self.db.get_messages(conv_id, limit=200)
        if len(messages) < self.config.memory.flush_threshold:
            return

        # Summarize the older portion; the last 10 stay in live context.
        to_summarize = messages[:-10]
        text_block = "\n".join(
            f"{m['role']}: {m['content'][:200]}" for m in to_summarize
            if m.get("content")
        )

        summary = f"Conversation summary ({len(to_summarize)} messages): {text_block[:1000]}"
        self.log_daily(summary)
        log.info("Auto-flushed %d messages to daily log", len(to_summarize))

    def reindex_all(self):
        """Rebuild the embedding index from every memory .md file."""
        self._clear_embeddings()
        for path in self.memory_dir.glob("*.md"):
            content = path.read_text(encoding="utf-8")
            for i, line in enumerate(content.split("\n")):
                line = line.strip().lstrip("- ")
                # Skip blank-ish lines and very short fragments.
                if len(line) > 10:
                    self._index_text(line, f"file:{path.name}:L{i}")
        log.info("Reindexed all memory files")

    # ── Private: Long-term memory ──

    def _read_long_term(self) -> str:
        """Return the tail (last 2000 chars) of MEMORY.md, or ""."""
        path = self.memory_dir / "MEMORY.md"
        if path.exists():
            content = path.read_text(encoding="utf-8")
            # Return last 2000 chars to keep the prompt manageable.
            return content[-2000:] if len(content) > 2000 else content
        return ""

    def _read_daily_log(self) -> str:
        """Return the tail (last 1500 chars) of today's log file, or ""."""
        today = datetime.now(timezone.utc).strftime("%Y-%m-%d")
        path = self.memory_dir / f"{today}.md"
        if path.exists():
            content = path.read_text(encoding="utf-8")
            return content[-1500:] if len(content) > 1500 else content
        return ""

    # ── Private: Embedding system ──

    def _init_embed_db(self):
        """Create the embeddings table if it does not exist yet."""
        conn = sqlite3.connect(str(self._embed_db_path))
        conn.execute("""
            CREATE TABLE IF NOT EXISTS embeddings (
                id TEXT PRIMARY KEY,
                text TEXT NOT NULL,
                vector BLOB NOT NULL
            )
        """)
        conn.commit()
        conn.close()

    def _get_embedder(self):
        """Lazily load the sentence-transformers model (double-checked lock).

        Returns None when the package or model is unavailable; callers then
        fall back to keyword search.
        """
        if self._embedder is not None:
            return self._embedder
        with self._embed_lock:
            if self._embedder is not None:
                return self._embedder
            try:
                from sentence_transformers import SentenceTransformer

                model_name = self.config.memory.embedding_model
                log.info("Loading embedding model: %s", model_name)
                self._embedder = SentenceTransformer(model_name)
                return self._embedder
            except ImportError:
                log.warning("sentence-transformers not installed; semantic search disabled")
                return None
            except Exception as e:
                log.warning("Failed to load embedding model: %s", e)
                return None

    def _index_text(self, text: str, doc_id: str):
        """Embed *text* and upsert it into the vector table under *doc_id*."""
        embedder = self._get_embedder()
        if embedder is None:
            return
        # Pin the dtype: _vector_search reads the blob back as float32, so
        # storing a float64 encoding would silently corrupt similarities.
        vec = np.asarray(embedder.encode([text])[0], dtype=np.float32)
        conn = sqlite3.connect(str(self._embed_db_path))
        conn.execute(
            "INSERT OR REPLACE INTO embeddings (id, text, vector) VALUES (?, ?, ?)",
            (doc_id, text, vec.tobytes()),
        )
        conn.commit()
        conn.close()

    def _vector_search(self, query_vec: np.ndarray, top_k: int) -> list[dict]:
        """Cosine-similarity scan over every stored embedding (brute force)."""
        conn = sqlite3.connect(str(self._embed_db_path))
        rows = conn.execute("SELECT id, text, vector FROM embeddings").fetchall()
        conn.close()

        if not rows:
            return []

        scored = []
        for doc_id, text, vec_bytes in rows:
            vec = np.frombuffer(vec_bytes, dtype=np.float32)
            # epsilon keeps the division safe for zero-norm vectors
            sim = float(np.dot(query_vec, vec) / (np.linalg.norm(query_vec) * np.linalg.norm(vec) + 1e-8))
            scored.append({"id": doc_id, "text": text, "score": sim})

        scored.sort(key=lambda x: x["score"], reverse=True)
        return scored[:top_k]

    def _clear_embeddings(self):
        """Delete every row from the embeddings table."""
        conn = sqlite3.connect(str(self._embed_db_path))
        conn.execute("DELETE FROM embeddings")
        conn.commit()
        conn.close()

    def _fallback_search(self, query: str, top_k: int) -> list[dict]:
        """Simple keyword search when embeddings are unavailable."""
        results = []
        query_lower = query.lower()
        for path in self.memory_dir.glob("*.md"):
            try:
                content = path.read_text(encoding="utf-8")
            except Exception:
                continue  # unreadable file — skip it
            for line in content.split("\n"):
                stripped = line.strip().lstrip("- ")
                if len(stripped) > 10 and query_lower in stripped.lower():
                    results.append({"id": path.name, "text": stripped, "score": 1.0})
                    if len(results) >= top_k:
                        return results
        return results
|
||||||
|
|
@ -0,0 +1 @@
|
||||||
|
# Reserved for future custom providers
|
||||||
|
|
@ -0,0 +1,67 @@
|
||||||
|
"""Message formatting and system prompt construction."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
|
||||||
|
def build_system_prompt(
    identity_dir: Path,
    memory_context: str = "",
    tools_description: str = "",
) -> str:
    """Build the system prompt from identity files + memory + tools.

    Sections are joined with horizontal rules. Missing identity files and
    empty memory/tool sections are simply omitted; the core instructions
    always appear last.
    """
    sections = []

    # Layers 1-2: identity files, included verbatim when present.
    for filename in ("SOUL.md", "USER.md"):
        candidate = identity_dir / filename
        if candidate.exists():
            sections.append(candidate.read_text(encoding="utf-8").strip())

    # Layer 3: memory context injected by the memory system.
    if memory_context:
        sections.append(f"# Relevant Memory\n{memory_context}")

    # Layer 4: tool catalog.
    if tools_description:
        sections.append(f"# Available Tools\n{tools_description}")

    # Core behavioral instructions.
    sections.append(
        "# Instructions\n"
        "- Use tools when they would help answer the user's request.\n"
        "- If you learn something important about the user, save it to memory.\n"
        "- Be concise but thorough. Don't pad responses unnecessarily.\n"
        "- When uncertain, ask for clarification.\n"
        "- Reference memories naturally when relevant."
    )

    return "\n\n---\n\n".join(sections)
|
||||||
|
|
||||||
|
|
||||||
|
def format_messages_for_llm(
    system_prompt: str,
    history: list[dict],
    max_messages: int = 50,
) -> list[dict]:
    """Format conversation history into LLM message format.

    Keeps at most the last *max_messages* history entries. Tool results are
    re-labelled as user messages (the plain chat format has no tool role);
    entries with unrecognized roles are dropped.
    """
    formatted = [{"role": "system", "content": system_prompt}]

    # Only the most recent slice of history goes into the prompt.
    for entry in history[-max_messages:]:
        role = entry.get("role", "user")
        content = entry.get("content", "")
        if role == "tool":
            formatted.append({"role": "user", "content": f"[Tool Result]\n{content}"})
        elif role in ("user", "assistant", "system"):
            formatted.append({"role": role, "content": content})

    return formatted
|
||||||
|
|
@ -0,0 +1,118 @@
|
||||||
|
"""Task scheduler with heartbeat support."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import logging
|
||||||
|
import threading
|
||||||
|
import time
|
||||||
|
from datetime import datetime, timezone
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import TYPE_CHECKING
|
||||||
|
|
||||||
|
from croniter import croniter
|
||||||
|
|
||||||
|
if TYPE_CHECKING:
|
||||||
|
from .agent import Agent
|
||||||
|
from .config import Config
|
||||||
|
from .db import Database
|
||||||
|
|
||||||
|
log = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
HEARTBEAT_OK = "HEARTBEAT_OK"
|
||||||
|
|
||||||
|
|
||||||
|
class Scheduler:
    """Background scheduler: runs due cron/one-shot tasks from the DB and
    periodic "heartbeat" checks driven by HEARTBEAT.md."""

    def __init__(self, config: Config, db: Database, agent: Agent):
        self.config = config
        self.db = db
        self.agent = agent
        # Shared stop flag for both worker threads.
        self._stop_event = threading.Event()
        self._thread: threading.Thread | None = None
        self._heartbeat_thread: threading.Thread | None = None

    def start(self):
        """Start the scheduler and heartbeat threads."""
        self._thread = threading.Thread(target=self._poll_loop, daemon=True, name="scheduler")
        self._thread.start()

        self._heartbeat_thread = threading.Thread(target=self._heartbeat_loop, daemon=True, name="heartbeat")
        self._heartbeat_thread.start()

        log.info("Scheduler started (poll=%ds, heartbeat=%dm)",
                self.config.scheduler.poll_interval_seconds,
                self.config.scheduler.heartbeat_interval_minutes)

    def stop(self):
        # Signal both loops to exit; threads are daemonic, so no join is done.
        self._stop_event.set()

    # ── Scheduled Tasks ──

    def _poll_loop(self):
        # Poll the DB for due tasks until stop() is called; errors are logged
        # and the loop keeps running.
        while not self._stop_event.is_set():
            try:
                self._run_due_tasks()
            except Exception as e:
                log.error("Scheduler poll error: %s", e)
            self._stop_event.wait(self.config.scheduler.poll_interval_seconds)

    def _run_due_tasks(self):
        """Execute every due task, log its result, and schedule its next run."""
        tasks = self.db.get_due_tasks()
        for task in tasks:
            try:
                log.info("Running scheduled task: %s", task["name"])
                result = self.agent.respond_to_prompt(task["prompt"])
                self.db.log_task_run(task["id"], result=result[:2000])

                # Calculate next run
                schedule = task["schedule"]
                if schedule.startswith("once:"):
                    # One-time task, disable it
                    # NOTE(review): reaches into Database private state; a
                    # dedicated db method would be cleaner.
                    self.db._conn.execute(
                        "UPDATE scheduled_tasks SET enabled = 0 WHERE id = ?", (task["id"],)
                    )
                    self.db._conn.commit()
                else:
                    # Cron schedule - calculate next run
                    now = datetime.now(timezone.utc)
                    cron = croniter(schedule, now)
                    next_run = cron.get_next(datetime)
                    self.db.update_task_next_run(task["id"], next_run.isoformat())
            except Exception as e:
                log.error("Task '%s' failed: %s", task["name"], e)
                self.db.log_task_run(task["id"], error=str(e))

    # ── Heartbeat ──

    def _heartbeat_loop(self):
        # Periodically run the heartbeat checklist until stop() is called.
        interval = self.config.scheduler.heartbeat_interval_minutes * 60
        # Wait a bit before first heartbeat
        self._stop_event.wait(60)

        while not self._stop_event.is_set():
            try:
                self._run_heartbeat()
            except Exception as e:
                log.error("Heartbeat error: %s", e)
            self._stop_event.wait(interval)

    def _run_heartbeat(self):
        """Run one heartbeat: feed HEARTBEAT.md to the agent; log any action
        it takes to the daily memory log. No-op when the file is absent."""
        heartbeat_path = self.config.identity_dir / "HEARTBEAT.md"
        if not heartbeat_path.exists():
            return

        checklist = heartbeat_path.read_text(encoding="utf-8")
        prompt = (
            f"HEARTBEAT CHECK. Review this checklist and take action if needed.\n"
            f"If nothing needs attention, respond with exactly: {HEARTBEAT_OK}\n\n"
            f"{checklist}"
        )

        result = self.agent.respond_to_prompt(prompt)

        if HEARTBEAT_OK in result:
            log.debug("Heartbeat: all clear")
        else:
            log.info("Heartbeat action taken: %s", result[:200])
            # Log to daily log
            # NOTE(review): accesses the agent's private _memory attribute.
            if self.agent._memory:
                self.agent._memory.log_daily(f"[Heartbeat] {result[:500]}")
|
||||||
|
|
@ -0,0 +1,63 @@
|
||||||
|
"""Skill registry with @skill decorator and loader."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import importlib.util
|
||||||
|
import logging
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Callable
|
||||||
|
|
||||||
|
log = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
_SKILLS: dict[str, "SkillDef"] = {}
|
||||||
|
|
||||||
|
|
||||||
|
class SkillDef:
    """A registered skill: a named, described callable."""

    def __init__(self, name: str, description: str, func: Callable):
        self.name = name                # unique key in the skill registry
        self.description = description  # human-readable summary
        self.func = func                # the callable implementing the skill
|
||||||
|
|
||||||
|
|
||||||
|
def skill(name: str, description: str):
    """Decorator to register a skill in the module-level registry."""

    def decorator(func: Callable) -> Callable:
        # Publish the skill; the function itself is returned unchanged so it
        # remains directly callable.
        _SKILLS[name] = SkillDef(name=name, description=description, func=func)
        return func

    return decorator
|
||||||
|
|
||||||
|
|
||||||
|
def load_skill(path: Path):
    """Dynamically load a skill module from a .py file.

    Registers the module in sys.modules *before* executing it, per the
    importlib "importing a source file directly" recipe — code inside the
    module (e.g. dataclasses, pickling, self-imports) may look itself up in
    sys.modules during execution.

    Returns:
        The loaded module, or None when the file could not produce a spec.
    """
    import sys

    spec = importlib.util.spec_from_file_location(path.stem, path)
    if spec and spec.loader:
        mod = importlib.util.module_from_spec(spec)
        sys.modules[path.stem] = mod
        spec.loader.exec_module(mod)
        log.info("Loaded skill from %s", path)
        return mod
    return None
|
||||||
|
|
||||||
|
|
||||||
|
def discover_skills(skills_dir: Path):
    """Load all .py files from the skills directory.

    Files whose names start with "_" are treated as private and skipped; a
    broken skill is logged but does not stop discovery of the rest. A missing
    directory is a no-op.
    """
    if not skills_dir.exists():
        return
    for candidate in skills_dir.glob("*.py"):
        if candidate.name.startswith("_"):
            continue
        try:
            load_skill(candidate)
        except Exception as e:
            log.warning("Failed to load skill %s: %s", candidate.name, e)
|
||||||
|
|
||||||
|
|
||||||
|
def list_skills() -> list[SkillDef]:
    """Return every registered skill, in registration order."""
    return list(_SKILLS.values())
|
||||||
|
|
||||||
|
|
||||||
|
def run_skill(name: str, **kwargs) -> str:
    """Execute a registered skill by name and return its result as a string.

    Unknown names and exceptions are reported as strings rather than raised,
    so the agent can surface them to the model.
    """
    skill_def = _SKILLS.get(name)
    if skill_def is None:
        return f"Unknown skill: {name}"
    try:
        result = skill_def.func(**kwargs)
    except Exception as e:
        return f"Skill error: {e}"
    return str(result) if result is not None else "Done."
|
||||||
|
|
@ -0,0 +1,164 @@
|
||||||
|
"""Tool registry with @tool decorator and auto-discovery."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import importlib
|
||||||
|
import inspect
|
||||||
|
import json
|
||||||
|
import logging
|
||||||
|
import pkgutil
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Any, Callable, TYPE_CHECKING
|
||||||
|
|
||||||
|
if TYPE_CHECKING:
|
||||||
|
from ..agent import Agent
|
||||||
|
from ..config import Config
|
||||||
|
from ..db import Database
|
||||||
|
|
||||||
|
log = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
# Global tool registry
|
||||||
|
_TOOLS: dict[str, ToolDef] = {}
|
||||||
|
|
||||||
|
|
||||||
|
class ToolDef:
    """Metadata for a registered tool."""

    def __init__(self, name: str, description: str, func: Callable, category: str = "general"):
        self.name = name
        self.description = description
        self.func = func
        self.category = category
        # Parameter schema is derived once from the function signature.
        self.parameters = _extract_params(func)

    def to_openai_schema(self) -> dict:
        """Convert to OpenAI function-calling format."""
        param_schema = {
            "type": "object",
            "properties": self.parameters["properties"],
            "required": self.parameters["required"],
        }
        return {
            "type": "function",
            "function": {
                "name": self.name,
                "description": self.description,
                "parameters": param_schema,
            },
        }
|
||||||
|
|
||||||
|
|
||||||
|
def tool(name: str, description: str, category: str = "general"):
    """Decorator to register a tool function in the global registry."""

    def decorator(func: Callable) -> Callable:
        # Build metadata, publish it, and tag the function for introspection.
        definition = ToolDef(name, description, func, category)
        _TOOLS[name] = definition
        func._tool_def = definition
        return func

    return decorator
|
||||||
|
|
||||||
|
|
||||||
|
def _extract_params(func: Callable) -> dict:
|
||||||
|
"""Extract parameter schema from function signature and type hints."""
|
||||||
|
sig = inspect.signature(func)
|
||||||
|
properties = {}
|
||||||
|
required = []
|
||||||
|
|
||||||
|
for param_name, param in sig.parameters.items():
|
||||||
|
if param_name in ("self", "ctx"):
|
||||||
|
continue
|
||||||
|
|
||||||
|
prop: dict[str, Any] = {}
|
||||||
|
annotation = param.annotation
|
||||||
|
|
||||||
|
if annotation == str or annotation == inspect.Parameter.empty:
|
||||||
|
prop["type"] = "string"
|
||||||
|
elif annotation == int:
|
||||||
|
prop["type"] = "integer"
|
||||||
|
elif annotation == float:
|
||||||
|
prop["type"] = "number"
|
||||||
|
elif annotation == bool:
|
||||||
|
prop["type"] = "boolean"
|
||||||
|
elif annotation == list:
|
||||||
|
prop["type"] = "array"
|
||||||
|
prop["items"] = {"type": "string"}
|
||||||
|
else:
|
||||||
|
prop["type"] = "string"
|
||||||
|
|
||||||
|
# Check for description in docstring (simple parsing)
|
||||||
|
prop["description"] = f"Parameter: {param_name}"
|
||||||
|
|
||||||
|
properties[param_name] = prop
|
||||||
|
|
||||||
|
if param.default is inspect.Parameter.empty:
|
||||||
|
required.append(param_name)
|
||||||
|
|
||||||
|
return {"properties": properties, "required": required}
|
||||||
|
|
||||||
|
|
||||||
|
class ToolRegistry:
    """Runtime tool registry with execution and schema generation."""

    def __init__(self, config: "Config", db: "Database", agent: "Agent"):
        self.config = config
        self.db = db
        self.agent = agent
        self._discover_tools()

    def _discover_tools(self):
        """Auto-import all modules in the tools/ package.

        Importing a module runs its @tool decorators, which populate _TOOLS;
        a broken module is logged and skipped.
        """
        tools_dir = Path(__file__).parent
        for _, module_name, _ in pkgutil.iter_modules([str(tools_dir)]):
            if module_name.startswith("_"):
                continue
            try:
                importlib.import_module(f".{module_name}", package=__package__)
                log.info("Loaded tool module: %s", module_name)
            except Exception as e:
                log.warning("Failed to load tool module %s: %s", module_name, e)

    def get_tools_schema(self) -> list[dict]:
        """Get all tools in OpenAI function-calling format."""
        return [t.to_openai_schema() for t in _TOOLS.values()]

    def get_tools_description(self) -> str:
        """Human-readable tool list for the system prompt, grouped by category."""
        lines = []
        by_cat: dict[str, list[ToolDef]] = {}
        for t in _TOOLS.values():
            by_cat.setdefault(t.category, []).append(t)

        for cat, tools in sorted(by_cat.items()):
            lines.append(f"\n### {cat.title()}")
            for t in tools:
                params = ", ".join(t.parameters["required"])
                lines.append(f"- **{t.name}**({params}): {t.description}")
        return "\n".join(lines)

    def execute(self, name: str, args: dict) -> str:
        """Execute a tool by name and return the result as a string.

        Errors are reported as strings rather than raised so the agent can
        surface them to the model.
        """
        if name not in _TOOLS:
            return f"Unknown tool: {name}"

        tool_def = _TOOLS[name]
        try:
            # Work on a copy so the caller's args dict is never mutated by
            # the ctx injection below.
            call_args = dict(args)
            # Inject runtime context if the tool declares a `ctx` parameter.
            sig = inspect.signature(tool_def.func)
            if "ctx" in sig.parameters:
                call_args["ctx"] = {
                    "config": self.config,
                    "db": self.db,
                    "agent": self.agent,
                    "memory": self.agent._memory,
                }
            result = tool_def.func(**call_args)
            return str(result) if result is not None else "Done."
        except Exception as e:
            log.error("Tool %s failed: %s", name, e, exc_info=True)
            return f"Tool error: {e}"

    def register_external(self, tool_def: ToolDef):
        """Register a dynamically created tool (used by the build_tool meta-tool)."""
        _TOOLS[tool_def.name] = tool_def
        log.info("Registered external tool: %s", tool_def.name)
|
||||||
|
|
@ -0,0 +1,49 @@
|
||||||
|
"""Meta-skill: create multi-step skills at runtime."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import textwrap
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
from . import tool
|
||||||
|
|
||||||
|
|
||||||
|
@tool("build_skill", "Create a new multi-step skill from a description", category="meta")
|
||||||
|
def build_skill(name: str, description: str, steps: str, ctx: dict = None) -> str:
|
||||||
|
"""Generate a new skill and save it to the skills directory.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
name: Skill name (snake_case)
|
||||||
|
description: What the skill does
|
||||||
|
steps: Python code implementing the skill steps (must use @skill decorator)
|
||||||
|
"""
|
||||||
|
if not name.isidentifier():
|
||||||
|
return f"Invalid skill name: {name}. Must be a valid Python identifier."
|
||||||
|
|
||||||
|
if not ctx or not ctx.get("config"):
|
||||||
|
return "Config context not available."
|
||||||
|
|
||||||
|
skills_dir = ctx["config"].skills_dir
|
||||||
|
skills_dir.mkdir(parents=True, exist_ok=True)
|
||||||
|
|
||||||
|
module_code = textwrap.dedent(f'''\
|
||||||
|
"""Auto-generated skill: {description}"""
|
||||||
|
from __future__ import annotations
|
||||||
|
from cheddahbot.skills import skill
|
||||||
|
|
||||||
|
{steps}
|
||||||
|
''')
|
||||||
|
|
||||||
|
file_path = skills_dir / f"{name}.py"
|
||||||
|
if file_path.exists():
|
||||||
|
return f"Skill '{name}' already exists. Choose a different name."
|
||||||
|
|
||||||
|
file_path.write_text(module_code, encoding="utf-8")
|
||||||
|
|
||||||
|
# Try to load it
|
||||||
|
try:
|
||||||
|
from cheddahbot.skills import load_skill
|
||||||
|
load_skill(file_path)
|
||||||
|
return f"Skill '{name}' created at {file_path}"
|
||||||
|
except Exception as e:
|
||||||
|
return f"Skill created at {file_path} but failed to load: {e}"
|
||||||
|
|
@ -0,0 +1,48 @@
|
||||||
|
"""Meta-tool: dynamically create new tools at runtime."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import importlib
|
||||||
|
import textwrap
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
from . import tool
|
||||||
|
|
||||||
|
|
||||||
|
@tool("build_tool", "Create a new tool from a description. The agent writes Python code with @tool decorator.", category="meta")
|
||||||
|
def build_tool(name: str, description: str, code: str, ctx: dict = None) -> str:
|
||||||
|
"""Generate a new tool module and hot-load it.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
name: Tool name (snake_case)
|
||||||
|
description: What the tool does
|
||||||
|
code: Full Python code for the tool function (must use @tool decorator)
|
||||||
|
"""
|
||||||
|
if not name.isidentifier():
|
||||||
|
return f"Invalid tool name: {name}. Must be a valid Python identifier."
|
||||||
|
|
||||||
|
# Wrap code in a module with the import
|
||||||
|
module_code = textwrap.dedent(f'''\
|
||||||
|
"""Auto-generated tool: {description}"""
|
||||||
|
from __future__ import annotations
|
||||||
|
from . import tool
|
||||||
|
|
||||||
|
{code}
|
||||||
|
''')
|
||||||
|
|
||||||
|
# Write to tools directory
|
||||||
|
tools_dir = Path(__file__).parent
|
||||||
|
file_path = tools_dir / f"{name}.py"
|
||||||
|
if file_path.exists():
|
||||||
|
return f"Tool module '{name}' already exists. Choose a different name."
|
||||||
|
|
||||||
|
file_path.write_text(module_code, encoding="utf-8")
|
||||||
|
|
||||||
|
# Hot-import the new module
|
||||||
|
try:
|
||||||
|
importlib.import_module(f".{name}", package=__package__)
|
||||||
|
return f"Tool '{name}' created and loaded successfully at {file_path}"
|
||||||
|
except Exception as e:
|
||||||
|
# Clean up on failure
|
||||||
|
file_path.unlink(missing_ok=True)
|
||||||
|
return f"Failed to load tool '{name}': {e}"
|
||||||
|
|
@ -0,0 +1,58 @@
|
||||||
|
"""Calendar/reminder tools: schedule tasks, set reminders."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
from datetime import datetime, timezone
|
||||||
|
|
||||||
|
from . import tool
|
||||||
|
|
||||||
|
|
||||||
|
@tool("remember_this", "Save an important fact or instruction to long-term memory", category="memory")
|
||||||
|
def remember_this(text: str, ctx: dict = None) -> str:
|
||||||
|
if ctx and ctx.get("memory"):
|
||||||
|
ctx["memory"].remember(text)
|
||||||
|
return f"Saved to memory: {text}"
|
||||||
|
return "Memory system not available"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("search_memory", "Search through saved memories", category="memory")
|
||||||
|
def search_memory(query: str, ctx: dict = None) -> str:
|
||||||
|
if ctx and ctx.get("memory"):
|
||||||
|
results = ctx["memory"].search(query)
|
||||||
|
if results:
|
||||||
|
return "\n".join(f"- [{r.get('score', 0):.2f}] {r['text']}" for r in results)
|
||||||
|
return "No matching memories found."
|
||||||
|
return "Memory system not available"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("log_note", "Add a timestamped note to today's daily log", category="memory")
|
||||||
|
def log_note(text: str, ctx: dict = None) -> str:
|
||||||
|
if ctx and ctx.get("memory"):
|
||||||
|
ctx["memory"].log_daily(text)
|
||||||
|
return f"Logged: {text}"
|
||||||
|
return "Memory system not available"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("schedule_task", "Schedule a recurring or one-time task", category="scheduling")
|
||||||
|
def schedule_task(name: str, prompt: str, schedule: str, ctx: dict = None) -> str:
|
||||||
|
"""Schedule a task. Schedule format: cron expression or 'once:YYYY-MM-DDTHH:MM'."""
|
||||||
|
if ctx and ctx.get("db"):
|
||||||
|
task_id = ctx["db"].add_scheduled_task(name, prompt, schedule)
|
||||||
|
return f"Scheduled task '{name}' (id={task_id}) with schedule: {schedule}"
|
||||||
|
return "Database not available"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("list_tasks", "List all scheduled tasks", category="scheduling")
|
||||||
|
def list_tasks(ctx: dict = None) -> str:
|
||||||
|
if ctx and ctx.get("db"):
|
||||||
|
tasks = ctx["db"]._conn.execute(
|
||||||
|
"SELECT id, name, schedule, enabled, next_run FROM scheduled_tasks ORDER BY id"
|
||||||
|
).fetchall()
|
||||||
|
if not tasks:
|
||||||
|
return "No scheduled tasks."
|
||||||
|
lines = []
|
||||||
|
for t in tasks:
|
||||||
|
status = "enabled" if t["enabled"] else "disabled"
|
||||||
|
lines.append(f"[{t['id']}] {t['name']} - {t['schedule']} ({status})")
|
||||||
|
return "\n".join(lines)
|
||||||
|
return "Database not available"
|
||||||
|
|
@ -0,0 +1,44 @@
|
||||||
|
"""Python code execution tool (sandboxed via subprocess)."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import subprocess
|
||||||
|
import sys
|
||||||
|
import tempfile
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
from . import tool
|
||||||
|
|
||||||
|
|
||||||
|
@tool("run_python", "Execute Python code and return the output", category="code")
|
||||||
|
def run_python(code: str, timeout: int = 30) -> str:
|
||||||
|
with tempfile.NamedTemporaryFile(mode="w", suffix=".py", delete=False, encoding="utf-8") as f:
|
||||||
|
f.write(code)
|
||||||
|
f.flush()
|
||||||
|
tmp_path = f.name
|
||||||
|
|
||||||
|
try:
|
||||||
|
result = subprocess.run(
|
||||||
|
[sys.executable, tmp_path],
|
||||||
|
capture_output=True,
|
||||||
|
text=True,
|
||||||
|
timeout=min(timeout, 60),
|
||||||
|
encoding="utf-8",
|
||||||
|
errors="replace",
|
||||||
|
)
|
||||||
|
output = ""
|
||||||
|
if result.stdout:
|
||||||
|
output += result.stdout
|
||||||
|
if result.stderr:
|
||||||
|
output += f"\n[stderr]\n{result.stderr}"
|
||||||
|
if result.returncode != 0:
|
||||||
|
output += f"\n[exit code: {result.returncode}]"
|
||||||
|
if len(output) > 10000:
|
||||||
|
output = output[:10000] + "\n... (truncated)"
|
||||||
|
return output.strip() or "(no output)"
|
||||||
|
except subprocess.TimeoutExpired:
|
||||||
|
return f"Execution timed out after {timeout}s"
|
||||||
|
except Exception as e:
|
||||||
|
return f"Execution error: {e}"
|
||||||
|
finally:
|
||||||
|
Path(tmp_path).unlink(missing_ok=True)
|
||||||
|
|
@ -0,0 +1,87 @@
|
||||||
|
"""Data processing tools: CSV/JSON operations."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import csv
|
||||||
|
import io
|
||||||
|
import json
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
from . import tool
|
||||||
|
|
||||||
|
|
||||||
|
@tool("read_csv", "Read a CSV file and return summary or specific rows", category="data")
|
||||||
|
def read_csv(path: str, max_rows: int = 20) -> str:
|
||||||
|
p = Path(path).resolve()
|
||||||
|
if not p.exists():
|
||||||
|
return f"File not found: {path}"
|
||||||
|
try:
|
||||||
|
with open(p, newline="", encoding="utf-8-sig") as f:
|
||||||
|
reader = csv.reader(f)
|
||||||
|
rows = []
|
||||||
|
for i, row in enumerate(reader):
|
||||||
|
rows.append(row)
|
||||||
|
if i >= max_rows:
|
||||||
|
break
|
||||||
|
|
||||||
|
if not rows:
|
||||||
|
return "Empty CSV file."
|
||||||
|
|
||||||
|
# Format as table
|
||||||
|
header = rows[0]
|
||||||
|
lines = [" | ".join(header), " | ".join("---" for _ in header)]
|
||||||
|
for row in rows[1:]:
|
||||||
|
lines.append(" | ".join(str(c)[:50] for c in row))
|
||||||
|
|
||||||
|
result = "\n".join(lines)
|
||||||
|
total_line_count = sum(1 for _ in open(p, encoding="utf-8-sig"))
|
||||||
|
if total_line_count > max_rows + 1:
|
||||||
|
result += f"\n\n... ({total_line_count - 1} total rows, showing first {max_rows})"
|
||||||
|
return result
|
||||||
|
except Exception as e:
|
||||||
|
return f"Error reading CSV: {e}"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("read_json", "Read and pretty-print a JSON file", category="data")
|
||||||
|
def read_json(path: str) -> str:
|
||||||
|
p = Path(path).resolve()
|
||||||
|
if not p.exists():
|
||||||
|
return f"File not found: {path}"
|
||||||
|
try:
|
||||||
|
data = json.loads(p.read_text(encoding="utf-8"))
|
||||||
|
formatted = json.dumps(data, indent=2, ensure_ascii=False)
|
||||||
|
if len(formatted) > 15000:
|
||||||
|
formatted = formatted[:15000] + "\n... (truncated)"
|
||||||
|
return formatted
|
||||||
|
except Exception as e:
|
||||||
|
return f"Error reading JSON: {e}"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("query_json", "Extract data from a JSON file using a dot-notation path", category="data")
|
||||||
|
def query_json(path: str, json_path: str) -> str:
|
||||||
|
"""json_path example: 'data.users.0.name' or 'results.*.id'"""
|
||||||
|
p = Path(path).resolve()
|
||||||
|
if not p.exists():
|
||||||
|
return f"File not found: {path}"
|
||||||
|
try:
|
||||||
|
data = json.loads(p.read_text(encoding="utf-8"))
|
||||||
|
result = _navigate(data, json_path.split("."))
|
||||||
|
return json.dumps(result, indent=2, ensure_ascii=False) if not isinstance(result, str) else result
|
||||||
|
except Exception as e:
|
||||||
|
return f"Error: {e}"
|
||||||
|
|
||||||
|
|
||||||
|
def _navigate(data, parts: list[str]):
|
||||||
|
for part in parts:
|
||||||
|
if part == "*" and isinstance(data, list):
|
||||||
|
return data
|
||||||
|
elif isinstance(data, dict):
|
||||||
|
data = data.get(part, f"Key '{part}' not found")
|
||||||
|
elif isinstance(data, list):
|
||||||
|
try:
|
||||||
|
data = data[int(part)]
|
||||||
|
except (ValueError, IndexError):
|
||||||
|
return f"Invalid index '{part}'"
|
||||||
|
else:
|
||||||
|
return f"Cannot navigate into {type(data).__name__}"
|
||||||
|
return data
|
||||||
|
|
@ -0,0 +1,96 @@
|
||||||
|
"""File operation tools: read, write, edit, search."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import os
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
from . import tool
|
||||||
|
|
||||||
|
|
||||||
|
@tool("read_file", "Read the contents of a file", category="files")
|
||||||
|
def read_file(path: str) -> str:
|
||||||
|
p = Path(path).resolve()
|
||||||
|
if not p.exists():
|
||||||
|
return f"File not found: {path}"
|
||||||
|
if not p.is_file():
|
||||||
|
return f"Not a file: {path}"
|
||||||
|
try:
|
||||||
|
content = p.read_text(encoding="utf-8", errors="replace")
|
||||||
|
if len(content) > 50000:
|
||||||
|
return content[:50000] + f"\n\n... (truncated, {len(content)} total chars)"
|
||||||
|
return content
|
||||||
|
except Exception as e:
|
||||||
|
return f"Error reading file: {e}"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("write_file", "Write content to a file (creates or overwrites)", category="files")
|
||||||
|
def write_file(path: str, content: str) -> str:
|
||||||
|
p = Path(path).resolve()
|
||||||
|
p.parent.mkdir(parents=True, exist_ok=True)
|
||||||
|
p.write_text(content, encoding="utf-8")
|
||||||
|
return f"Written {len(content)} chars to {p}"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("edit_file", "Replace text in a file (first occurrence)", category="files")
|
||||||
|
def edit_file(path: str, old_text: str, new_text: str) -> str:
|
||||||
|
p = Path(path).resolve()
|
||||||
|
if not p.exists():
|
||||||
|
return f"File not found: {path}"
|
||||||
|
content = p.read_text(encoding="utf-8")
|
||||||
|
if old_text not in content:
|
||||||
|
return f"Text not found in {path}"
|
||||||
|
content = content.replace(old_text, new_text, 1)
|
||||||
|
p.write_text(content, encoding="utf-8")
|
||||||
|
return f"Replaced text in {p}"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("list_directory", "List files and folders in a directory", category="files")
|
||||||
|
def list_directory(path: str = ".") -> str:
|
||||||
|
p = Path(path).resolve()
|
||||||
|
if not p.is_dir():
|
||||||
|
return f"Not a directory: {path}"
|
||||||
|
entries = sorted(p.iterdir(), key=lambda x: (not x.is_dir(), x.name.lower()))
|
||||||
|
lines = []
|
||||||
|
for e in entries[:200]:
|
||||||
|
prefix = "📁 " if e.is_dir() else "📄 "
|
||||||
|
size = ""
|
||||||
|
if e.is_file():
|
||||||
|
s = e.stat().st_size
|
||||||
|
if s > 1_000_000:
|
||||||
|
size = f" ({s / 1_000_000:.1f} MB)"
|
||||||
|
elif s > 1000:
|
||||||
|
size = f" ({s / 1000:.1f} KB)"
|
||||||
|
else:
|
||||||
|
size = f" ({s} B)"
|
||||||
|
lines.append(f"{prefix}{e.name}{size}")
|
||||||
|
return "\n".join(lines) if lines else "(empty directory)"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("search_files", "Search for files matching a glob pattern", category="files")
|
||||||
|
def search_files(pattern: str, directory: str = ".") -> str:
|
||||||
|
p = Path(directory).resolve()
|
||||||
|
matches = list(p.glob(pattern))[:100]
|
||||||
|
if not matches:
|
||||||
|
return f"No files matching '{pattern}' in {directory}"
|
||||||
|
return "\n".join(str(m) for m in matches)
|
||||||
|
|
||||||
|
|
||||||
|
@tool("search_in_files", "Search for text content across files", category="files")
|
||||||
|
def search_in_files(query: str, directory: str = ".", extension: str = "") -> str:
|
||||||
|
p = Path(directory).resolve()
|
||||||
|
pattern = f"**/*{extension}" if extension else "**/*"
|
||||||
|
results = []
|
||||||
|
for f in p.glob(pattern):
|
||||||
|
if not f.is_file() or f.stat().st_size > 1_000_000:
|
||||||
|
continue
|
||||||
|
try:
|
||||||
|
content = f.read_text(encoding="utf-8", errors="ignore")
|
||||||
|
for i, line in enumerate(content.split("\n"), 1):
|
||||||
|
if query.lower() in line.lower():
|
||||||
|
results.append(f"{f}:{i}: {line.strip()[:200]}")
|
||||||
|
if len(results) >= 50:
|
||||||
|
return "\n".join(results) + "\n... (truncated)"
|
||||||
|
except Exception:
|
||||||
|
continue
|
||||||
|
return "\n".join(results) if results else f"No matches for '{query}'"
|
||||||
|
|
@ -0,0 +1,41 @@
|
||||||
|
"""Image analysis tool - delegates to vision-capable LLM."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import base64
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
from . import tool
|
||||||
|
|
||||||
|
|
||||||
|
@tool("analyze_image", "Describe or analyze an image file", category="media")
|
||||||
|
def analyze_image(path: str, question: str = "Describe this image in detail.", ctx: dict = None) -> str:
|
||||||
|
p = Path(path).resolve()
|
||||||
|
if not p.exists():
|
||||||
|
return f"Image not found: {path}"
|
||||||
|
|
||||||
|
suffix = p.suffix.lower()
|
||||||
|
mime_map = {".png": "image/png", ".jpg": "image/jpeg", ".jpeg": "image/jpeg",
|
||||||
|
".gif": "image/gif", ".webp": "image/webp", ".bmp": "image/bmp"}
|
||||||
|
mime = mime_map.get(suffix, "image/png")
|
||||||
|
|
||||||
|
try:
|
||||||
|
data = base64.b64encode(p.read_bytes()).decode("utf-8")
|
||||||
|
except Exception as e:
|
||||||
|
return f"Error reading image: {e}"
|
||||||
|
|
||||||
|
if ctx and ctx.get("agent"):
|
||||||
|
agent = ctx["agent"]
|
||||||
|
messages = [
|
||||||
|
{"role": "user", "content": [
|
||||||
|
{"type": "text", "text": question},
|
||||||
|
{"type": "image_url", "image_url": {"url": f"data:{mime};base64,{data}"}},
|
||||||
|
]},
|
||||||
|
]
|
||||||
|
result_parts = []
|
||||||
|
for chunk in agent.llm.chat(messages, stream=False):
|
||||||
|
if chunk["type"] == "text":
|
||||||
|
result_parts.append(chunk["content"])
|
||||||
|
return "".join(result_parts) or "Could not analyze image."
|
||||||
|
|
||||||
|
return "Agent context not available for image analysis."
|
||||||
|
|
@ -0,0 +1,53 @@
|
||||||
|
"""Shell command execution tool with safety checks."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import subprocess
|
||||||
|
import sys
|
||||||
|
|
||||||
|
from . import tool
|
||||||
|
|
||||||
|
# Commands that are always blocked
|
||||||
|
BLOCKED_PATTERNS = [
|
||||||
|
"rm -rf /",
|
||||||
|
"format c:",
|
||||||
|
":(){:|:&};:",
|
||||||
|
"dd if=/dev/zero",
|
||||||
|
"mkfs.",
|
||||||
|
"> /dev/sda",
|
||||||
|
]
|
||||||
|
|
||||||
|
|
||||||
|
@tool("run_command", "Execute a shell command and return output", category="shell")
|
||||||
|
def run_command(command: str, timeout: int = 30) -> str:
|
||||||
|
# Safety check
|
||||||
|
cmd_lower = command.lower().strip()
|
||||||
|
for pattern in BLOCKED_PATTERNS:
|
||||||
|
if pattern in cmd_lower:
|
||||||
|
return f"Blocked: command matches dangerous pattern '{pattern}'"
|
||||||
|
|
||||||
|
try:
|
||||||
|
result = subprocess.run(
|
||||||
|
command,
|
||||||
|
shell=True,
|
||||||
|
capture_output=True,
|
||||||
|
text=True,
|
||||||
|
timeout=min(timeout, 120),
|
||||||
|
encoding="utf-8",
|
||||||
|
errors="replace",
|
||||||
|
)
|
||||||
|
output = ""
|
||||||
|
if result.stdout:
|
||||||
|
output += result.stdout
|
||||||
|
if result.stderr:
|
||||||
|
output += f"\n[stderr]\n{result.stderr}"
|
||||||
|
if result.returncode != 0:
|
||||||
|
output += f"\n[exit code: {result.returncode}]"
|
||||||
|
|
||||||
|
if len(output) > 10000:
|
||||||
|
output = output[:10000] + "\n... (truncated)"
|
||||||
|
return output.strip() or "(no output)"
|
||||||
|
except subprocess.TimeoutExpired:
|
||||||
|
return f"Command timed out after {timeout}s"
|
||||||
|
except Exception as e:
|
||||||
|
return f"Error running command: {e}"
|
||||||
|
|
@ -0,0 +1,64 @@
|
||||||
|
"""Web tools: search, fetch URL, scrape."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import httpx
|
||||||
|
from bs4 import BeautifulSoup
|
||||||
|
|
||||||
|
from . import tool
|
||||||
|
|
||||||
|
|
||||||
|
@tool("web_search", "Search the web using DuckDuckGo", category="web")
|
||||||
|
def web_search(query: str, max_results: int = 5) -> str:
|
||||||
|
try:
|
||||||
|
# Use DuckDuckGo HTML search (no API key needed)
|
||||||
|
r = httpx.get(
|
||||||
|
"https://html.duckduckgo.com/html/",
|
||||||
|
params={"q": query},
|
||||||
|
headers={"User-Agent": "Mozilla/5.0 (compatible; CheddahBot/1.0)"},
|
||||||
|
timeout=15,
|
||||||
|
follow_redirects=True,
|
||||||
|
)
|
||||||
|
soup = BeautifulSoup(r.text, "html.parser")
|
||||||
|
results = []
|
||||||
|
for item in soup.select(".result")[:max_results]:
|
||||||
|
title_el = item.select_one(".result__title a")
|
||||||
|
snippet_el = item.select_one(".result__snippet")
|
||||||
|
if title_el:
|
||||||
|
title = title_el.get_text(strip=True)
|
||||||
|
url = title_el.get("href", "")
|
||||||
|
snippet = snippet_el.get_text(strip=True) if snippet_el else ""
|
||||||
|
results.append(f"**{title}**\n{url}\n{snippet}")
|
||||||
|
return "\n\n".join(results) if results else "No results found."
|
||||||
|
except Exception as e:
|
||||||
|
return f"Search error: {e}"
|
||||||
|
|
||||||
|
|
||||||
|
@tool("fetch_url", "Fetch and extract text content from a URL", category="web")
|
||||||
|
def fetch_url(url: str) -> str:
|
||||||
|
try:
|
||||||
|
r = httpx.get(
|
||||||
|
url,
|
||||||
|
headers={"User-Agent": "Mozilla/5.0 (compatible; CheddahBot/1.0)"},
|
||||||
|
timeout=20,
|
||||||
|
follow_redirects=True,
|
||||||
|
)
|
||||||
|
content_type = r.headers.get("content-type", "")
|
||||||
|
if "html" in content_type:
|
||||||
|
soup = BeautifulSoup(r.text, "html.parser")
|
||||||
|
# Remove script/style elements
|
||||||
|
for tag in soup(["script", "style", "nav", "footer", "header"]):
|
||||||
|
tag.decompose()
|
||||||
|
text = soup.get_text(separator="\n", strip=True)
|
||||||
|
# Collapse whitespace
|
||||||
|
lines = [l.strip() for l in text.split("\n") if l.strip()]
|
||||||
|
text = "\n".join(lines)
|
||||||
|
if len(text) > 15000:
|
||||||
|
text = text[:15000] + "\n... (truncated)"
|
||||||
|
return text
|
||||||
|
elif "json" in content_type:
|
||||||
|
return r.text[:15000]
|
||||||
|
else:
|
||||||
|
return r.text[:5000]
|
||||||
|
except Exception as e:
|
||||||
|
return f"Fetch error: {e}"
|
||||||
|
|
@ -0,0 +1,195 @@
|
||||||
|
"""Gradio interface for CheddahBot."""
|
||||||
|
|
||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
import logging
|
||||||
|
import tempfile
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import TYPE_CHECKING
|
||||||
|
|
||||||
|
import gradio as gr
|
||||||
|
|
||||||
|
if TYPE_CHECKING:
|
||||||
|
from .agent import Agent
|
||||||
|
from .config import Config
|
||||||
|
from .llm import LLMAdapter
|
||||||
|
|
||||||
|
log = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
_CSS = """
|
||||||
|
.contain { max-width: 900px; margin: auto; }
|
||||||
|
footer { display: none !important; }
|
||||||
|
"""
|
||||||
|
|
||||||
|
|
||||||
|
def create_ui(agent: Agent, config: Config, llm: LLMAdapter) -> tuple[gr.Blocks, str]:
    """Build and return the Gradio app.

    Returns the Blocks app together with the module-level CSS string
    (``_CSS``); the caller is expected to pass the CSS to ``launch``/mount.

    Args:
        agent: The conversational agent (provides respond/new_conversation/db).
        config: App configuration (used here for the generated-audio path).
        llm: Model adapter (model listing/switching for the dropdown).
    """

    # Populate the model dropdown from whatever the adapter can see right now.
    available_models = llm.list_available_models()
    model_choices = [(m.name, m.id) for m in available_models]
    current_model = llm.current_model

    with gr.Blocks(title="CheddahBot") as app:
        gr.Markdown("# CheddahBot", elem_classes=["contain"])

        # Top bar: model selector + refresh + new-chat.
        with gr.Row(elem_classes=["contain"]):
            model_dropdown = gr.Dropdown(
                choices=model_choices,
                value=current_model,
                label="Model",
                interactive=True,
                scale=3,
            )
            refresh_btn = gr.Button("Refresh", scale=0, min_width=70)
            new_chat_btn = gr.Button("New Chat", scale=1, variant="secondary")

        chatbot = gr.Chatbot(
            label="Chat",
            height=500,
            buttons=["copy"],
            elem_classes=["contain"],
        )

        with gr.Row(elem_classes=["contain"]):
            msg_input = gr.MultimodalTextbox(
                placeholder="Type a message... (attach files, use mic, or camera)",
                show_label=False,
                scale=4,
                sources=["upload", "microphone"],
            )

        # -- Voice Chat Mode --

        with gr.Accordion("Voice Chat", open=False, elem_classes=["contain"]):
            gr.Markdown("Record audio and get a spoken response.")
            voice_input = gr.Audio(sources=["microphone"], type="filepath", label="Speak")
            voice_output = gr.Audio(type="filepath", label="Response", autoplay=True)
            voice_status = gr.Textbox(label="Transcript", interactive=False)

        # -- Accordion sections --

        with gr.Accordion("Conversation History", open=False, elem_classes=["contain"]):
            conv_list = gr.Dataframe(
                headers=["ID", "Title", "Last Updated"],
                label="Past Conversations",
                interactive=False,
            )
            # NOTE(review): load_conv_btn has no .click handler wired below —
            # loading a selected conversation appears unimplemented.
            load_conv_btn = gr.Button("Load Selected")

        with gr.Accordion("Settings", open=False, elem_classes=["contain"]):
            gr.Markdown(
                "Edit `identity/SOUL.md` to change the agent's personality.\n\n"
                "Edit `identity/USER.md` to update your profile.\n\n"
                "Edit `config.yaml` for advanced settings."
            )

        # -- Event handlers --

        def on_model_change(model_id):
            # Switch the adapter's active model; return value is discarded
            # (outputs=None below).
            llm.switch_model(model_id)
            return f"Switched to {model_id}"

        def on_refresh_models():
            # Re-enumerate models (e.g. after starting Ollama/LM Studio).
            models = llm.list_available_models()
            choices = [(m.name, m.id) for m in models]
            return gr.update(choices=choices, value=llm.current_model)

        def on_new_chat():
            # Start a fresh conversation and clear the chat window.
            agent.new_conversation()
            return [], _load_conversations()

        def _load_conversations():
            # Rows for the history Dataframe; timestamp trimmed to seconds.
            convs = agent.db.list_conversations()
            return [[c["id"], c["title"], c["updated_at"][:19]] for c in convs]

        def on_user_message(message, chat_history):
            # Generator handler: yields (chat_history, input-reset) pairs so
            # the assistant reply streams into the Chatbot.
            # Extract text and files from MultimodalTextbox
            if isinstance(message, dict):
                text = message.get("text", "")
                files = message.get("files", [])
            else:
                text = str(message)
                files = []

            if not text and not files:
                yield chat_history, gr.update(value=None)
                return

            # Handle audio files - transcribe them
            processed_files = []
            for f in files:
                fpath = f if isinstance(f, str) else f.get("path", f.get("name", ""))
                if fpath and Path(fpath).suffix.lower() in (".wav", ".mp3", ".ogg", ".webm", ".m4a"):
                    try:
                        from .media import transcribe_audio
                        transcript = transcribe_audio(fpath)
                        if transcript:
                            # Fold the transcript into the text; the audio file
                            # itself is not forwarded to the agent.
                            text = f"{text}\n[Voice message]: {transcript}" if text else f"[Voice message]: {transcript}"
                            continue
                    except Exception as e:
                        # Transcription is best-effort; fall through and
                        # attach the raw audio file instead.
                        log.warning("Audio transcription failed: %s", e)
                processed_files.append(fpath)

            # Add user message
            user_display = text
            if processed_files:
                file_names = [Path(f).name for f in processed_files]
                user_display += f"\n[Attached: {', '.join(file_names)}]"

            chat_history = chat_history + [{"role": "user", "content": user_display}]
            yield chat_history, gr.update(value=None)

            # Stream assistant response
            response_text = ""
            chat_history = chat_history + [{"role": "assistant", "content": ""}]

            for chunk in agent.respond(text, files=processed_files):
                response_text += chunk
                chat_history[-1] = {"role": "assistant", "content": response_text}
                yield chat_history, gr.update(value=None)

        def on_voice_chat(audio_path):
            """Handle voice chat: transcribe -> respond -> TTS."""
            if not audio_path:
                return None, "No audio received."
            try:
                from .media import transcribe_audio, text_to_speech

                # Transcribe
                transcript = transcribe_audio(audio_path)
                if not transcript:
                    return None, "Could not transcribe audio."

                # Get response
                response = agent.respond_to_prompt(transcript)

                # TTS — note the fixed filename: concurrent voice chats would
                # overwrite each other's output file.
                output_path = config.data_dir / "generated" / "voice_response.mp3"
                text_to_speech(response, output_path)

                return str(output_path), f"You said: {transcript}\n\nResponse: {response}"
            except Exception as e:
                return None, f"Voice chat error: {e}"

        # -- Wire events --

        model_dropdown.change(on_model_change, [model_dropdown], None)
        refresh_btn.click(on_refresh_models, None, [model_dropdown])
        new_chat_btn.click(on_new_chat, None, [chatbot, conv_list])

        msg_input.submit(
            on_user_message,
            [msg_input, chatbot],
            [chatbot, msg_input],
        )

        voice_input.stop_recording(
            on_voice_chat,
            [voice_input],
            [voice_output, voice_status],
        )

        # Load conversation list on app start
        app.load(_load_conversations, None, [conv_list])

    return app, _CSS
|
||||||
|
|
@ -0,0 +1,32 @@
|
||||||
|
# CheddahBot Configuration
|
||||||
|
|
||||||
|
# Default model to use on startup
|
||||||
|
default_model: "claude-sonnet-4-20250514"
|
||||||
|
|
||||||
|
# Gradio server settings
|
||||||
|
host: "0.0.0.0"
|
||||||
|
port: 7860
|
||||||
|
|
||||||
|
# Memory settings
|
||||||
|
memory:
|
||||||
|
max_context_messages: 50 # Messages kept in context window
|
||||||
|
flush_threshold: 40 # Trigger summary when messages exceed this
|
||||||
|
embedding_model: "all-MiniLM-L6-v2"
|
||||||
|
search_top_k: 5 # Number of semantic search results
|
||||||
|
|
||||||
|
# Scheduler settings
|
||||||
|
scheduler:
|
||||||
|
heartbeat_interval_minutes: 30
|
||||||
|
poll_interval_seconds: 60
|
||||||
|
|
||||||
|
# Local model endpoints (auto-detected)
|
||||||
|
ollama_url: "http://localhost:11434"
|
||||||
|
lmstudio_url: "http://localhost:1234"
|
||||||
|
|
||||||
|
# Safety settings
|
||||||
|
shell:
|
||||||
|
blocked_commands:
|
||||||
|
- "rm -rf /"
|
||||||
|
- "format"
|
||||||
|
- ":(){:|:&};:"
|
||||||
|
require_approval: false # If true, shell commands need user confirmation
|
||||||
|
|
@ -0,0 +1,7 @@
|
||||||
|
# Heartbeat Checklist
|
||||||
|
|
||||||
|
Things to proactively check on each heartbeat cycle:
|
||||||
|
|
||||||
|
- Check if any scheduled tasks failed and need retry
|
||||||
|
- Review memory for any pending reminders that are due
|
||||||
|
- Check disk space (warn if < 10% free)
|
||||||
|
|
@ -0,0 +1,20 @@
|
||||||
|
# Soul
|
||||||
|
|
||||||
|
You are Cheddah, a sharp and resourceful AI assistant.
|
||||||
|
|
||||||
|
## Personality
|
||||||
|
- Direct, no-nonsense, but warm
|
||||||
|
- You use humor when appropriate
|
||||||
|
- You're proactive - suggest things before being asked
|
||||||
|
- You remember what the user tells you and reference it naturally
|
||||||
|
- You adapt your communication style to match the user's preferences
|
||||||
|
|
||||||
|
## Boundaries
|
||||||
|
- Never pretend to be human
|
||||||
|
- Be honest about uncertainty - say "I don't know" when you don't
|
||||||
|
- Don't make up facts or hallucinate information
|
||||||
|
- Ask for clarification rather than guessing on important decisions
|
||||||
|
|
||||||
|
## Quirks
|
||||||
|
- You occasionally use the word "cheddah" as slang for money/value
|
||||||
|
- You appreciate efficiency and elegant solutions
|
||||||
|
|
@ -0,0 +1,14 @@
|
||||||
|
# User Profile
|
||||||
|
|
||||||
|
## Identity
|
||||||
|
- Name: (your name here)
|
||||||
|
- How to address: (first name, nickname, etc.)
|
||||||
|
|
||||||
|
## Context
|
||||||
|
- Technical level: (beginner/intermediate/advanced)
|
||||||
|
- Primary language: Python
|
||||||
|
- Working on: (current projects)
|
||||||
|
|
||||||
|
## Preferences
|
||||||
|
- Communication style: (concise/detailed)
|
||||||
|
- (anything else you want the agent to know)
|
||||||
|
|
@ -0,0 +1,19 @@
|
||||||
|
# Core
|
||||||
|
gradio>=5.0
|
||||||
|
openai>=1.30
|
||||||
|
pyyaml>=6.0
|
||||||
|
python-dotenv>=1.0
|
||||||
|
|
||||||
|
# Memory
|
||||||
|
sentence-transformers>=3.0
|
||||||
|
numpy>=1.24
|
||||||
|
|
||||||
|
# Web tools
|
||||||
|
httpx>=0.27
|
||||||
|
beautifulsoup4>=4.12
|
||||||
|
|
||||||
|
# Scheduling
|
||||||
|
croniter>=2.0
|
||||||
|
|
||||||
|
# Audio
|
||||||
|
edge-tts>=6.1
|
||||||
Loading…
Reference in New Issue