feat(brain): Phase B — Vector-DB-Memory, Conversation-Loop, Skills, Tool-Use

OpenClaw (aria-core) ist raus, ARIA laeuft jetzt mit eigenem Agent-Framework im aria-brain Container. Vector-DB-basiertes Gedaechtnis statt Sessions, eigener Conversation-Loop mit Hot+Cold-Memory + Rolling Window, Tool-Use fuer Skills, Memory-Destillat-Pipeline. aria-brain/ (neuer Container) - main.py FastAPI auf 8080, alle Endpoints - agent.py Conversation-Loop mit Tool-Use (skill_create + run_<skill>) - conversation.py Rolling Window, JSONL-Persistenz, Distill-Marker - proxy_client.py httpx-Wrapper zum Claude-Proxy, OpenAI-Format - prompts.py System-Prompt aus Hot+Cold+Skills - migration.py Markdown-Parser fuer brain-import/ → atomare Memories - skills.py Filesystem-Layer fuer /data/skills/<name>/ (Python-only, venv pro Skill, tar.gz Export/Import, Run-Logs) - memory/ Embedder (sentence-transformers, multilingual MiniLM) + VectorStore (Qdrant-Wrapper) docker-compose.yml - aria-core (OpenClaw) raus, openclaw-config Volume raus - aria-brain Service (FastAPI + Memory) - aria-qdrant Service (Vector-DB) mit Bind-Mount aria-data/brain/qdrant/ - Diagnostic teilt jetzt Netzwerk mit Bridge (vorher: aria-core) - Brain bekommt SSH-Mount fuer aria-wohnung + /import fuer brain-import/ bridge/aria_bridge.py - send_to_core → HTTP-Call an aria-brain:8080/chat (statt OpenClaw-WS) - aria-core-spezifische Handler raus: doctor_fix, aria_restart, aria_session_reset, Auto-Compact-Logik, OpenClaw-Handshake - Generischer container_restart-Handler (Whitelist Bridge/Brain/Qdrant) - Side-Channel-Events aus /chat-Response (z.B. skill_created) werden als RVS-Events forwarded - file_list_request / file_delete_request → an Diagnostic forwarded - Tote OpenClaw-Connection-Logik bleibt im Code als Referenz (nicht aktiv) Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-05-11 22:23:17 +02:00
parent d0cb7acd10
commit 70d1500096
14 changed files with 2572 additions and 149 deletions
@@ -0,0 +1,125 @@
+"""
+Claude-Aufruf ueber den lokalen Proxy.
+
+Der Proxy (claude-max-api-proxy) bietet eine OpenAI-kompatible API
+unter http://proxy:3456/v1/chat/completions. Wir nutzen non-streaming
+mit einem laengeren Timeout — Claude Code spawnt pro Anfrage einen
+neuen CLI-Prozess (Cold-Start), das dauert.
+"""
+
+from __future__ import annotations
+
+import logging
+import os
+from typing import List, Optional
+
+import httpx
+from pydantic import BaseModel
+
+logger = logging.getLogger(__name__)
+
+DEFAULT_MODEL = os.environ.get("BRAIN_MODEL", "claude-sonnet-4")
+PROXY_URL = os.environ.get("PROXY_URL", "http://proxy:3456")
+PROXY_TIMEOUT_SEC = float(os.environ.get("PROXY_TIMEOUT_SEC", "300"))
+
+
+class Message(BaseModel):
+    role: str  # "system" | "user" | "assistant" | "tool"
+    content: Optional[str] = None
+    tool_calls: Optional[list] = None
+    tool_call_id: Optional[str] = None
+    name: Optional[str] = None  # nur fuer role=tool
+
+
+class ProxyResult(BaseModel):
+    content: str = ""
+    tool_calls: list = []  # je: {"id", "name", "arguments" (dict)}
+    finish_reason: str = ""
+
+
+class ProxyClient:
+    def __init__(self, base_url: str = PROXY_URL, model: str = DEFAULT_MODEL):
+        self.base_url = base_url.rstrip("/")
+        self.model = model
+        # Persistente Client-Connection — vermeidet TCP-Handshake bei jedem Call
+        self._client = httpx.Client(timeout=PROXY_TIMEOUT_SEC)
+
+    def chat(self, messages: List[Message], model: Optional[str] = None) -> str:
+        """Convenience: einfacher Chat ohne Tools. Gibt nur den Reply-String zurueck."""
+        result = self.chat_full(messages, tools=None, model=model)
+        if not result.content:
+            raise RuntimeError("Proxy lieferte leeren content")
+        return result.content
+
+    def chat_full(
+        self,
+        messages: List[Message],
+        tools: Optional[list] = None,
+        model: Optional[str] = None,
+    ) -> ProxyResult:
+        """Full chat — kann Tool-Calls liefern (wenn tools mitgegeben).
+
+        tools-Format ist OpenAI-Style:
+          [{"type":"function","function":{"name":..,"description":..,"parameters":{...}}}, ...]
+        """
+        url = f"{self.base_url}/v1/chat/completions"
+        # Pydantic-Dumps mit exclude_none damit role=tool ohne tool_calls geht
+        payload = {
+            "model": model or self.model,
+            "messages": [m.model_dump(exclude_none=True) for m in messages],
+        }
+        if tools:
+            payload["tools"] = tools
+        logger.info("Proxy → %s (%d Messages, %d tools, model=%s)",
+                    url, len(messages), len(tools or []), payload["model"])
+        try:
+            r = self._client.post(url, json=payload)
+        except httpx.RequestError as exc:
+            raise RuntimeError(f"Proxy unreachable: {exc}") from exc
+        if r.status_code != 200:
+            raise RuntimeError(f"Proxy HTTP {r.status_code}: {r.text[:300]}")
+        try:
+            data = r.json()
+        except Exception as exc:
+            raise RuntimeError(f"Proxy invalid JSON: {exc}") from exc
+
+        choices = data.get("choices") or []
+        if not choices:
+            raise RuntimeError(f"Proxy ohne choices: {str(data)[:300]}")
+
+        msg = choices[0].get("message") or {}
+        finish_reason = choices[0].get("finish_reason", "")
+
+        content = msg.get("content") or ""
+        if isinstance(content, list):
+            content = "".join(
+                part.get("text", "") for part in content if isinstance(part, dict) and part.get("type") == "text"
+            )
+
+        tool_calls_raw = msg.get("tool_calls") or []
+        tool_calls = []
+        import json as _json
+        for tc in tool_calls_raw:
+            fn = tc.get("function") or {}
+            args_raw = fn.get("arguments", "{}")
+            args: dict
+            if isinstance(args_raw, dict):
+                args = args_raw
+            else:
+                try:
+                    args = _json.loads(args_raw)
+                except Exception:
+                    args = {"_raw": args_raw}
+            tool_calls.append({
+                "id": tc.get("id", ""),
+                "name": fn.get("name", ""),
+                "arguments": args,
+            })
+
+        return ProxyResult(content=content or "", tool_calls=tool_calls, finish_reason=finish_reason)
+
+    def close(self):
+        try:
+            self._client.close()
+        except Exception:
+            pass