Shangri-la-0428
diff --git a/oasyce_sdk/agent/runtime.py b/oasyce_sdk/agent/runtime.py
Lines changed: 1 addition & 0 deletions
diff --git a/oasyce_sdk/samantha/context.py b/oasyce_sdk/samantha/context.py
Lines changed: 18 additions & 3 deletions
diff --git a/oasyce_sdk/samantha/http.py b/oasyce_sdk/samantha/http.py
Lines changed: 100 additions & 0 deletions
diff --git a/oasyce_sdk/samantha/loop.py b/oasyce_sdk/samantha/loop.py
Lines changed: 8 additions & 3 deletions
diff --git a/oasyce_sdk/samantha/memory.py b/oasyce_sdk/samantha/memory.py
Lines changed: 162 additions & 28 deletions
@@ -49,6 +49,7 @@ class Perception:
     dynamic_context: str = ""
     response_contract: ResponseContract | None = None
     generation_controls: GenerationControls | None = None
+    ambient_priors: dict | None = None
 
     @property
     def has_collective_experience(self) -> bool:
 
@@ -206,6 +206,7 @@ def build_messages(
     history_summary: str = "",
     image_urls: list[str] | None = None,
     recent_posts: list[dict[str, Any]] | None = None,
+    message_matches: list[dict[str, Any]] | None = None,
     context_window: int = DEFAULT_CONTEXT_WINDOW,
 ) -> list[dict[str, Any]]:
     """Assemble the full message list with budget-aware truncation.
@@ -311,14 +312,28 @@ def build_messages(
         system_parts.append(posts_text)
         retrieval_used += _estimate_tokens(posts_text)
 
-    # Memories (FTS5 recalled facts)
+    # Memories (FTS5 recalled facts) + verbatim message matches
+    # Remaining retrieval budget: facts get all of it, or ~half when message matches exist
+    remaining_retrieval = budget.retrieval - retrieval_used
+    fact_budget = remaining_retrieval // 2 if message_matches else remaining_retrieval
+    msg_budget = remaining_retrieval - fact_budget
+
     if memories:
-        mem_budget = budget.retrieval - retrieval_used
         mem_lines = [f"- ({m['category']}) {m['content']}" for m in memories[:5]]
         mem_text = "[Your memories about this user]\n" + "\n".join(mem_lines)
-        mem_text = _truncate_text(mem_text, mem_budget)
+        mem_text = _truncate_text(mem_text, fact_budget)
         system_parts.append(mem_text)
 
+    if message_matches:
+        msg_lines = []
+        for m in message_matches[:5]:
+            role = m.get("role", "user")
+            who = "they said" if role == "user" else "you said"
+            msg_lines.append(f'- {who}: "{m.get("content", "")[:200]}"')
+        msg_text = "[Relevant past exchanges]\n" + "\n".join(msg_lines)
+        msg_text = _truncate_text(msg_text, msg_budget)
+        system_parts.append(msg_text)
+
     messages.append({"role": "system", "content": "\n\n".join(system_parts)})
 
     # ── Vision: inject recent post images (base64, concurrent) ─
 
@@ -0,0 +1,100 @@
+"""HTTP webhook server for Samantha.
+
+Three endpoints:
+  POST /hook/message       — chat message webhook from the App backend
+  POST /hook/post_mention  — @mention webhook from the App backend
+  GET  /health             — liveness + active session list
+
+Kept in its own module so server.py focuses on Samantha itself.
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+from http.server import BaseHTTPRequestHandler, HTTPServer
+from typing import TYPE_CHECKING
+
+if TYPE_CHECKING:
+    from .server import Samantha
+
+logger = logging.getLogger(__name__)
+
+
+def make_handler(samantha: "Samantha") -> type[BaseHTTPRequestHandler]:
+    """Bind a Samantha instance to a BaseHTTPRequestHandler subclass.
+
+    Closure-based wiring avoids a module-level global. The returned class
+    is what HTTPServer expects (it instantiates per request).
+    """
+    from .server import Stimulus  # local import: break cycle
+
+    class WebhookHandler(BaseHTTPRequestHandler):
+        def do_POST(self):
+            length = int(self.headers.get("Content-Length", 0))
+            body = json.loads(self.rfile.read(length)) if length else {}
+
+            if self.path == "/hook/message":
+                session_id = body.get("session_id", 0)
+                sender_id = body.get("sender_id", 0)
+                content = body.get("content", "")
+
+                if not content:
+                    self._respond(200, {"ok": True})
+                    return
+
+                samantha.submit(Stimulus(
+                    kind="chat", content=content,
+                    sender_id=sender_id, session_id=session_id,
+                ))
+                self._respond(200, {"ok": True})
+
+            elif self.path == "/hook/post_mention":
+                post_id = body.get("post_id", 0)
+                comment_id = body.get("comment_id", 0)
+                sender_id = body.get("sender_id", 0)
+                title = body.get("title", "")
+                content = body.get("content", "")
+
+                if not post_id and not content:
+                    self._respond(200, {"ok": True})
+                    return
+
+                samantha.submit(Stimulus(
+                    kind="mention",
+                    content=content,
+                    sender_id=sender_id,
+                    post_id=post_id,
+                    comment_id=comment_id,
+                    metadata={"post_title": title},
+                ))
+                self._respond(200, {"ok": True})
+
+            else:
+                self._respond(404, {"error": "not found"})
+
+        def do_GET(self):
+            if self.path == "/health":
+                sessions = list(samantha._sessions.keys())
+                self._respond(200, {"status": "ok", "active_sessions": sessions})
+            else:
+                self._respond(404, {"error": "not found"})
+
+        def _respond(self, code: int, body: dict):
+            self.send_response(code)
+            self.send_header("Content-Type", "application/json")
+            self.end_headers()
+            self.wfile.write(json.dumps(body).encode())
+
+        def log_message(self, fmt, *args):
+            logger.info(fmt, *args)
+
+    return WebhookHandler
+
+
+def run_http_server(samantha: "Samantha", port: int) -> None:
+    """Block forever serving Samantha's HTTP endpoints on 127.0.0.1:{port}."""
+    handler_cls = make_handler(samantha)
+    server = HTTPServer(("127.0.0.1", port), handler_cls)
+    logger.info("Health endpoint on http://127.0.0.1:%d/health", port)
+    server.serve_forever()
@@ -41,19 +41,24 @@ def proactive_loop(samantha: Samantha, interval: int = 300) -> None:
 
 
 def _memory_maintenance(samantha: Samantha) -> None:
-    """Prune stale facts + Dream consolidation across all active sessions."""
+    """Prune stale facts + Dream consolidation across all active sessions.
+
+    Failures here are logged at WARNING rather than DEBUG: if maintenance
+    fails silently, core memory stops updating and stale facts never get
+    pruned, so agent behavior quietly drifts over time.
+    """
     for user_id, sess in list(samantha._sessions.items()):
         try:
             pruned = sess.memory.prune(max_age_days=90, min_access=0)
             if pruned:
                 logger.info("User %d: pruned %d stale memories", user_id, pruned)
         except Exception:
-            logger.debug("Prune failed for user %d", user_id, exc_info=True)
+            logger.warning("Prune failed for user %d", user_id, exc_info=True)
 
         try:
             samantha.dream(user_id, sess)
         except Exception:
-            logger.debug("Dream failed for user %d", user_id, exc_info=True)
+            logger.warning("Dream failed for user %d", user_id, exc_info=True)
 
 
 def _scan_feed(samantha: Samantha, seen: set[int]) -> None:
 
@@ -13,6 +13,7 @@
 import json
 import logging
 import sqlite3
+import threading
 from dataclasses import dataclass
 from datetime import datetime, timezone
 from pathlib import Path
@@ -31,38 +32,108 @@ class Fact(NamedTuple):
     access_count: int
 
 
+class Message(NamedTuple):
+    id: int
+    role: str          # 'user' | 'assistant'
+    content: str
+    session_id: int
+    created_at: str
+
+
+# Schema is idempotent (IF NOT EXISTS everywhere) so every freshly-opened
+# connection can run it safely. That's what makes per-thread connections
+# work without coordination: each thread opens its own, runs the same DDL,
+# and gets the same view of the DB.
+_SCHEMA = """
+    CREATE TABLE IF NOT EXISTS facts (
+        id INTEGER PRIMARY KEY AUTOINCREMENT,
+        content TEXT NOT NULL,
+        category TEXT DEFAULT 'general',
+        created_at TEXT NOT NULL,
+        last_accessed TEXT,
+        access_count INTEGER DEFAULT 0
+    );
+    CREATE VIRTUAL TABLE IF NOT EXISTS facts_fts
+        USING fts5(content, category, content='facts', content_rowid='id');
+
+    CREATE TRIGGER IF NOT EXISTS facts_ai AFTER INSERT ON facts BEGIN
+        INSERT INTO facts_fts(rowid, content, category)
+        VALUES (new.id, new.content, new.category);
+    END;
+    CREATE TRIGGER IF NOT EXISTS facts_ad AFTER DELETE ON facts BEGIN
+        INSERT INTO facts_fts(facts_fts, rowid, content, category)
+        VALUES ('delete', old.id, old.content, old.category);
+    END;
+
+    CREATE TABLE IF NOT EXISTS messages (
+        id INTEGER PRIMARY KEY AUTOINCREMENT,
+        role TEXT NOT NULL,
+        content TEXT NOT NULL,
+        session_id INTEGER DEFAULT 0,
+        created_at TEXT NOT NULL
+    );
+    CREATE VIRTUAL TABLE IF NOT EXISTS messages_fts
+        USING fts5(content, content='messages', content_rowid='id');
+    CREATE INDEX IF NOT EXISTS idx_messages_session
+        ON messages(session_id, created_at);
+
+    CREATE TRIGGER IF NOT EXISTS messages_ai AFTER INSERT ON messages BEGIN
+        INSERT INTO messages_fts(rowid, content)
+        VALUES (new.id, new.content);
+    END;
+    CREATE TRIGGER IF NOT EXISTS messages_ad AFTER DELETE ON messages BEGIN
+        INSERT INTO messages_fts(messages_fts, rowid, content)
+        VALUES ('delete', old.id, old.content);
+    END;
+"""
+
+
 class Memory:
-    """Persistent fact store backed by SQLite FTS5."""
+    """Persistent fact and message store backed by SQLite FTS5.
+
+    Two tables:
+      facts      — LLM-extracted semantic knowledge (the agent's "beliefs")
+      messages   — verbatim turn-by-turn log (the raw conversation)
+
+    Extracted facts are lossy but searchable by concept. Verbatim messages
+    preserve nuance and exact phrasing for recall of specific moments.
+    Recall from both paths is cheap (FTS5) and complementary.
+
+    Threading model
+    ---------------
+    One Memory instance is shared across threads; each thread that touches
+    it opens its own `sqlite3.Connection` stored in a `threading.local`.
+    This matches how the stdlib `sqlite3` module is designed to be used
+    from multi-threaded code: share the database, not the connection.
+
+    SQLite's WAL mode lets readers proceed in parallel with a writer and
+    serializes writers at the file layer, so no Python-level lock is
+    needed — the correctness guarantee comes from SQLite itself.
+    """
 
     def __init__(self, db_path: Path | None = None):
         p = db_path or DEFAULT_DB_PATH
         p.parent.mkdir(parents=True, exist_ok=True)
-        self._conn = sqlite3.connect(str(p))
-        self._conn.execute("PRAGMA journal_mode=WAL")
-        self._init_schema()
-
-    def _init_schema(self) -> None:
-        self._conn.executescript("""
-            CREATE TABLE IF NOT EXISTS facts (
-                id INTEGER PRIMARY KEY AUTOINCREMENT,
-                content TEXT NOT NULL,
-                category TEXT DEFAULT 'general',
-                created_at TEXT NOT NULL,
-                last_accessed TEXT,
-                access_count INTEGER DEFAULT 0
-            );
-            CREATE VIRTUAL TABLE IF NOT EXISTS facts_fts
-                USING fts5(content, category, content='facts', content_rowid='id');
-
-            CREATE TRIGGER IF NOT EXISTS facts_ai AFTER INSERT ON facts BEGIN
-                INSERT INTO facts_fts(rowid, content, category)
-                VALUES (new.id, new.content, new.category);
-            END;
-            CREATE TRIGGER IF NOT EXISTS facts_ad AFTER DELETE ON facts BEGIN
-                INSERT INTO facts_fts(facts_fts, rowid, content, category)
-                VALUES ('delete', old.id, old.content, old.category);
-            END;
-        """)
+        self._path = str(p)
+        self._local = threading.local()
+        # Eager open: if the path is unwritable or the schema fails, surface
+        # the error at construction time rather than on the first operation.
+        self._connect()
+
+    def _connect(self) -> sqlite3.Connection:
+        """Return the current thread's connection, opening it on first use."""
+        conn = getattr(self._local, "conn", None)
+        if conn is None:
+            conn = sqlite3.connect(self._path)
+            conn.execute("PRAGMA journal_mode=WAL")
+            conn.executescript(_SCHEMA)
+            self._local.conn = conn
+        return conn
+
+    @property
+    def _conn(self) -> sqlite3.Connection:
+        """Thread-local connection — lazy-created per thread, never shared."""
+        return self._connect()
 
     def save(self, content: str, category: str = "general") -> int:
         """Store a fact. Returns its id."""
@@ -111,6 +182,59 @@ def count(self) -> int:
         row = self._conn.execute("SELECT COUNT(*) FROM facts").fetchone()
         return row[0] if row else 0
 
+    # ── Verbatim messages ─────────────────────────────────────
+
+    def log_message(self, role: str, content: str, session_id: int = 0) -> int:
+        """Store a verbatim turn. Returns its id."""
+        if not content:
+            return 0
+        now = datetime.now(timezone.utc).isoformat()
+        cur = self._conn.execute(
+            "INSERT INTO messages (role, content, session_id, created_at) "
+            "VALUES (?, ?, ?, ?)",
+            (role, content, session_id, now),
+        )
+        self._conn.commit()
+        return cur.lastrowid  # type: ignore[return-value]
+
+    def search_messages(self, query: str, limit: int = 5) -> list[Message]:
+        """FTS5 search across verbatim messages, ranked by relevance."""
+        if not query.strip():
+            return []
+        rows = self._conn.execute(
+            """
+            SELECT m.id, m.role, m.content, m.session_id, m.created_at
+            FROM messages_fts
+            JOIN messages m ON m.id = messages_fts.rowid
+            WHERE messages_fts MATCH ?
+            ORDER BY messages_fts.rank
+            LIMIT ?
+            """,
+            (query, limit),
+        ).fetchall()
+        return [Message(*r) for r in rows]
+
+    def recent_messages(self, session_id: int = 0, limit: int = 20) -> list[Message]:
+        """Latest messages for a session (or all sessions if session_id=0)."""
+        if session_id:
+            rows = self._conn.execute(
+                "SELECT id, role, content, session_id, created_at "
+                "FROM messages WHERE session_id = ? "
+                "ORDER BY created_at DESC LIMIT ?",
+                (session_id, limit),
+            ).fetchall()
+        else:
+            rows = self._conn.execute(
+                "SELECT id, role, content, session_id, created_at "
+                "FROM messages ORDER BY created_at DESC LIMIT ?",
+                (limit,),
+            ).fetchall()
+        return [Message(*r) for r in rows]
+
+    def message_count(self) -> int:
+        row = self._conn.execute("SELECT COUNT(*) FROM messages").fetchone()
+        return row[0] if row else 0
+
     def prune(self, max_age_days: int = 90, min_access: int = 0) -> int:
         """Remove stale facts. Returns count of deleted rows.
 
@@ -134,7 +258,17 @@ def prune(self, max_age_days: int = 90, min_access: int = 0) -> int:
         return deleted
 
     def close(self) -> None:
-        self._conn.close()
+        """Close the current thread's connection. Best-effort cleanup.
+
+        Connections held by other threads are reclaimed when those threads
+        exit or when the garbage collector runs over their thread-locals.
+        Under WAL every `commit()` is durable, so this cannot cause data
+        loss — it only releases the current thread's file handle.
+        """
+        conn = getattr(self._local, "conn", None)
+        if conn is not None:
+            conn.close()
+            self._local.conn = None
 
 
 # ── Core Memory (MemGPT-inspired) ──────────────────────────────