chore: Remove unnecessary files and folders
Removed: - session.md (user-specific session notes) - migrate_memories.py (one-time migration script) - test_curator.py (test file) - __pycache__/ (Python cache) - tr-compact/ (v1 deprecated) - tr-daily/ (v1 deprecated) - tr-worker/ (empty) - shared/ (empty) - tr-continuous/migrate_add_curated.py - tr-continuous/curator_by_count.py - tr-continuous/curator_turn_based.py - tr-continuous/curator_cron.sh - tr-continuous/turn-curator.service - tr-continuous/README.md (redundant) Remaining core files: - README.md, checklist.md, curator-prompt.md - install.py, push-all.sh, .gitignore - tr-continuous/curator_timer.py - tr-continuous/curator_config.json
This commit is contained in:
Binary file not shown.
@@ -1,187 +0,0 @@
|
|||||||
#!/usr/bin/env python3
|
|
||||||
"""
|
|
||||||
Migrate memories from kimi_memories to memories_tr
|
|
||||||
- Reads from kimi_memories (Qdrant)
|
|
||||||
- Cleans/strips noise (metadata, thinking tags)
|
|
||||||
- Stores to memories_tr (Qdrant)
|
|
||||||
- Keeps original kimi_memories intact
|
|
||||||
"""
|
|
||||||
|
|
||||||
import json
|
|
||||||
import urllib.request
|
|
||||||
import urllib.error
|
|
||||||
from datetime import datetime
|
|
||||||
from typing import List, Dict, Any
|
|
||||||
|
|
||||||
QDRANT_URL = "http://10.0.0.40:6333"
|
|
||||||
SOURCE_COLLECTION = "kimi_memories"
|
|
||||||
TARGET_COLLECTION = "memories_tr"
|
|
||||||
|
|
||||||
def clean_content(text: str) -> str:
    """Strip capture noise (metadata blocks, thinking tags, timestamps) from *text*.

    Returns "" for empty input; otherwise the cleaned, whitespace-trimmed string.
    """
    if not text:
        return ""

    import re  # local import kept to match the original module layout

    # Noise patterns removed outright, applied in order.
    noise_patterns = (
        # "Conversation info (untrusted metadata)" fenced-JSON blocks
        r'Conversation info \(untrusted metadata\):\s*```json\s*\{[\s\S]*?\}\s*```',
        # [thinking: ...] tags
        r'\[thinking:[^\]]*\]',
        # "[Mon 2026-02-24 19:02 CST]" style timestamp markers
        r'\[\w{3} \d{4}-\d{2}-\d{2} \d{2}:\d{2} [A-Z]{3}\]',
    )

    result = text
    for pattern in noise_patterns:
        result = re.sub(pattern, '', result)

    # Collapse runs of 3+ newlines to one blank line, then trim the edges.
    result = re.sub(r'\n{3,}', '\n\n', result)
    return result.strip()
|
|
||||||
|
|
||||||
def get_all_points(collection: str) -> List[Dict]:
    """Scroll through *collection* and return every point (payload + vector).

    Pages through Qdrant's scroll API 100 points at a time. Stops when the
    server returns no points or no next_page_offset, or after a safety cap
    of 1000 iterations (100k points) to guard against a pagination loop.
    On a network/HTTP error the partial result collected so far is returned.
    """
    all_points: List[Dict] = []
    offset = None
    max_iterations = 1000  # safety cap: 1000 * 100 = 100k points max
    iterations = 0

    while iterations < max_iterations:
        iterations += 1
        scroll_data: Dict[str, Any] = {
            "limit": 100,
            "with_payload": True,
            "with_vector": True  # vectors are re-stored as-is during migration
        }

        # Compare against None, not truthiness: a falsy offset (e.g. numeric
        # point id 0) is a valid continuation token and must be sent.
        if offset is not None:
            scroll_data["offset"] = offset

        req = urllib.request.Request(
            f"{QDRANT_URL}/collections/{collection}/points/scroll",
            data=json.dumps(scroll_data).encode(),
            headers={"Content-Type": "application/json"},
            method="POST"
        )

        try:
            with urllib.request.urlopen(req, timeout=60) as response:
                result = json.loads(response.read().decode())
                points = result.get("result", {}).get("points", [])

                if not points:
                    break

                all_points.extend(points)

                offset = result.get("result", {}).get("next_page_offset")
                # None means the server has no more pages; any other value
                # (including falsy ones) is a valid next offset.
                if offset is None:
                    break
        except urllib.error.URLError as e:
            # URLError also covers HTTPError (its subclass), so connection
            # failures no longer crash the migration mid-scroll.
            print(f"Error: {e}")
            break

    return all_points
|
|
||||||
|
|
||||||
def store_points(collection: str, points: List[Dict]) -> int:
    """Upsert *points* into *collection* in batches; return how many stored.

    Batches of 100 are PUT to Qdrant's points endpoint. A failed batch is
    reported and skipped; remaining batches are still attempted, so the
    return value may be less than len(points).
    """
    if not points:
        return 0

    # Batch upload: 100 points per PUT keeps request bodies small.
    batch_size = 100
    stored = 0

    for i in range(0, len(points), batch_size):
        batch = points[i:i+batch_size]

        points_data = {
            "points": batch
        }

        req = urllib.request.Request(
            f"{QDRANT_URL}/collections/{collection}/points",
            data=json.dumps(points_data).encode(),
            headers={"Content-Type": "application/json"},
            method="PUT"
        )

        try:
            with urllib.request.urlopen(req, timeout=60) as response:
                if response.status == 200:
                    stored += len(batch)
        except urllib.error.URLError as e:
            # URLError also covers HTTPError (its subclass), so a refused
            # connection is reported instead of crashing the migration.
            print(f"Error storing batch: {e}")

    return stored
|
|
||||||
|
|
||||||
def migrate_point(point: Dict) -> Dict:
    """Return a copy of *point* with cleaned messages and migration metadata.

    user_message / ai_response are run through clean_content(); every other
    payload field is carried over untouched, plus provenance fields recording
    where the point came from and when it was migrated.
    """
    original_payload = point.get("payload", {})

    # Copy the payload, then overwrite the cleaned/provenance fields.
    migrated_payload = dict(original_payload)
    migrated_payload.update(
        user_message=clean_content(original_payload.get("user_message", "")),
        ai_response=clean_content(original_payload.get("ai_response", "")),
        migrated_from="kimi_memories",
        migrated_at=datetime.now().isoformat(),
    )

    return {
        "id": point.get("id"),
        "vector": point.get("vector"),
        "payload": migrated_payload,
    }
|
|
||||||
|
|
||||||
def main():
    """Drive the migration end-to-end: read, clean, store, verify, report."""
    banner = "=" * 60
    print(banner)
    print("Memory Migration: kimi_memories → memories_tr")
    print(banner)
    print()

    # Step 1: pull every point out of the source collection.
    print(f"📥 Reading from {SOURCE_COLLECTION}...")
    source_points = get_all_points(SOURCE_COLLECTION)
    print(f" Found {len(source_points)} points")

    if not source_points:
        print("❌ No points to migrate")
        return

    # Step 2: scrub capture noise out of each point.
    print(f"\n🧹 Cleaning {len(source_points)} points...")
    cleaned_points = [migrate_point(p) for p in source_points]
    print(f" ✓ Cleaned")

    # Step 3: write the cleaned points into the target collection.
    print(f"\n💾 Storing to {TARGET_COLLECTION}...")
    stored = store_points(TARGET_COLLECTION, cleaned_points)
    print(f" ✓ Stored {stored} points")

    # Step 4: re-read the target to confirm the write landed.
    print(f"\n🔍 Verifying...")
    target_points = get_all_points(TARGET_COLLECTION)
    print(f" Target now has {len(target_points)} points")

    # Step 5: summary and final verdict.
    print()
    print(banner)
    print("Migration Summary:")
    print(f" Source ({SOURCE_COLLECTION}): {len(source_points)} points")
    print(f" Target ({TARGET_COLLECTION}): {len(target_points)} points")
    print(f" Cleaned & migrated: {stored} points")
    print(banner)

    if stored == len(source_points):
        print("\n✅ Migration complete!")
    else:
        print(f"\n⚠️ Warning: Only migrated {stored}/{len(source_points)} points")


if __name__ == "__main__":
    main()
|
|
||||||
494
session.md
494
session.md
@@ -1,494 +0,0 @@
|
|||||||
# TrueRecall v2 - Session Notes
|
|
||||||
|
|
||||||
**Last Updated:** 2026-02-24 19:02 CST
|
|
||||||
**Status:** ✅ Active & Verified
|
|
||||||
**Version:** v2.2 (Timer-based curation deployed)
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Session End (18:09 CST)
|
|
||||||
|
|
||||||
**Reason:** User starting new session
|
|
||||||
|
|
||||||
**Current State:**
|
|
||||||
- Real-time watcher: ✅ Active (capturing live)
|
|
||||||
- Timer curator: ✅ Deployed (every 30 min via cron)
|
|
||||||
- Daily curator: ❌ Removed (replaced by timer)
|
|
||||||
- Total memories: 12,378 (all tagged with `curated: false`)
|
|
||||||
- Gems: 5 (from Feb 18 test)
|
|
||||||
|
|
||||||
**Next session start:** Read this file, then check:
|
|
||||||
```bash
|
|
||||||
# Quick status
|
|
||||||
python3 ~/.openclaw/workspace/.projects/true-recall-v2/tr-continuous/curator_by_count.py --status
|
|
||||||
sudo systemctl status mem-qdrant-watcher
|
|
||||||
curl -s http://<QDRANT_IP>:6333/collections/memories_tr | jq '.result.points_count'
|
|
||||||
```
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Executive Summary
|
|
||||||
|
|
||||||
TrueRecall v2 is a complete memory system with real-time capture, timer-based curation (every 30 minutes as of v2.2, replacing the removed daily batch), and context injection. All components are operational.
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Current State (Verified 18:09 CST)
|
|
||||||
|
|
||||||
### Qdrant Collections
|
|
||||||
|
|
||||||
| Collection | Points | Purpose | Status |
|
|
||||||
|------------|--------|---------|--------|
|
|
||||||
| `memories_tr` | **12,378** | Full text (live capture) | ✅ Active |
|
|
||||||
| `gems_tr` | **5** | Curated gems (injection) | ✅ Active |
|
|
||||||
| `true_recall` | existing | Legacy archive | 📦 Preserved |
|
|
||||||
| `kimi_memories` | 12,223 | Original backup | 📦 Preserved |
|
|
||||||
|
|
||||||
**Note:** All memories tagged with `curated: false` for timer curator.
|
|
||||||
|
|
||||||
### Services
|
|
||||||
|
|
||||||
| Service | Status | Uptime |
|
|
||||||
|---------|--------|--------|
|
|
||||||
| `mem-qdrant-watcher` | ✅ Active | 30+ min |
|
|
||||||
| OpenClaw Gateway | ✅ Running | 2026.2.23 |
|
|
||||||
| memory-qdrant plugin | ✅ Loaded | recall: gems_tr, capture: memories_tr |
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Architecture
|
|
||||||
|
|
||||||
### v2.2: Timer-Based Curation (DEPLOYED)
|
|
||||||
|
|
||||||
**Data Flow:**
|
|
||||||
```
|
|
||||||
┌─────────────────┐ ┌──────────────────────┐ ┌─────────────┐
|
|
||||||
│ OpenClaw Chat │────▶│ Real-Time Watcher │────▶│ memories_tr │
|
|
||||||
│ (Session JSONL)│ │ (Python daemon) │ │ (Qdrant) │
|
|
||||||
└─────────────────┘ └──────────────────────┘ └──────┬──────┘
|
|
||||||
│
|
|
||||||
│ Every 30 min
|
|
||||||
▼
|
|
||||||
┌──────────────────┐
|
|
||||||
│ Timer Curator │
|
|
||||||
│ (cron/qwen3) │
|
|
||||||
└────────┬─────────┘
|
|
||||||
│
|
|
||||||
▼
|
|
||||||
┌──────────────────┐
|
|
||||||
│ gems_tr │
|
|
||||||
│ (Qdrant) │
|
|
||||||
└────────┬─────────┘
|
|
||||||
│
|
|
||||||
Per turn │
|
|
||||||
▼
|
|
||||||
┌──────────────────┐
|
|
||||||
│ memory-qdrant │
|
|
||||||
│ plugin │
|
|
||||||
└──────────────────┘
|
|
||||||
```
|
|
||||||
|
|
||||||
**Key Changes:**
|
|
||||||
- ✅ Replaced daily 2:45 AM batch with 30-minute timer
|
|
||||||
- ✅ All memories tagged `curated: false` on write
|
|
||||||
- ✅ Migration completed for 12,378 existing memories
|
|
||||||
- ✅ No Redis dependency (direct Qdrant only)
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Components
|
|
||||||
|
|
||||||
### Curation Mode: Timer-Based (DEPLOYED v2.2)
|
|
||||||
|
|
||||||
| Setting | Value | Adjustable |
|
|
||||||
|---------|-------|------------|
|
|
||||||
| **Trigger** | Cron timer | ✅ |
|
|
||||||
| **Interval** | 30 minutes | ✅ Config file |
|
|
||||||
| **Batch size** | 100 memories max | ✅ Config file |
|
|
||||||
| **Minimum** | None (0 is OK) | — |
|
|
||||||
|
|
||||||
**Config:** `/tr-continuous/curator_config.json`
|
|
||||||
```json
|
|
||||||
{
|
|
||||||
"timer_minutes": 30,
|
|
||||||
"max_batch_size": 100,
|
|
||||||
"user_id": "rob",
|
|
||||||
"source_collection": "memories_tr",
|
|
||||||
"target_collection": "gems_tr"
|
|
||||||
}
|
|
||||||
```
|
|
||||||
|
|
||||||
**Cron:**
|
|
||||||
```
|
|
||||||
*/30 * * * * cd .../tr-continuous && python3 curator_timer.py
|
|
||||||
```
|
|
||||||
|
|
||||||
**Old modes deprecated:**
|
|
||||||
- ❌ Turn-based (every N turns)
|
|
||||||
- ❌ Hybrid (timer + turn)
|
|
||||||
- ❌ Daily batch (2:45 AM)
|
|
||||||
|
|
||||||
### 1. Real-Time Watcher (Primary Capture)
|
|
||||||
|
|
||||||
**Location:** `~/.openclaw/workspace/skills/qdrant-memory/scripts/realtime_qdrant_watcher.py`
|
|
||||||
|
|
||||||
**Function:**
|
|
||||||
- Watches `~/.openclaw/agents/main/sessions/*.jsonl`
|
|
||||||
- Parses every conversation turn in real-time
|
|
||||||
- Embeds with `snowflake-arctic-embed2` (Ollama @ <OLLAMA_IP>)
|
|
||||||
- Stores directly to `memories_tr` (no Redis)
|
|
||||||
- **Cleans content:** Removes markdown, tables, metadata, thinking tags
|
|
||||||
|
|
||||||
**Service:** `mem-qdrant-watcher.service`
|
|
||||||
- **Status:** Active since 16:46:53 CST
|
|
||||||
- **Systemd:** Enabled, auto-restart
|
|
||||||
|
|
||||||
**Log:** `journalctl -u mem-qdrant-watcher -f`
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
### 2. Content Cleaner (Existing Data)
|
|
||||||
|
|
||||||
**Location:** `~/.openclaw/workspace/skills/qdrant-memory/scripts/clean_memories_tr.py`
|
|
||||||
|
|
||||||
**Function:**
|
|
||||||
- Batch-cleans existing `memories_tr` points
|
|
||||||
- Removes: `**bold**`, `|tables|`, `` `code` ``, `---` rules, `# headers`
|
|
||||||
- Flattens nested content dicts
|
|
||||||
- Rate-limited to prevent Qdrant overload
|
|
||||||
|
|
||||||
**Usage:**
|
|
||||||
```bash
|
|
||||||
# Dry run (preview)
|
|
||||||
python3 clean_memories_tr.py --dry-run
|
|
||||||
|
|
||||||
# Clean all
|
|
||||||
python3 clean_memories_tr.py --execute
|
|
||||||
|
|
||||||
# Clean limited (test)
|
|
||||||
python3 clean_memories_tr.py --execute --limit 100
|
|
||||||
```
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
### 3. Timer Curator (v2.2 - DEPLOYED)
|
|
||||||
|
|
||||||
**Replaces:** Daily curator (2:45 AM batch) and turn-based curator
|
|
||||||
|
|
||||||
**Location:** `~/.openclaw/workspace/.projects/true-recall-v2/tr-continuous/curator_timer.py`
|
|
||||||
|
|
||||||
**Schedule:** Every 30 minutes (cron)
|
|
||||||
|
|
||||||
**Flow:**
|
|
||||||
1. Query uncurated memories (`curated: false`)
|
|
||||||
2. Send batch to qwen3 (max 100)
|
|
||||||
3. Extract gems using curator prompt
|
|
||||||
4. Store gems to `gems_tr`
|
|
||||||
5. Mark processed memories as `curated: true`
|
|
||||||
|
|
||||||
**Files:**
|
|
||||||
| File | Purpose |
|
|
||||||
|------|---------|
|
|
||||||
| `curator_timer.py` | Main curator script |
|
|
||||||
| `curator_config.json` | Adjustable settings |
|
|
||||||
| `migrate_add_curated.py` | One-time migration (completed) |
|
|
||||||
|
|
||||||
**Usage:**
|
|
||||||
```bash
|
|
||||||
# Dry run (preview)
|
|
||||||
python3 curator_timer.py --dry-run
|
|
||||||
|
|
||||||
# Manual run
|
|
||||||
python3 curator_timer.py --config curator_config.json
|
|
||||||
```
|
|
||||||
|
|
||||||
**Status:** ✅ Deployed, first run will process ~12,378 existing memories
|
|
||||||
|
|
||||||
### 5. Silent Compacting (NEW - Concept)
|
|
||||||
|
|
||||||
**Idea:** Automatically remove old context from prompt when token limit approached.
|
|
||||||
|
|
||||||
**Behavior:**
|
|
||||||
- Trigger: Context window > 80% full
|
|
||||||
- Action: Remove oldest messages (silently)
|
|
||||||
- Preserve: Gems always kept, recent N turns kept
|
|
||||||
- Result: Seamless conversation without "compacting" notification
|
|
||||||
|
|
||||||
**Config:**
|
|
||||||
```json
|
|
||||||
{
|
|
||||||
"compacting": {
|
|
||||||
"enabled": true,
|
|
||||||
"triggerAtPercent": 80,
|
|
||||||
"keepRecentTurns": 20,
|
|
||||||
"preserveGems": true,
|
|
||||||
"silent": true
|
|
||||||
}
|
|
||||||
}
|
|
||||||
```
|
|
||||||
|
|
||||||
**Status:** ⏳ Concept only - requires OpenClaw core changes
|
|
||||||
|
|
||||||
### 6. memory-qdrant Plugin
|
|
||||||
|
|
||||||
**Location:** `~/.openclaw/extensions/memory-qdrant/`
|
|
||||||
|
|
||||||
**Config:**
|
|
||||||
```json
|
|
||||||
{
|
|
||||||
"collectionName": "gems_tr",
|
|
||||||
"captureCollection": "memories_tr",
|
|
||||||
"autoRecall": true,
|
|
||||||
"autoCapture": true
|
|
||||||
}
|
|
||||||
```
|
|
||||||
|
|
||||||
**Function:**
|
|
||||||
- **Recall:** Searches `gems_tr`, injects as context (hidden)
|
|
||||||
- **Capture:** Session-level capture to `memories_tr` (backup)
|
|
||||||
|
|
||||||
**Status:** Loaded, dual collection support working
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Files & Locations
|
|
||||||
|
|
||||||
### Core Project Files
|
|
||||||
|
|
||||||
```
|
|
||||||
~/.openclaw/workspace/.projects/true-recall-v2/
|
|
||||||
├── README.md # Architecture docs
|
|
||||||
├── session.md # This file
|
|
||||||
├── curator-prompt.md # Gem extraction prompt
|
|
||||||
├── tr-daily/ # Daily batch curation
|
|
||||||
│ └── curate_from_qdrant.py # Daily curator (2:45 AM)
|
|
||||||
├── tr-continuous/ # Real-time curation (NEW)
|
|
||||||
│ ├── curator_by_count.py # Turn-based curator
|
|
||||||
│ ├── curator_turn_based.py # Alternative approach
|
|
||||||
│ ├── curator_cron.sh # Cron wrapper
|
|
||||||
│ ├── turn-curator.service # Systemd service
|
|
||||||
│ └── README.md # Documentation
|
|
||||||
└── shared/
|
|
||||||
└── (shared resources)
|
|
||||||
```
|
|
||||||
|
|
||||||
### New Files (2026-02-24 19:00)
|
|
||||||
|
|
||||||
| File | Purpose |
|
|
||||||
|------|---------|
|
|
||||||
| `tr-continuous/curator_timer.py` | Timer-based curator (deployed) |
|
|
||||||
| `tr-continuous/curator_config.json` | Curator settings |
|
|
||||||
| `tr-continuous/migrate_add_curated.py` | Migration script (completed) |
|
|
||||||
|
|
||||||
### Legacy Files (Pre-v2.2)
|
|
||||||
|
|
||||||
| File | Status | Note |
|
|
||||||
|------|--------|------|
|
|
||||||
| `tr-daily/curate_from_qdrant.py` | 📦 Archived | Replaced by timer |
|
|
||||||
| `tr-continuous/curator_by_count.py` | 📦 Archived | Replaced by timer |
|
|
||||||
| `tr-continuous/curator_turn_based.py` | 📦 Archived | Replaced by timer |
|
|
||||||
|
|
||||||
### System Locations
|
|
||||||
|
|
||||||
| File | Purpose |
|
|
||||||
|------|---------|
|
|
||||||
| `~/.openclaw/extensions/memory-qdrant/` | Plugin code |
|
|
||||||
| `~/.openclaw/openclaw.json` | Plugin configuration |
|
|
||||||
| `/etc/systemd/system/mem-qdrant-watcher.service` | Systemd service |
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Changes Made Today (2026-02-24 19:00)
|
|
||||||
|
|
||||||
### 1. Timer Curator Deployed (v2.2)
|
|
||||||
|
|
||||||
- Created `curator_timer.py` — simplified timer-based curation
|
|
||||||
- Created `curator_config.json` — adjustable settings
|
|
||||||
- Removed daily 2:45 AM cron job
|
|
||||||
- Added `*/30 * * * *` cron timer
|
|
||||||
- **Status:** ✅ Deployed, logs to `/var/log/true-recall-timer.log`
|
|
||||||
|
|
||||||
### 2. Migration Completed
|
|
||||||
|
|
||||||
- Created `migrate_add_curated.py`
|
|
||||||
- Tagged 12,378 existing memories with `curated: false`
|
|
||||||
- Updated watcher to add `curated: false` to new memories
|
|
||||||
- **Status:** ✅ Complete
|
|
||||||
|
|
||||||
### 3. Simplified Architecture
|
|
||||||
|
|
||||||
- ❌ Removed turn-based curator complexity
|
|
||||||
- ❌ Removed daily batch processing
|
|
||||||
- ✅ Single timer trigger every 30 minutes
|
|
||||||
- ✅ No minimum threshold (processes 0-N memories)
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Configuration
|
|
||||||
|
|
||||||
### memory-qdrant Plugin
|
|
||||||
|
|
||||||
**File:** `~/.openclaw/openclaw.json`
|
|
||||||
|
|
||||||
```json
|
|
||||||
{
|
|
||||||
"memory-qdrant": {
|
|
||||||
"config": {
|
|
||||||
"autoCapture": true,
|
|
||||||
"autoRecall": true,
|
|
||||||
"collectionName": "gems_tr",
|
|
||||||
"captureCollection": "memories_tr",
|
|
||||||
"embeddingModel": "snowflake-arctic-embed2",
|
|
||||||
"maxRecallResults": 2,
|
|
||||||
"minRecallScore": 0.7,
|
|
||||||
"ollamaUrl": "http://<OLLAMA_IP>:11434",
|
|
||||||
"qdrantUrl": "http://<QDRANT_IP>:6333"
|
|
||||||
},
|
|
||||||
"enabled": true
|
|
||||||
}
|
|
||||||
}
|
|
||||||
```
|
|
||||||
|
|
||||||
### Gateway (OpenClaw Update Fix)
|
|
||||||
|
|
||||||
```json
|
|
||||||
{
|
|
||||||
"gateway": {
|
|
||||||
"controlUi": {
|
|
||||||
"allowedOrigins": ["*"],
|
|
||||||
"allowInsecureAuth": false,
|
|
||||||
"dangerouslyDisableDeviceAuth": true
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
```
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Validation Commands
|
|
||||||
|
|
||||||
### Check Collections
|
|
||||||
|
|
||||||
```bash
|
|
||||||
# Points count
|
|
||||||
curl -s http://<QDRANT_IP>:6333/collections/memories_tr | jq '.result.points_count'
|
|
||||||
curl -s http://<QDRANT_IP>:6333/collections/gems_tr | jq '.result.points_count'
|
|
||||||
|
|
||||||
# Recent points
|
|
||||||
curl -s -X POST http://<QDRANT_IP>:6333/collections/memories_tr/points/scroll \
|
|
||||||
-H "Content-Type: application/json" \
|
|
||||||
-d '{"limit": 5, "with_payload": true}' | jq '.result.points[].payload.content'
|
|
||||||
```
|
|
||||||
|
|
||||||
### Check Services
|
|
||||||
|
|
||||||
```bash
|
|
||||||
# Watcher status
|
|
||||||
sudo systemctl status mem-qdrant-watcher
|
|
||||||
|
|
||||||
# Watcher logs
|
|
||||||
sudo journalctl -u mem-qdrant-watcher -n 20
|
|
||||||
|
|
||||||
# OpenClaw status
|
|
||||||
openclaw status
|
|
||||||
```
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Troubleshooting
|
|
||||||
|
|
||||||
### Issue: Watcher Not Capturing
|
|
||||||
|
|
||||||
**Check:**
|
|
||||||
1. Service running? `systemctl status mem-qdrant-watcher`
|
|
||||||
2. Logs: `journalctl -u mem-qdrant-watcher -f`
|
|
||||||
3. Qdrant accessible? `curl http://<QDRANT_IP>:6333/`
|
|
||||||
4. Ollama accessible? `curl http://<OLLAMA_IP>:11434/api/tags`
|
|
||||||
|
|
||||||
### Issue: Cleaner Fails
|
|
||||||
|
|
||||||
**Common causes:**
|
|
||||||
- Qdrant connection timeout (add `time.sleep(0.1)` between batches)
|
|
||||||
- Nested content dicts (handled in updated script)
|
|
||||||
- Type errors (non-string content — handled)
|
|
||||||
|
|
||||||
### Issue: Plugin Not Loading
|
|
||||||
|
|
||||||
**Check:**
|
|
||||||
1. `openclaw.json` syntax valid? `openclaw config validate`
|
|
||||||
2. Plugin compiled? `cd ~/.openclaw/extensions/memory-qdrant && npx tsc`
|
|
||||||
3. Gateway logs: `tail /tmp/openclaw/openclaw-$(date +%Y-%m-%d).log`
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Cron Schedule (Updated v2.2)
|
|
||||||
|
|
||||||
| Time | Job | Script | Status |
|
|
||||||
|------|-----|--------|--------|
|
|
||||||
| Every 30 min | Timer curator | `tr-continuous/curator_timer.py` | ✅ Active |
|
|
||||||
| Per turn | Capture | `mem-qdrant-watcher` | ✅ Daemon |
|
|
||||||
| Per turn | Injection | `memory-qdrant` plugin | ✅ Active |
|
|
||||||
|
|
||||||
**Removed:**
|
|
||||||
- ❌ 2:45 AM daily curator
|
|
||||||
- ❌ Every-minute turn curator check
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Next Steps
|
|
||||||
|
|
||||||
### Immediate
|
|
||||||
- ⏳ Monitor first timer run (logs: `/var/log/true-recall-timer.log`)
|
|
||||||
- ⏳ Validate gem extraction quality from timer curator
|
|
||||||
- ⏳ Archive old curator scripts if timer works
|
|
||||||
|
|
||||||
### Completed ✅
|
|
||||||
- ✅ **Compactor config** — Minimal overhead: `mode: default`, `reserveTokensFloor: 0`, `memoryFlush: false`
|
|
||||||
|
|
||||||
### Future
|
|
||||||
- ⏳ Curator tuning based on timer results
|
|
||||||
- ⏳ Silent compacting (requires OpenClaw core changes)
|
|
||||||
|
|
||||||
### Planned Features (Backlog)
|
|
||||||
- ⏳ **Interactive install script** — Prompts for embedding model, timer interval, batch size, endpoints
|
|
||||||
- ⏳ **Single embedding model option** — Use one model for both collections
|
|
||||||
- ⏳ **Configurable thresholds** — Per-user customization via prompts
|
|
||||||
|
|
||||||
**Compactor Settings (Applied):**
|
|
||||||
```json5
|
|
||||||
{
|
|
||||||
agents: {
|
|
||||||
defaults: {
|
|
||||||
compaction: {
|
|
||||||
mode: "default",
|
|
||||||
reserveTokensFloor: 0,
|
|
||||||
memoryFlush: { enabled: false }
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
```
|
|
||||||
|
|
||||||
**Note:** Only `mode`, `reserveTokensFloor`, and `memoryFlush` are valid under `agents.defaults.compaction`. Other settings are Pi runtime parameters.
|
|
||||||
|
|
||||||
**Install script prompts:**
|
|
||||||
1. Embedding model (snowflake vs mxbai)
|
|
||||||
2. Timer interval (5 min / 30 min / hourly)
|
|
||||||
3. Batch size (50 / 100 / 500)
|
|
||||||
4. Qdrant/Ollama URLs
|
|
||||||
5. User ID
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
## Session Recovery
|
|
||||||
|
|
||||||
If starting fresh:
|
|
||||||
1. Read `README.md` for architecture overview
|
|
||||||
2. Check service status: `sudo systemctl status mem-qdrant-watcher`
|
|
||||||
3. Check timer curator: `tail /var/log/true-recall-timer.log`
|
|
||||||
4. Verify collections: `curl http://<QDRANT_IP>:6333/collections`
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
*Last Verified: 2026-02-24 19:29 CST*
|
|
||||||
*Version: v2.2 (30b curator, install script planned)*
|
|
||||||
@@ -1,64 +0,0 @@
|
|||||||
#!/usr/bin/env python3
"""Quick test of curator with simple input"""
import json
import requests

# System prompt: reuse the gem-extraction prompt shipped with v1.
with open('/root/.openclaw/workspace/.projects/true-recall-v1/curator-prompt.md') as f:
    prompt = f.read()

# Two-turn fixture conversation covering the Redis -> Qdrant decision.
turn_one = {
    'turn': 1,
    'user_id': 'rob',
    'user': 'I want to switch from Redis to Qdrant for memory storage',
    'ai': 'Got it - Qdrant is a good choice for vector storage.',
    'conversation_id': 'test123',
    'timestamp': '2026-02-23T10:00:00',
    'date': '2026-02-23',
}
turn_two = {
    'turn': 2,
    'user_id': 'rob',
    'user': 'Yes, and I want the curator to read from Qdrant directly',
    'ai': 'Makes sense - we can modify the curator to query Qdrant instead of Redis.',
    'conversation_id': 'test123',
    'timestamp': '2026-02-23T10:01:00',
    'date': '2026-02-23',
}

conversation_json = json.dumps([turn_one, turn_two], indent=2)

prompt_text = f"""## Input Conversation

```json
{conversation_json}
```

## Output
"""

# One-shot, non-streaming generation against the local Ollama instance.
response = requests.post(
    'http://10.0.0.10:11434/api/generate',
    json={
        'model': 'qwen3:4b-instruct',
        'system': prompt,
        'prompt': prompt_text,
        'stream': False,
        'options': {'temperature': 0.1, 'num_predict': 2000},
    },
    timeout=120,
)

output = response.json().get('response', '').strip()
print('=== RAW OUTPUT ===')
print(output[:2000])
print()
print('=== PARSED ===')
# Pull the fenced JSON body out of the model reply, if present.
if '```json' in output:
    parsed = output.split('```json')[1].split('```')[0].strip()
    print(parsed)
|
|
||||||
@@ -1,105 +0,0 @@
|
|||||||
#!/usr/bin/env python3
|
|
||||||
"""
|
|
||||||
TrueRecall v2 - Compaction Hook
|
|
||||||
Fast Redis queue push for compaction events
|
|
||||||
|
|
||||||
Called by OpenClaw session_before_compact hook
|
|
||||||
"""
|
|
||||||
|
|
||||||
import json
|
|
||||||
import sys
|
|
||||||
import redis
|
|
||||||
from datetime import datetime
|
|
||||||
from typing import List, Dict, Any
|
|
||||||
|
|
||||||
# Redis config
|
|
||||||
REDIS_HOST = "10.0.0.36"
|
|
||||||
REDIS_PORT = 6379
|
|
||||||
REDIS_DB = 0
|
|
||||||
QUEUE_KEY = "tr:compact_queue"
|
|
||||||
TAG_PREFIX = "tr:processed"
|
|
||||||
|
|
||||||
def get_redis_client():
    """Return a Redis client for the configured host/port/db.

    decode_responses=True so values come back as str rather than bytes.
    """
    connection_kwargs = {
        "host": REDIS_HOST,
        "port": REDIS_PORT,
        "db": REDIS_DB,
        "decode_responses": True,
    }
    return redis.Redis(**connection_kwargs)
|
|
||||||
|
|
||||||
def tag_turns(messages: List[Dict], user_id: str = "rob"):
    """Tag each turn as processed in Redis so the v1 daily curator skips it.

    One SETEX per message under tr:processed:<conversation_id>:<turn>, with a
    24-hour TTL, all issued in a single pipeline round-trip.
    """
    pipe = get_redis_client().pipeline()

    for msg in messages:
        conversation = msg.get("conversation_id", "unknown")
        turn_number = msg.get("turn", 0)
        pipe.setex(f"{TAG_PREFIX}:{conversation}:{turn_number}", 86400, "1")  # 24h TTL

    pipe.execute()
|
|
||||||
|
|
||||||
def queue_messages(messages: List[Dict], user_id: str = "rob"):
    """Push one envelope holding *messages* onto the Redis work queue.

    LPUSH puts the newest envelope at the head of the list for the
    background worker. Returns the number of messages queued.
    """
    envelope = {
        "user_id": user_id,
        "timestamp": datetime.now().isoformat(),
        "message_count": len(messages),
        "messages": messages,
    }

    # LPUSH to queue (newest first)
    get_redis_client().lpush(QUEUE_KEY, json.dumps(envelope))

    return len(messages)
|
|
||||||
|
|
||||||
def process_compaction_event(event_data: Dict):
    """
    Process a session_before_compact event from OpenClaw.

    Expected event_data:
    {
        "session_id": "uuid",
        "user_id": "rob",
        "messages_being_compacted": [
            {"role": "user", "content": "...", "turn": 1, "conversation_id": "..."},
            ...
        ],
        "compaction_reason": "context_limit"
    }

    Returns a small status dict; never raises for the empty-message case.
    """
    user_id = event_data.get("user_id", "rob")
    messages = event_data.get("messages_being_compacted", [])

    # Nothing being compacted: report success without touching Redis.
    if not messages:
        return {"status": "ok", "queued": 0, "reason": "no_messages"}

    # Tag first so the v1 daily curator won't double-process these turns,
    # then hand the batch to the background worker queue.
    tag_turns(messages, user_id)
    queued_count = queue_messages(messages, user_id)

    return {
        "status": "ok",
        "queued": queued_count,
        "user_id": user_id,
        "queue_key": QUEUE_KEY,
    }
|
|
||||||
|
|
||||||
def main():
    """CLI entry point: read a JSON event from stdin, print a JSON result.

    Exits 0 on success and 1 on any failure (bad JSON, Redis errors, ...),
    emitting a single JSON object on stdout either way.
    """
    try:
        event = json.load(sys.stdin)
        outcome = process_compaction_event(event)
        print(json.dumps(outcome))
        sys.exit(0)
    except Exception as exc:  # top-level boundary: report as JSON, exit nonzero
        print(json.dumps({"status": "error", "error": str(exc)}))
        sys.exit(1)


if __name__ == "__main__":
    main()
|
|
||||||
@@ -1,101 +0,0 @@
|
|||||||
# Turn-Based Curator
|
|
||||||
|
|
||||||
Extract gems every N turns instead of waiting for daily curation.
|
|
||||||
|
|
||||||
## Files
|
|
||||||
|
|
||||||
| File | Purpose |
|
|
||||||
|------|---------|
|
|
||||||
| `curator_turn_based.py` | Main script - checks turn count, extracts gems |
|
|
||||||
| `curator_cron.sh` | Cron wrapper to run every minute |
|
|
||||||
| `turn-curator.service` | Alternative systemd service (runs on-demand) |
|
|
||||||
|
|
||||||
## Usage
|
|
||||||
|
|
||||||
### Manual Run
|
|
||||||
|
|
||||||
```bash
|
|
||||||
# Check current status
|
|
||||||
python3 curator_turn_based.py --status
|
|
||||||
|
|
||||||
# Preview what would be curated
|
|
||||||
python3 curator_turn_based.py --threshold 10 --dry-run
|
|
||||||
|
|
||||||
# Execute curation
|
|
||||||
python3 curator_turn_based.py --threshold 10 --execute
|
|
||||||
```
|
|
||||||
|
|
||||||
### Automatic (Cron)
|
|
||||||
|
|
||||||
Add to crontab:
|
|
||||||
```bash
|
|
||||||
* * * * * /root/.openclaw/workspace/.projects/true-recall-v2/tr-continuous/curator_cron.sh
|
|
||||||
```
|
|
||||||
|
|
||||||
Or use systemd timer:
|
|
||||||
```bash
|
|
||||||
sudo cp turn-curator.service /etc/systemd/system/
|
|
||||||
sudo systemctl enable turn-curator.timer # If you create a timer
|
|
||||||
```
|
|
||||||
|
|
||||||
### Automatic (Integrated)
|
|
||||||
|
|
||||||
Alternative: Modify `realtime_qdrant_watcher.py` to trigger curation every 10 turns.
|
|
||||||
|
|
||||||
## How It Works
|
|
||||||
|
|
||||||
1. **Tracks turn count** - Stores last curation turn in `/tmp/curator_turn_state.json`
|
|
||||||
2. **Monitors delta** - Compares current turn count vs last curation
|
|
||||||
3. **Triggers at threshold** - When 10+ new turns exist, runs curation
|
|
||||||
4. **Extracts gems** - Sends conversation to qwen3, gets gems
|
|
||||||
5. **Stores results** - Saves gems to `gems_tr` collection
|
|
||||||
|
|
||||||
## State File
|
|
||||||
|
|
||||||
`/tmp/curator_turn_state.json`:
|
|
||||||
```json
|
|
||||||
{
|
|
||||||
"last_turn": 150,
|
|
||||||
"last_curation": "2026-02-24T17:00:00Z"
|
|
||||||
}
|
|
||||||
```
|
|
||||||
|
|
||||||
## Comparison with Daily Curator
|
|
||||||
|
|
||||||
| Feature | Daily Curator | Turn-Based Curator |
|
|
||||||
|---------|--------------|-------------------|
|
|
||||||
| Schedule | 2:45 AM daily | Every 10 turns (dynamic) |
|
|
||||||
| Time window | 24 hours | Variable (depends on chat frequency) |
|
|
||||||
| Trigger | Cron | Turn threshold |
|
|
||||||
| Use case | Nightly batch | Real-time-ish extraction |
|
|
||||||
| Overlap | Low | Possible with daily curator |
|
|
||||||
|
|
||||||
## Recommendation
|
|
||||||
|
|
||||||
Use **BOTH**:
|
|
||||||
- **Turn-based**: Every 10 turns for active conversations
|
|
||||||
- **Daily**: 2:45 AM as backup/catch-all
|
|
||||||
|
|
||||||
They'll deduplicate automatically (same embeddings → skipped).
|
|
||||||
|
|
||||||
## Testing
|
|
||||||
|
|
||||||
```bash
|
|
||||||
# Simulate 10 turns
|
|
||||||
for i in {1..10}; do
|
|
||||||
echo "Test message $i" > /dev/null
|
|
||||||
done
|
|
||||||
|
|
||||||
# Check status
|
|
||||||
python3 curator_turn_based.py --status
|
|
||||||
|
|
||||||
# Run manually
|
|
||||||
python3 curator_turn_based.py --threshold 10 --execute
|
|
||||||
```
|
|
||||||
|
|
||||||
## Status
|
|
||||||
|
|
||||||
- ✅ Script created: `curator_turn_based.py`
|
|
||||||
- ✅ Cron wrapper: `curator_cron.sh`
|
|
||||||
- ⏳ Deployment: Optional (manual or cron)
|
|
||||||
- ⏳ Testing: Pending
|
|
||||||
@@ -1,194 +0,0 @@
|
|||||||
#!/usr/bin/env python3
|
|
||||||
"""
|
|
||||||
Turn-Based Curator: Extract gems every N new memories (turns).
|
|
||||||
|
|
||||||
Usage:
|
|
||||||
python3 curator_by_count.py --threshold 10 --dry-run
|
|
||||||
python3 curator_by_count.py --threshold 10 --execute
|
|
||||||
python3 curator_by_count.py --status
|
|
||||||
"""
|
|
||||||
|
|
||||||
import argparse
|
|
||||||
import json
|
|
||||||
import requests
|
|
||||||
import sys
|
|
||||||
from datetime import datetime, timezone, timedelta
|
|
||||||
from pathlib import Path
|
|
||||||
|
|
||||||
QDRANT_URL = "http://10.0.0.40:6333"
|
|
||||||
MEMORIES = "memories_tr"
|
|
||||||
GEMS = "gems_tr"
|
|
||||||
OLLAMA = "http://10.0.0.10:11434"
|
|
||||||
MODEL = "ollama-remote/qwen3:30b-a3b-instruct-2507-q8_0"
|
|
||||||
STATE_FILE = Path("/tmp/curator_count_state.json")
|
|
||||||
|
|
||||||
def load_state():
|
|
||||||
if STATE_FILE.exists():
|
|
||||||
with open(STATE_FILE) as f:
|
|
||||||
return json.load(f)
|
|
||||||
return {"last_count": 0, "last_time": None}
|
|
||||||
|
|
||||||
def save_state(state):
|
|
||||||
with open(STATE_FILE, 'w') as f:
|
|
||||||
json.dump(state, f)
|
|
||||||
|
|
||||||
def get_total_count():
|
|
||||||
try:
|
|
||||||
r = requests.get(f"{QDRANT_URL}/collections/{MEMORIES}", timeout=10)
|
|
||||||
return r.json()["result"]["points_count"]
|
|
||||||
except:
|
|
||||||
return 0
|
|
||||||
|
|
||||||
def get_recent_memories(hours=1):
|
|
||||||
"""Get memories from last N hours."""
|
|
||||||
since = (datetime.now(timezone.utc) - timedelta(hours=hours)).isoformat()
|
|
||||||
try:
|
|
||||||
r = requests.post(
|
|
||||||
f"{QDRANT_URL}/collections/{MEMORIES}/points/scroll",
|
|
||||||
json={"limit": 1000, "with_payload": True},
|
|
||||||
timeout=30
|
|
||||||
)
|
|
||||||
points = r.json()["result"]["points"]
|
|
||||||
# Filter by timestamp
|
|
||||||
recent = [p for p in points if p.get("payload", {}).get("timestamp", "") > since]
|
|
||||||
return recent
|
|
||||||
except:
|
|
||||||
return []
|
|
||||||
|
|
||||||
def extract_gems(memories):
|
|
||||||
"""Send to LLM for gem extraction."""
|
|
||||||
if not memories:
|
|
||||||
return []
|
|
||||||
|
|
||||||
# Build conversation
|
|
||||||
parts = []
|
|
||||||
for m in memories:
|
|
||||||
role = m["payload"].get("role", "unknown")
|
|
||||||
content = m["payload"].get("content", "")[:500] # Limit per message
|
|
||||||
parts.append(f"{role.upper()}: {content}")
|
|
||||||
|
|
||||||
conversation = "\n\n".join(parts[:20]) # Max 20 messages
|
|
||||||
|
|
||||||
prompt = f"""Extract 3-5 key gems (insights, decisions, facts) from this conversation.
|
|
||||||
|
|
||||||
Conversation:
|
|
||||||
{conversation}
|
|
||||||
|
|
||||||
Return JSON: [{{"text": "gem", "category": "decision|fact|preference"}}]"""
|
|
||||||
|
|
||||||
try:
|
|
||||||
r = requests.post(
|
|
||||||
f"{OLLAMA}/v1/chat/completions",
|
|
||||||
json={
|
|
||||||
"model": MODEL,
|
|
||||||
"messages": [{"role": "user", "content": prompt}],
|
|
||||||
"temperature": 0.3
|
|
||||||
},
|
|
||||||
timeout=120
|
|
||||||
)
|
|
||||||
content = r.json()["choices"][0]["message"]["content"]
|
|
||||||
|
|
||||||
# Parse JSON
|
|
||||||
start = content.find('[')
|
|
||||||
end = content.rfind(']')
|
|
||||||
if start >= 0 and end > start:
|
|
||||||
return json.loads(content[start:end+1])
|
|
||||||
except:
|
|
||||||
pass
|
|
||||||
return []
|
|
||||||
|
|
||||||
def store_gem(gem):
|
|
||||||
"""Store gem to gems_tr."""
|
|
||||||
try:
|
|
||||||
# Get embedding
|
|
||||||
r = requests.post(
|
|
||||||
f"{OLLAMA}/api/embeddings",
|
|
||||||
json={"model": "snowflake-arctic-embed2", "prompt": gem["text"]},
|
|
||||||
timeout=30
|
|
||||||
)
|
|
||||||
vector = r.json()["embedding"]
|
|
||||||
|
|
||||||
# Store
|
|
||||||
r = requests.put(
|
|
||||||
f"{QDRANT_URL}/collections/{GEMS}/points",
|
|
||||||
json={
|
|
||||||
"points": [{
|
|
||||||
"id": abs(hash(gem["text"])) % (2**63),
|
|
||||||
"vector": vector,
|
|
||||||
"payload": {
|
|
||||||
"text": gem["text"],
|
|
||||||
"category": gem.get("category", "other"),
|
|
||||||
"createdAt": datetime.now(timezone.utc).isoformat(),
|
|
||||||
"source": "turn_curator"
|
|
||||||
}
|
|
||||||
}]
|
|
||||||
},
|
|
||||||
timeout=30
|
|
||||||
)
|
|
||||||
return r.status_code == 200
|
|
||||||
except:
|
|
||||||
return False
|
|
||||||
|
|
||||||
def main():
|
|
||||||
parser = argparse.ArgumentParser()
|
|
||||||
parser.add_argument("--threshold", "-t", type=int, default=10)
|
|
||||||
parser.add_argument("--execute", "-e", action="store_true")
|
|
||||||
parser.add_argument("--dry-run", "-n", action="store_true")
|
|
||||||
parser.add_argument("--status", "-s", action="store_true")
|
|
||||||
args = parser.parse_args()
|
|
||||||
|
|
||||||
state = load_state()
|
|
||||||
current = get_total_count()
|
|
||||||
new_points = current - state.get("last_count", 0)
|
|
||||||
|
|
||||||
if args.status:
|
|
||||||
print(f"Total memories: {current}")
|
|
||||||
print(f"Last curated: {state.get('last_count', 0)}")
|
|
||||||
print(f"New since last: {new_points}")
|
|
||||||
print(f"Threshold: {args.threshold}")
|
|
||||||
print(f"Ready: {'YES' if new_points >= args.threshold else 'NO'}")
|
|
||||||
return
|
|
||||||
|
|
||||||
print(f"Curator: {new_points} new / {args.threshold} threshold")
|
|
||||||
|
|
||||||
if new_points < args.threshold:
|
|
||||||
print("Not enough new memories")
|
|
||||||
return
|
|
||||||
|
|
||||||
# Get recent memories (last hour should cover the new points)
|
|
||||||
memories = get_recent_memories(hours=1)
|
|
||||||
print(f"Fetched {len(memories)} recent memories")
|
|
||||||
|
|
||||||
if not memories:
|
|
||||||
print("No memories to process")
|
|
||||||
return
|
|
||||||
|
|
||||||
if args.dry_run:
|
|
||||||
print(f"[DRY RUN] Would process {len(memories)} memories")
|
|
||||||
return
|
|
||||||
|
|
||||||
if not args.execute:
|
|
||||||
print("Use --execute to run or --dry-run to preview")
|
|
||||||
return
|
|
||||||
|
|
||||||
# Extract gems
|
|
||||||
print("Extracting gems...")
|
|
||||||
gems = extract_gems(memories)
|
|
||||||
print(f"Extracted {len(gems)} gems")
|
|
||||||
|
|
||||||
# Store
|
|
||||||
success = 0
|
|
||||||
for gem in gems:
|
|
||||||
if store_gem(gem):
|
|
||||||
success += 1
|
|
||||||
print(f" Stored: {gem['text'][:60]}...")
|
|
||||||
|
|
||||||
# Update state
|
|
||||||
state["last_count"] = current
|
|
||||||
state["last_time"] = datetime.now(timezone.utc).isoformat()
|
|
||||||
save_state(state)
|
|
||||||
|
|
||||||
print(f"Done: {success}/{len(gems)} gems stored")
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
|
||||||
main()
|
|
||||||
@@ -1,12 +0,0 @@
|
|||||||
#!/bin/bash
|
|
||||||
# Turn-based curator cron - runs every minute to check if 10 turns reached
|
|
||||||
|
|
||||||
SCRIPT_DIR="/root/.openclaw/workspace/.projects/true-recall-v2/tr-continuous"
|
|
||||||
|
|
||||||
# Check if enough turns accumulated
|
|
||||||
/usr/bin/python3 "${SCRIPT_DIR}/curator_turn_based.py" --threshold 10 --status 2>/dev/null | grep -q "Ready to curate: YES"
|
|
||||||
|
|
||||||
if [ $? -eq 0 ]; then
|
|
||||||
# Run curation
|
|
||||||
/usr/bin/python3 "${SCRIPT_DIR}/curator_turn_based.py" --threshold 10 --execute 2>&1 | logger -t turn-curator
|
|
||||||
fi
|
|
||||||
@@ -1,291 +0,0 @@
|
|||||||
#!/usr/bin/env python3
|
|
||||||
"""
|
|
||||||
Turn-Based Curator: Extract gems every N turns (instead of daily).
|
|
||||||
|
|
||||||
Usage:
|
|
||||||
python3 curator_turn_based.py --threshold 10 --dry-run
|
|
||||||
python3 curator_turn_based.py --threshold 10 --execute
|
|
||||||
python3 curator_turn_based.py --status # Show turn counts
|
|
||||||
|
|
||||||
This tracks turn count since last curation and runs when threshold is reached.
|
|
||||||
"""
|
|
||||||
|
|
||||||
import argparse
|
|
||||||
import json
|
|
||||||
import os
|
|
||||||
import requests
|
|
||||||
import sys
|
|
||||||
from datetime import datetime, timezone, timedelta
|
|
||||||
from pathlib import Path
|
|
||||||
from typing import List, Dict, Any, Optional
|
|
||||||
|
|
||||||
# Config
|
|
||||||
QDRANT_URL = "http://10.0.0.40:6333"
|
|
||||||
MEMORIES_COLLECTION = "memories_tr"
|
|
||||||
GEMS_COLLECTION = "gems_tr"
|
|
||||||
OLLAMA_URL = "http://10.0.0.10:11434"
|
|
||||||
CURATOR_MODEL = "ollama-remote/qwen3:30b-a3b-instruct-2507-q8_0"
|
|
||||||
|
|
||||||
# State file tracks last curation
|
|
||||||
STATE_FILE = Path("/tmp/curator_turn_state.json")
|
|
||||||
|
|
||||||
def get_curator_prompt(conversation_text: str) -> str:
|
|
||||||
"""Generate prompt for gem extraction."""
|
|
||||||
return f"""You are a memory curator. Extract only the most valuable gems (key insights) from this conversation.
|
|
||||||
|
|
||||||
Rules:
|
|
||||||
1. Extract only genuinely important information (decisions, preferences, key facts)
|
|
||||||
2. Skip transient/trivial content (greetings, questions, temporary requests)
|
|
||||||
3. Each gem should be self-contained and useful for future context
|
|
||||||
4. Format: concise, factual statements
|
|
||||||
5. Max 3-5 gems total
|
|
||||||
|
|
||||||
Conversation to curate:
|
|
||||||
---
|
|
||||||
{conversation_text}
|
|
||||||
---
|
|
||||||
|
|
||||||
Return ONLY a JSON array of gems like:
|
|
||||||
[{{"text": "User decided to use X approach for Y", "category": "decision"}}]
|
|
||||||
|
|
||||||
Categories: preference, fact, decision, entity, other
|
|
||||||
|
|
||||||
JSON:"""
|
|
||||||
|
|
||||||
def load_state() -> Dict[str, Any]:
|
|
||||||
"""Load curation state."""
|
|
||||||
if STATE_FILE.exists():
|
|
||||||
try:
|
|
||||||
with open(STATE_FILE) as f:
|
|
||||||
return json.load(f)
|
|
||||||
except:
|
|
||||||
pass
|
|
||||||
return {"last_turn": 0, "last_curation": None}
|
|
||||||
|
|
||||||
def save_state(state: Dict[str, Any]):
|
|
||||||
"""Save curation state."""
|
|
||||||
with open(STATE_FILE, 'w') as f:
|
|
||||||
json.dump(state, f, indent=2)
|
|
||||||
|
|
||||||
def get_point_count_since(last_time: str) -> int:
|
|
||||||
"""Get count of points since last curation time."""
|
|
||||||
try:
|
|
||||||
response = requests.post(
|
|
||||||
f"{QDRANT_URL}/collections/{MEMORIES_COLLECTION}/points/count",
|
|
||||||
json={
|
|
||||||
"filter": {
|
|
||||||
"must": [
|
|
||||||
{
|
|
||||||
"key": "timestamp",
|
|
||||||
"range": {
|
|
||||||
"gt": last_time
|
|
||||||
}
|
|
||||||
}
|
|
||||||
]
|
|
||||||
}
|
|
||||||
},
|
|
||||||
timeout=30
|
|
||||||
)
|
|
||||||
response.raise_for_status()
|
|
||||||
return response.json().get("result", {}).get("count", 0)
|
|
||||||
except Exception as e:
|
|
||||||
print(f"Error getting count: {e}", file=sys.stderr)
|
|
||||||
return 0
|
|
||||||
|
|
||||||
def get_turns_since(last_turn: int, limit: int = 100) -> List[Dict[str, Any]]:
|
|
||||||
"""Get all turns since last curation."""
|
|
||||||
try:
|
|
||||||
response = requests.post(
|
|
||||||
f"{QDRANT_URL}/collections/{MEMORIES_COLLECTION}/points/scroll",
|
|
||||||
json={"limit": limit, "with_payload": True},
|
|
||||||
timeout=30
|
|
||||||
)
|
|
||||||
response.raise_for_status()
|
|
||||||
data = response.json()
|
|
||||||
|
|
||||||
turns = []
|
|
||||||
for point in data.get("result", {}).get("points", []):
|
|
||||||
turn_num = point.get("payload", {}).get("turn", 0)
|
|
||||||
if turn_num > last_turn:
|
|
||||||
turns.append(point)
|
|
||||||
|
|
||||||
# Sort by turn number
|
|
||||||
turns.sort(key=lambda x: x.get("payload", {}).get("turn", 0))
|
|
||||||
return turns
|
|
||||||
except Exception as e:
|
|
||||||
print(f"Error fetching turns: {e}", file=sys.stderr)
|
|
||||||
return []
|
|
||||||
|
|
||||||
def extract_gems_with_llm(conversation_text: str) -> List[Dict[str, str]]:
|
|
||||||
"""Send conversation to LLM for gem extraction."""
|
|
||||||
prompt = get_curator_prompt(conversation_text)
|
|
||||||
|
|
||||||
try:
|
|
||||||
response = requests.post(
|
|
||||||
f"{OLLAMA_URL}/v1/chat/completions",
|
|
||||||
json={
|
|
||||||
"model": CURATOR_MODEL,
|
|
||||||
"messages": [{"role": "user", "content": prompt}],
|
|
||||||
"temperature": 0.3,
|
|
||||||
"max_tokens": 1000
|
|
||||||
},
|
|
||||||
timeout=120
|
|
||||||
)
|
|
||||||
response.raise_for_status()
|
|
||||||
data = response.json()
|
|
||||||
|
|
||||||
content = data.get("choices", [{}])[0].get("message", {}).get("content", "[]")
|
|
||||||
|
|
||||||
# Extract JSON from response
|
|
||||||
try:
|
|
||||||
# Try to find JSON array in response
|
|
||||||
start = content.find('[')
|
|
||||||
end = content.rfind(']')
|
|
||||||
if start != -1 and end != -1:
|
|
||||||
json_str = content[start:end+1]
|
|
||||||
gems = json.loads(json_str)
|
|
||||||
if isinstance(gems, list):
|
|
||||||
return gems
|
|
||||||
except:
|
|
||||||
pass
|
|
||||||
|
|
||||||
return []
|
|
||||||
except Exception as e:
|
|
||||||
print(f"Error calling LLM: {e}", file=sys.stderr)
|
|
||||||
return []
|
|
||||||
|
|
||||||
def store_gem(gem: Dict[str, str]) -> bool:
|
|
||||||
"""Store a single gem to gems_tr."""
|
|
||||||
try:
|
|
||||||
# Get embedding for gem
|
|
||||||
response = requests.post(
|
|
||||||
f"{OLLAMA_URL}/api/embeddings",
|
|
||||||
json={"model": "snowflake-arctic-embed2", "prompt": gem["text"]},
|
|
||||||
timeout=30
|
|
||||||
)
|
|
||||||
response.raise_for_status()
|
|
||||||
vector = response.json().get("embedding", [])
|
|
||||||
|
|
||||||
if not vector:
|
|
||||||
return False
|
|
||||||
|
|
||||||
# Store to gems_tr
|
|
||||||
response = requests.put(
|
|
||||||
f"{QDRANT_URL}/collections/{GEMS_COLLECTION}/points",
|
|
||||||
json={
|
|
||||||
"points": [{
|
|
||||||
"id": hash(gem["text"]) % (2**63),
|
|
||||||
"vector": vector,
|
|
||||||
"payload": {
|
|
||||||
"text": gem["text"],
|
|
||||||
"category": gem.get("category", "other"),
|
|
||||||
"createdAt": datetime.now(timezone.utc).isoformat(),
|
|
||||||
"source": "turn_based_curator"
|
|
||||||
}
|
|
||||||
}]
|
|
||||||
},
|
|
||||||
timeout=30
|
|
||||||
)
|
|
||||||
response.raise_for_status()
|
|
||||||
return True
|
|
||||||
except Exception as e:
|
|
||||||
print(f"Error storing gem: {e}", file=sys.stderr)
|
|
||||||
return False
|
|
||||||
|
|
||||||
def main():
|
|
||||||
parser = argparse.ArgumentParser(description="Turn-based curator")
|
|
||||||
parser.add_argument("--threshold", "-t", type=int, default=10,
|
|
||||||
help="Run curation every N turns (default: 10)")
|
|
||||||
parser.add_argument("--execute", "-e", action="store_true",
|
|
||||||
help="Execute curation")
|
|
||||||
parser.add_argument("--dry-run", "-n", action="store_true",
|
|
||||||
help="Preview what would be curated")
|
|
||||||
parser.add_argument("--status", "-s", action="store_true",
|
|
||||||
help="Show current turn status")
|
|
||||||
|
|
||||||
args = parser.parse_args()
|
|
||||||
|
|
||||||
# Load state
|
|
||||||
state = load_state()
|
|
||||||
current_turn = get_current_turn_count()
|
|
||||||
turns_since = current_turn - state["last_turn"]
|
|
||||||
|
|
||||||
if args.status:
|
|
||||||
print(f"Current turn: {current_turn}")
|
|
||||||
print(f"Last curation: {state['last_turn']}")
|
|
||||||
print(f"Turns since last curation: {turns_since}")
|
|
||||||
print(f"Threshold: {args.threshold}")
|
|
||||||
print(f"Ready to curate: {'YES' if turns_since >= args.threshold else 'NO'}")
|
|
||||||
return
|
|
||||||
|
|
||||||
print(f"Turn-based Curator")
|
|
||||||
print(f"Current turn: {current_turn}")
|
|
||||||
print(f"Last curation: {state['last_turn']}")
|
|
||||||
print(f"Turns since: {turns_since}")
|
|
||||||
print(f"Threshold: {args.threshold}")
|
|
||||||
print()
|
|
||||||
|
|
||||||
if turns_since < args.threshold:
|
|
||||||
print(f"Not enough turns. Need {args.threshold}, have {turns_since}")
|
|
||||||
return
|
|
||||||
|
|
||||||
# Get turns to process
|
|
||||||
print(f"Fetching {turns_since} turns...")
|
|
||||||
turns = get_turns_since(state["last_turn"], limit=turns_since + 10)
|
|
||||||
|
|
||||||
if not turns:
|
|
||||||
print("No new turns found")
|
|
||||||
return
|
|
||||||
|
|
||||||
# Build conversation text
|
|
||||||
conversation_parts = []
|
|
||||||
for turn in turns:
|
|
||||||
role = turn.get("payload", {}).get("role", "unknown")
|
|
||||||
content = turn.get("payload", {}).get("content", "")
|
|
||||||
conversation_parts.append(f"{role.upper()}: {content}")
|
|
||||||
|
|
||||||
conversation_text = "\n\n".join(conversation_parts)
|
|
||||||
|
|
||||||
print(f"Processing {len(turns)} turns ({len(conversation_text)} chars)")
|
|
||||||
print()
|
|
||||||
|
|
||||||
if args.dry_run:
|
|
||||||
print("=== CONVERSATION TEXT ===")
|
|
||||||
print(conversation_text[:500] + "..." if len(conversation_text) > 500 else conversation_text)
|
|
||||||
print()
|
|
||||||
print("[DRY RUN] Would extract gems and store to gems_tr")
|
|
||||||
return
|
|
||||||
|
|
||||||
if not args.execute:
|
|
||||||
print("Use --execute to run curation or --dry-run to preview")
|
|
||||||
return
|
|
||||||
|
|
||||||
# Extract gems
|
|
||||||
print("Extracting gems with LLM...")
|
|
||||||
gems = extract_gems_with_llm(conversation_text)
|
|
||||||
|
|
||||||
if not gems:
|
|
||||||
print("No gems extracted")
|
|
||||||
return
|
|
||||||
|
|
||||||
print(f"Extracted {len(gems)} gems:")
|
|
||||||
for i, gem in enumerate(gems, 1):
|
|
||||||
print(f" {i}. [{gem.get('category', 'other')}] {gem['text'][:80]}...")
|
|
||||||
print()
|
|
||||||
|
|
||||||
# Store gems
|
|
||||||
print("Storing gems...")
|
|
||||||
success = 0
|
|
||||||
for gem in gems:
|
|
||||||
if store_gem(gem):
|
|
||||||
success += 1
|
|
||||||
|
|
||||||
# Update state
|
|
||||||
state["last_turn"] = current_turn
|
|
||||||
state["last_curation"] = datetime.now(timezone.utc).isoformat()
|
|
||||||
save_state(state)
|
|
||||||
|
|
||||||
print(f"Done! Stored {success}/{len(gems)} gems")
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
|
||||||
main()
|
|
||||||
@@ -1,85 +0,0 @@
|
|||||||
#!/usr/bin/env python3
|
|
||||||
"""
|
|
||||||
Migration: Add 'curated: false' to existing memories_tr entries.
|
|
||||||
|
|
||||||
Run once to update all existing memories for the new timer curator.
|
|
||||||
Uses POST /collections/{name}/points/payload with {"points": [ids], "payload": {...}}
|
|
||||||
"""
|
|
||||||
|
|
||||||
import requests
|
|
||||||
import time
|
|
||||||
import sys
|
|
||||||
|
|
||||||
QDRANT_URL = "http://10.0.0.40:6333"
|
|
||||||
COLLECTION = "memories_tr"
|
|
||||||
|
|
||||||
def update_existing_memories():
|
|
||||||
"""Add curated=false to all memories that don't have the field."""
|
|
||||||
print("🔧 Migrating existing memories...")
|
|
||||||
|
|
||||||
offset = None
|
|
||||||
updated = 0
|
|
||||||
batch_size = 100
|
|
||||||
max_iterations = 200
|
|
||||||
iterations = 0
|
|
||||||
|
|
||||||
while iterations < max_iterations:
|
|
||||||
iterations += 1
|
|
||||||
|
|
||||||
scroll_data = {
|
|
||||||
"limit": batch_size,
|
|
||||||
"with_payload": True
|
|
||||||
}
|
|
||||||
if offset:
|
|
||||||
scroll_data["offset"] = offset
|
|
||||||
|
|
||||||
try:
|
|
||||||
response = requests.post(
|
|
||||||
f"{QDRANT_URL}/collections/{COLLECTION}/points/scroll",
|
|
||||||
json=scroll_data,
|
|
||||||
headers={"Content-Type": "application/json"},
|
|
||||||
timeout=30
|
|
||||||
)
|
|
||||||
response.raise_for_status()
|
|
||||||
result = response.json()
|
|
||||||
points = result.get("result", {}).get("points", [])
|
|
||||||
|
|
||||||
if not points:
|
|
||||||
break
|
|
||||||
|
|
||||||
# Collect IDs that need curated=false
|
|
||||||
ids_to_update = []
|
|
||||||
for point in points:
|
|
||||||
payload = point.get("payload", {})
|
|
||||||
if "curated" not in payload:
|
|
||||||
ids_to_update.append(point["id"])
|
|
||||||
|
|
||||||
if ids_to_update:
|
|
||||||
# POST /points/payload with {"points": [ids], "payload": {...}}
|
|
||||||
update_response = requests.post(
|
|
||||||
f"{QDRANT_URL}/collections/{COLLECTION}/points/payload",
|
|
||||||
json={
|
|
||||||
"points": ids_to_update,
|
|
||||||
"payload": {"curated": False}
|
|
||||||
},
|
|
||||||
timeout=30
|
|
||||||
)
|
|
||||||
update_response.raise_for_status()
|
|
||||||
updated += len(ids_to_update)
|
|
||||||
print(f" Updated batch: {len(ids_to_update)} memories (total: {updated})")
|
|
||||||
time.sleep(0.05)
|
|
||||||
|
|
||||||
offset = result.get("result", {}).get("next_page_offset")
|
|
||||||
if not offset:
|
|
||||||
break
|
|
||||||
|
|
||||||
except Exception as e:
|
|
||||||
print(f"Error: {e}", file=sys.stderr)
|
|
||||||
import traceback
|
|
||||||
traceback.print_exc()
|
|
||||||
break
|
|
||||||
|
|
||||||
print(f"✅ Migration complete: {updated} memories updated with curated=false")
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
|
||||||
update_existing_memories()
|
|
||||||
@@ -1,14 +0,0 @@
|
|||||||
[Unit]
|
|
||||||
Description=TrueRecall Turn-Based Curator (every 10 turns)
|
|
||||||
After=network.target mem-qdrant-watcher.service
|
|
||||||
|
|
||||||
[Service]
|
|
||||||
Type=simple
|
|
||||||
User=root
|
|
||||||
WorkingDirectory=/root/.openclaw/workspace/.projects/true-recall-v2/tr-continuous
|
|
||||||
ExecStart=/usr/bin/python3 /root/.openclaw/workspace/.projects/true-recall-v2/tr-continuous/curator_turn_based.py --threshold 10 --execute
|
|
||||||
Restart=on-failure
|
|
||||||
RestartSec=60
|
|
||||||
|
|
||||||
[Install]
|
|
||||||
WantedBy=multi-user.target
|
|
||||||
Binary file not shown.
@@ -1,358 +0,0 @@
|
|||||||
#!/usr/bin/env python3
|
|
||||||
"""
|
|
||||||
True-Recall v2 Curator: Reads from Qdrant kimi_memories
|
|
||||||
|
|
||||||
Reads 24 hours of conversation from Qdrant kimi_memories collection,
|
|
||||||
extracts contextual gems using qwen3, stores to Qdrant gems_tr with mxbai embeddings.
|
|
||||||
|
|
||||||
Usage:
|
|
||||||
python curate_from_qdrant.py --user-id rob
|
|
||||||
python curate_from_qdrant.py --user-id rob --date 2026-02-23
|
|
||||||
"""
|
|
||||||
|
|
||||||
import json
|
|
||||||
import argparse
|
|
||||||
import requests
|
|
||||||
import urllib.request
|
|
||||||
from datetime import datetime, timedelta
|
|
||||||
from pathlib import Path
|
|
||||||
from typing import List, Dict, Any, Optional
|
|
||||||
import hashlib
|
|
||||||
|
|
||||||
# Configuration
|
|
||||||
QDRANT_URL = "http://10.0.0.40:6333"
|
|
||||||
SOURCE_COLLECTION = "memories_tr"
|
|
||||||
TARGET_COLLECTION = "gems_tr"
|
|
||||||
|
|
||||||
OLLAMA_URL = "http://10.0.0.10:11434"
|
|
||||||
EMBEDDING_MODEL = "mxbai-embed-large"
|
|
||||||
CURATION_MODEL = "qwen3:4b-instruct"
|
|
||||||
|
|
||||||
# Load curator prompt
|
|
||||||
CURATOR_PROMPT_PATH = "/root/.openclaw/workspace/.projects/true-recall/curator-prompt.md"
|
|
||||||
|
|
||||||
|
|
||||||
def load_curator_prompt() -> str:
|
|
||||||
"""Load the curator system prompt."""
|
|
||||||
try:
|
|
||||||
with open(CURATOR_PROMPT_PATH, 'r') as f:
|
|
||||||
return f.read()
|
|
||||||
except FileNotFoundError:
|
|
||||||
# Fallback to v2 location
|
|
||||||
CURATOR_PROMPT_PATH_V2 = "/root/.openclaw/workspace/.projects/true-recall-v2/curator-prompt.md"
|
|
||||||
with open(CURATOR_PROMPT_PATH_V2, 'r') as f:
|
|
||||||
return f.read()
|
|
||||||
|
|
||||||
|
|
||||||
def get_turns_from_qdrant(user_id: str, date_str: str) -> List[Dict[str, Any]]:
|
|
||||||
"""
|
|
||||||
Get all conversation turns from Qdrant for a specific user and date.
|
|
||||||
|
|
||||||
Returns turns sorted by conversation_id and turn_number.
|
|
||||||
"""
|
|
||||||
# Build filter for user_id and date
|
|
||||||
filter_data = {
|
|
||||||
"must": [
|
|
||||||
{"key": "user_id", "match": {"value": user_id}},
|
|
||||||
{"key": "date", "match": {"value": date_str}}
|
|
||||||
]
|
|
||||||
}
|
|
||||||
|
|
||||||
# Use scroll API to get all matching points
|
|
||||||
all_points = []
|
|
||||||
offset = None
|
|
||||||
max_iterations = 100 # Safety limit
|
|
||||||
iterations = 0
|
|
||||||
|
|
||||||
while iterations < max_iterations:
|
|
||||||
iterations += 1
|
|
||||||
scroll_data = {
|
|
||||||
"limit": 100,
|
|
||||||
"with_payload": True,
|
|
||||||
"filter": filter_data
|
|
||||||
}
|
|
||||||
|
|
||||||
if offset:
|
|
||||||
scroll_data["offset"] = offset
|
|
||||||
|
|
||||||
req = urllib.request.Request(
|
|
||||||
f"{QDRANT_URL}/collections/{SOURCE_COLLECTION}/points/scroll",
|
|
||||||
data=json.dumps(scroll_data).encode(),
|
|
||||||
headers={"Content-Type": "application/json"},
|
|
||||||
method="POST"
|
|
||||||
)
|
|
||||||
|
|
||||||
try:
|
|
||||||
with urllib.request.urlopen(req, timeout=30) as response:
|
|
||||||
result = json.loads(response.read().decode())
|
|
||||||
points = result.get("result", {}).get("points", [])
|
|
||||||
|
|
||||||
if not points:
|
|
||||||
break
|
|
||||||
|
|
||||||
all_points.extend(points)
|
|
||||||
|
|
||||||
# Check if there's more
|
|
||||||
offset = result.get("result", {}).get("next_page_offset")
|
|
||||||
if not offset:
|
|
||||||
break
|
|
||||||
except urllib.error.HTTPError as e:
|
|
||||||
if e.code == 404:
|
|
||||||
print(f"⚠️ Collection {SOURCE_COLLECTION} not found")
|
|
||||||
return []
|
|
||||||
raise
|
|
||||||
|
|
||||||
# Convert points to turn format (harvested summaries)
|
|
||||||
turns = []
|
|
||||||
for point in all_points:
|
|
||||||
payload = point.get("payload", {})
|
|
||||||
|
|
||||||
# Extract user and AI messages
|
|
||||||
user_msg = payload.get("user_message", "")
|
|
||||||
ai_msg = payload.get("ai_response", "")
|
|
||||||
|
|
||||||
# Get timestamp from created_at
|
|
||||||
created_at = payload.get("created_at", "")
|
|
||||||
|
|
||||||
turn = {
|
|
||||||
"turn": payload.get("turn_number", 0),
|
|
||||||
"user_id": payload.get("user_id", user_id),
|
|
||||||
"user": user_msg,
|
|
||||||
"ai": ai_msg,
|
|
||||||
"conversation_id": payload.get("conversation_id", ""),
|
|
||||||
"session_id": payload.get("session_id", ""),
|
|
||||||
"timestamp": created_at,
|
|
||||||
"date": payload.get("date", date_str),
|
|
||||||
"content_hash": payload.get("content_hash", "")
|
|
||||||
}
|
|
||||||
|
|
||||||
# Skip if no content
|
|
||||||
if turn["user"] or turn["ai"]:
|
|
||||||
turns.append(turn)
|
|
||||||
|
|
||||||
# Sort by conversation_id, then by turn number
|
|
||||||
turns.sort(key=lambda x: (x.get("conversation_id", ""), x.get("turn", 0)))
|
|
||||||
|
|
||||||
return turns
|
|
||||||
|
|
||||||
|
|
||||||
def extract_gems_with_curator(turns: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
|
|
||||||
"""Use qwen3 to extract gems from conversation turns."""
|
|
||||||
if not turns:
|
|
||||||
return []
|
|
||||||
|
|
||||||
prompt = load_curator_prompt()
|
|
||||||
|
|
||||||
# Build the conversation input
|
|
||||||
conversation_json = json.dumps(turns, indent=2)
|
|
||||||
|
|
||||||
# Call Ollama with native system prompt
|
|
||||||
response = requests.post(
|
|
||||||
f"{OLLAMA_URL}/api/generate",
|
|
||||||
json={
|
|
||||||
"model": CURATION_MODEL,
|
|
||||||
"system": prompt,
|
|
||||||
"prompt": f"## Input Conversation\n\n```json\n{conversation_json}\n```\n\n## Output\n",
|
|
||||||
"stream": False,
|
|
||||||
"options": {
|
|
||||||
"temperature": 0.1,
|
|
||||||
"num_predict": 4000
|
|
||||||
}
|
|
||||||
}
|
|
||||||
)
|
|
||||||
|
|
||||||
if response.status_code != 200:
|
|
||||||
raise RuntimeError(f"Curation failed: {response.text}")
|
|
||||||
|
|
||||||
result = response.json()
|
|
||||||
output = result.get('response', '').strip()
|
|
||||||
|
|
||||||
# Extract JSON from output (handle markdown code blocks)
|
|
||||||
if '```json' in output:
|
|
||||||
output = output.split('```json')[1].split('```')[0].strip()
|
|
||||||
elif '```' in output:
|
|
||||||
output = output.split('```')[1].split('```')[0].strip()
|
|
||||||
|
|
||||||
try:
|
|
||||||
# Extract JSON array - find first [ and last ]
|
|
||||||
start_idx = output.find('[')
|
|
||||||
end_idx = output.rfind(']')
|
|
||||||
if start_idx != -1 and end_idx != -1 and end_idx > start_idx:
|
|
||||||
output = output[start_idx:end_idx+1]
|
|
||||||
|
|
||||||
gems = json.loads(output)
|
|
||||||
if not isinstance(gems, list):
|
|
||||||
print(f"Warning: Curator returned non-list, wrapping: {type(gems)}")
|
|
||||||
gems = [gems] if gems else []
|
|
||||||
return gems
|
|
||||||
except json.JSONDecodeError as e:
|
|
||||||
print(f"Error parsing curator output: {e}")
|
|
||||||
print(f"Raw output: {output[:500]}...")
|
|
||||||
return []
|
|
||||||
|
|
||||||
|
|
||||||
def get_embedding(text: str) -> List[float]:
    """Get embedding vector from Ollama using mxbai-embed-large.

    Args:
        text: The text to embed.

    Returns:
        The embedding vector as a list of floats.

    Raises:
        RuntimeError: if the embeddings endpoint returns a non-200 status.
    """
    # Timeout guards against an unresponsive Ollama instance hanging the run.
    response = requests.post(
        f"{OLLAMA_URL}/api/embeddings",
        json={
            "model": EMBEDDING_MODEL,
            "prompt": text
        },
        timeout=120,
    )

    if response.status_code != 200:
        raise RuntimeError(f"Embedding failed: {response.text}")

    return response.json()['embedding']
|
|
||||||
|
|
||||||
def get_gem_id(gem: Dict[str, Any], user_id: str) -> int:
    """Derive a stable 63-bit integer ID for a gem.

    The ID is a SHA-256 of "user_id:conversation_id:turn_range", truncated
    to 8 bytes, so the same gem always maps to the same Qdrant point.
    """
    key = f"{user_id}:{gem.get('conversation_id', '')}:{gem.get('turn_range', '')}"
    digest = hashlib.sha256(key.encode()).digest()
    return int.from_bytes(digest[:8], byteorder='big') % (2**63)
|
|
||||||
|
|
||||||
def check_duplicate(gem: Dict[str, Any], user_id: str) -> bool:
    """Check if a similar gem already exists in gems_tr.

    Looks up the gem's deterministic point ID in the target collection and
    returns True when the point is already stored, False on a 404.
    """
    point_id = get_gem_id(gem, user_id)

    lookup = urllib.request.Request(
        f"{QDRANT_URL}/collections/{TARGET_COLLECTION}/points/{point_id}",
        headers={"Content-Type": "application/json"},
        method="GET",
    )
    try:
        with urllib.request.urlopen(lookup, timeout=10):
            return True  # point exists already
    except urllib.error.HTTPError as err:
        if err.code == 404:
            return False  # no such point yet
        raise
|
|
||||||
|
|
||||||
def store_gem_to_qdrant(gem: Dict[str, Any], user_id: str) -> bool:
    """Store a gem to Qdrant with embedding.

    Args:
        gem: Gem dict produced by the curator.
        user_id: Owner of the gem; stored in the payload and mixed into the ID.

    Returns:
        True on a 200 response from Qdrant, False otherwise.
    """
    # Create embedding from gem text (the searchable fields concatenated).
    embedding_text = f"{gem.get('gem', '')} {gem.get('context', '')} {gem.get('snippet', '')}"
    vector = get_embedding(embedding_text)

    # Prepare payload: every gem field plus the owning user.
    payload = {
        "user_id": user_id,
        **gem
    }

    # Generate deterministic integer ID (same gem -> same point, so re-runs
    # upsert rather than duplicate).
    gem_id = get_gem_id(gem, user_id)

    # Store to Qdrant; timeout prevents an unresponsive server from hanging us.
    response = requests.put(
        f"{QDRANT_URL}/collections/{TARGET_COLLECTION}/points",
        json={
            "points": [{
                "id": gem_id,
                "vector": vector,
                "payload": payload
            }]
        },
        timeout=30,
    )

    return response.status_code == 200
|
|
||||||
|
|
||||||
def main() -> None:
    """CLI entry point: fetch a day's turns, curate gems, and store them.

    Flow: parse args -> pick date (defaults to yesterday) -> pull turns
    from Qdrant -> run the curator model -> preview gems -> dedupe and
    store each gem (skipped entirely under --dry-run).
    """
    parser = argparse.ArgumentParser(description="True-Recall Curator v2 - Reads from Qdrant")
    parser.add_argument("--user-id", required=True, help="User ID to process")
    parser.add_argument("--date", help="Specific date to process (YYYY-MM-DD), defaults to yesterday")
    parser.add_argument("--dry-run", action="store_true", help="Don't store, just preview")
    args = parser.parse_args()

    # Determine date (yesterday by default)
    if args.date:
        date_str = args.date
    else:
        yesterday = datetime.now() - timedelta(days=1)
        date_str = yesterday.strftime("%Y-%m-%d")

    print(f"🔍 True-Recall Curator v2 for {args.user_id}")
    print(f"📅 Processing date: {date_str}")
    print(f"🧠 Embedding model: {EMBEDDING_MODEL}")
    print(f"💎 Target collection: {TARGET_COLLECTION}")
    print()

    # Get turns from Qdrant
    print(f"📥 Fetching conversation turns from {SOURCE_COLLECTION}...")
    turns = get_turns_from_qdrant(args.user_id, date_str)
    print(f"✅ Found {len(turns)} turns")

    if not turns:
        print("⚠️ No turns to process. Exiting.")
        return

    # Show sample (first three turns, truncated to 60 chars each side)
    print("\n📄 Sample turns:")
    for i, turn in enumerate(turns[:3], 1):
        user_msg = turn.get("user", "")[:60]
        ai_msg = turn.get("ai", "")[:60]
        print(f" Turn {turn.get('turn')}: User: {user_msg}...")
        print(f" AI: {ai_msg}...")
    if len(turns) > 3:
        print(f" ... and {len(turns) - 3} more")

    # Extract gems
    print("\n🧠 Extracting gems with The Curator (qwen3)...")
    gems = extract_gems_with_curator(turns)
    print(f"✅ Extracted {len(gems)} gems")

    if not gems:
        print("⚠️ No gems extracted. Exiting.")
        return

    # Preview gems (first three, truncated)
    print("\n💎 Preview of extracted gems:")
    for i, gem in enumerate(gems[:3], 1):
        print(f"\n--- Gem {i} ---")
        print(f"Gem: {gem.get('gem', 'N/A')[:100]}...")
        print(f"Categories: {gem.get('categories', [])}")
        print(f"Importance: {gem.get('importance', 'N/A')}")
        print(f"Confidence: {gem.get('confidence', 'N/A')}")

    if len(gems) > 3:
        print(f"\n... and {len(gems) - 3} more gems")

    if args.dry_run:
        print("\n🏃 DRY RUN: Not storing gems.")
        return

    # Check for duplicates and store; tally outcomes for the summary below.
    print("\n💾 Storing gems to Qdrant...")
    stored = 0
    skipped = 0
    failed = 0

    for gem in gems:
        # Check for duplicates (deterministic-ID lookup in Qdrant)
        if check_duplicate(gem, args.user_id):
            print(f" ⏭️ Skipping duplicate: {gem.get('gem', 'N/A')[:50]}...")
            skipped += 1
            continue

        if store_gem_to_qdrant(gem, args.user_id):
            stored += 1
        else:
            print(f" ⚠️ Failed to store gem: {gem.get('gem', 'N/A')[:50]}...")
            failed += 1

    print(f"\n✅ Stored: {stored}")
    print(f"⏭️ Skipped (duplicates): {skipped}")
    print(f"❌ Failed: {failed}")

    print("\n🎉 Curation complete!")
|
|
||||||
|
|
||||||
# Script entry point: run the curator CLI when executed directly.
if __name__ == "__main__":
    main()
|
|
||||||
Reference in New Issue
Block a user