# tr-continuous/curator_timer.py

#!/usr/bin/env python3
"""
TrueRecall v2 - Timer Curator
Runs every 5 minutes via cron
Extracts gems from uncurated memories and stores them in gems_tr

REQUIRES: TrueRecall v1 (provides memories_tr via watcher)
"""

import sys
import json
import hashlib
import requests
from datetime import datetime, timezone
from typing import List, Dict, Any, Optional

# Configuration - EDIT THESE for your environment.
# Values in angle brackets are placeholders and must be replaced before use.

# Base URL of the Qdrant REST API; "/collections/..." paths are appended to it.
QDRANT_URL = "http://<QDRANT_IP>:6333"
# Base URL of the Ollama server; used for "/api/generate" and "/api/embeddings".
OLLAMA_URL = "http://<OLLAMA_IP>:11434"
# Collection the uncurated memories are read from (and later flagged in).
SOURCE_COLLECTION = "memories_tr"
# Collection the extracted gems are written to.
TARGET_COLLECTION = "gems_tr"
# Ollama model name sent with every embedding request.
EMBEDDING_MODEL = "snowflake-arctic-embed2"
# Upper bound on the number of memories fetched per run (scroll "limit").
MAX_BATCH = 100
# User whose memories are curated; also written into each stored gem's payload.
USER_ID = "<USER_ID>"


def get_uncurated_memories(qdrant_url: str, collection: str, user_id: str, max_batch: int = 100) -> List[Dict[str, Any]]:
    """Return up to ``max_batch`` points of ``user_id`` whose ``curated`` flag is false.

    A single scroll request is issued against ``collection`` with payloads
    included. Any failure (network, HTTP status, unexpected body) is reported
    on stderr and results in an empty list.
    """
    scroll_endpoint = f"{qdrant_url}/collections/{collection}/points/scroll"
    pending_for_user = {
        "must": [
            {"key": "user_id", "match": {"value": user_id}},
            {"key": "curated", "match": {"value": False}},
        ]
    }
    scroll_request = {
        "limit": max_batch,
        "filter": pending_for_user,
        "with_payload": True,
    }

    try:
        reply = requests.post(scroll_endpoint, json=scroll_request, timeout=30)
        reply.raise_for_status()
        body = reply.json()
        return body.get("result", {}).get("points", [])
    except Exception as err:
        print(f"Error fetching memories: {err}", file=sys.stderr)
        return []


def _collect_conversation_lines(memories: List[Dict[str, Any]]) -> List[str]:
    """Render the memories worth curating as numbered ``[n] text`` lines."""
    skip_patterns = (
        "gems extracted", "curator", "curation complete",
        "system is running", "validation round",
    )

    lines = []
    for position, mem in enumerate(memories, start=1):
        # A point can carry a null payload; treat that like an empty one
        # instead of crashing on ``None.get``.
        payload = mem.get("payload") or {}
        if not isinstance(payload, dict):
            continue

        text = payload.get("text", "") or payload.get("content", "")
        if not text:
            continue
        text = str(text)

        # Only non-assistant messages are mined for facts.
        if payload.get("role", "") == "assistant":
            continue
        if len(text) < 20:
            continue

        # Drop messages that mention the curation process itself.
        lowered = text.lower()
        if any(pattern in lowered for pattern in skip_patterns):
            continue

        # Cap each memory at 500 characters; the number is the memory's
        # 1-based position in the original batch, skipped entries included.
        lines.append(f"[{position}] {text[:500]}")
    return lines


def _parse_gem_array(response_text: Any) -> List[Dict[str, Any]]:
    """Pull the outermost JSON array out of the model reply, keeping only objects."""
    if not isinstance(response_text, str):
        return []

    start = response_text.find('[')
    end = response_text.rfind(']')
    if start == -1 or end < start:
        return []

    try:
        parsed = json.loads(response_text[start:end + 1])
    except json.JSONDecodeError as e:
        print(f"JSON parse error: {e}", file=sys.stderr)
        return []

    if not isinstance(parsed, list):
        return []
    # The model may emit stray strings/numbers inside the array; callers
    # use ``gem.get(...)`` and therefore need dicts only.
    return [gem for gem in parsed if isinstance(gem, dict)]


def extract_gems(memories: List[Dict[str, Any]], ollama_url: str, model: str = "<CURATOR_MODEL>") -> List[Dict[str, Any]]:
    """Send memories to the LLM and return the extracted gems.

    Args:
        memories: Points as returned by the Qdrant scroll call; each is read
            through its ``payload`` (``text`` or ``content``, and ``role``).
        ollama_url: Base URL of the Ollama server.
        model: Name of the Ollama model used for curation. The default is a
            placeholder that must be replaced for a real deployment.

    Returns:
        A list of gem dicts parsed from the model reply. An empty list is
        returned when nothing qualifies for curation, when the request
        fails, or when the reply holds no parseable JSON array; failures are
        reported on stderr rather than raised.
    """
    if not memories:
        return []

    conversation_lines = _collect_conversation_lines(memories)
    if not conversation_lines:
        return []

    conversation_text = "\n\n".join(conversation_lines)

    prompt = """You are a memory curator. Extract atomic facts from the conversation below.

For each distinct fact/decision/preference, output a JSON object with:
- "text": the atomic fact (1-2 sentences) - use FIRST PERSON ("I" not "User")
- "category": one of [decision, preference, technical, project, knowledge, system]
- "importance": "high" or "medium"

Return ONLY a JSON array. Example:
[
  {"text": "I decided to use Redis for caching", "category": "decision", "importance": "high"},
  {"text": "I prefer dark mode", "category": "preference", "importance": "medium"}
]

If no extractable facts, return [].

CONVERSATION:
"""

    full_prompt = f"{prompt}{conversation_text}\n\nJSON:"

    try:
        response = requests.post(
            f"{ollama_url}/api/generate",
            json={
                "model": model,
                # The instructions are sent both as the system message and
                # at the head of the prompt.
                "system": prompt,
                "prompt": full_prompt,
                "stream": False,
                "options": {
                    "temperature": 0.1,
                    "num_predict": 4000
                }
            },
            timeout=120
        )
        response.raise_for_status()
        # Decode inside the guard: a non-JSON body must not escape as an
        # uncaught exception.
        result = response.json()
    except Exception as e:
        print(f"Error calling Ollama: {e}", file=sys.stderr)
        return []

    if not isinstance(result, dict):
        return []
    return _parse_gem_array(result.get("response", ""))


def get_embedding(text: str, ollama_url: str) -> Optional[List[float]]:
    """Ask Ollama for the embedding of ``text`` using ``EMBEDDING_MODEL``.

    Returns the ``embedding`` field of the reply, or ``None`` when the
    request fails (the error is printed to stderr).
    """
    try:
        embed_request = {"model": EMBEDDING_MODEL, "prompt": text}
        reply = requests.post(
            f"{ollama_url}/api/embeddings",
            json=embed_request,
            timeout=30,
        )
        reply.raise_for_status()
        return reply.json().get("embedding")
    except Exception as err:
        print(f"Error getting embedding: {err}", file=sys.stderr)
        return None


def store_gem(gem: Dict[str, Any], vector: List[float], qdrant_url: str, target_collection: str, user_id: str) -> bool:
    """Write one gem, with its vector, into ``target_collection``.

    The point id is derived from ``user_id`` and the first 100 characters of
    the gem text, so the same text for the same user always maps to the same
    id. Returns ``True`` on success; on any request failure the error is
    printed to stderr and ``False`` is returned.
    """
    gem_text = gem.get("text", "") or gem.get("gem", "")

    # First 8 bytes of the SHA-256 digest, folded into the range [0, 2**63).
    digest = hashlib.sha256(f"{user_id}:{gem_text[:100]}".encode()).digest()
    point_id = int.from_bytes(digest[:8], byteorder='big') % (2**63)

    point = {
        "id": point_id,
        "vector": vector,
        "payload": {
            "text": gem_text,
            "category": gem.get("category", "fact"),
            "importance": gem.get("importance", "medium"),
            "user_id": user_id,
            "created_at": datetime.now(timezone.utc).isoformat(),
        },
    }

    try:
        reply = requests.put(
            f"{qdrant_url}/collections/{target_collection}/points",
            json={"points": [point]},
            timeout=30,
        )
        reply.raise_for_status()
    except Exception as err:
        print(f"Error storing gem: {err}", file=sys.stderr)
        return False
    return True


def mark_curated(memory_ids: List, qdrant_url: str, collection: str) -> bool:
    """Set ``curated`` to true and stamp ``curated_at`` on the given points.

    An empty id list is a no-op that counts as success. Returns ``False``
    (after printing the error to stderr) when the request fails.
    """
    if memory_ids:
        try:
            payload_update = {
                "points": memory_ids,
                "payload": {
                    "curated": True,
                    "curated_at": datetime.now(timezone.utc).isoformat(),
                },
            }
            reply = requests.post(
                f"{qdrant_url}/collections/{collection}/points/payload",
                json=payload_update,
                timeout=30,
            )
            reply.raise_for_status()
        except Exception as err:
            print(f"Error marking curated: {err}", file=sys.stderr)
            return False
    return True


def main():
    """Run one curation pass over the configured collections.

    Steps: fetch up to ``MAX_BATCH`` uncurated memories, ask the LLM for
    gems, embed and store each gem, then flag the fetched memories as
    curated.

    The batch is left unflagged (and is therefore fetched again on the next
    run) when no gems were extracted, or when gems were extracted but none
    of them could be embedded/stored.

    NOTE(review): ``extract_gems`` returns an empty list both on failure and
    when there is genuinely nothing to extract, so a batch that never yields
    gems is re-fetched on every run - confirm whether that is intended.
    """
    print("TrueRecall v2 - Timer Curator")
    print(f"User: {USER_ID}")
    print(f"Source: {SOURCE_COLLECTION}")
    print(f"Target: {TARGET_COLLECTION}")
    print(f"Max batch: {MAX_BATCH}\n")

    print("Fetching uncurated memories...")
    memories = get_uncurated_memories(QDRANT_URL, SOURCE_COLLECTION, USER_ID, MAX_BATCH)
    print(f"Found {len(memories)} uncurated memories\n")

    if not memories:
        print("Nothing to curate. Exiting.")
        return

    print("Sending memories to curator...")
    # Everything below reads gems through ``.get``; discard anything in the
    # LLM output that is not a JSON object.
    gems = [gem for gem in extract_gems(memories, OLLAMA_URL) if isinstance(gem, dict)]
    print(f"Extracted {len(gems)} gems\n")

    if not gems:
        print("No gems extracted. Exiting.")
        return

    print("Gems preview:")
    for i, gem in enumerate(gems[:3], 1):
        # Same text/gem fallback as the storing loop; str() guards against a
        # non-string value, which cannot be sliced reliably.
        text = str(gem.get("text") or gem.get("gem") or "N/A")[:50]
        print(f"  {i}. {text}...")
    if len(gems) > 3:
        print(f"  ... and {len(gems) - 3} more")
    print()

    print("Storing gems...")
    stored = 0
    attempted = 0
    for gem in gems:
        text = gem.get("text", "") or gem.get("gem", "")
        if not text:
            continue
        attempted += 1

        vector = get_embedding(text, OLLAMA_URL)
        if vector and store_gem(gem, vector, QDRANT_URL, TARGET_COLLECTION, USER_ID):
            stored += 1

    print(f"Stored: {stored}/{len(gems)}\n")

    if attempted and not stored:
        # Every embed/store attempt failed. Flagging the memories now would
        # lose them, so keep them uncurated and let the next run retry.
        print("No gems could be stored; leaving memories uncurated for retry\n", file=sys.stderr)
        return

    print("Marking memories as curated...")
    # Compare against None: a point id of 0 is valid but falsy.
    memory_ids = [mem.get("id") for mem in memories if mem.get("id") is not None]
    if mark_curated(memory_ids, QDRANT_URL, SOURCE_COLLECTION):
        print(f"Marked {len(memory_ids)} memories as curated\n")
    else:
        print("Failed to mark memories\n")

    print("Curation complete!")


# Script entry point: run a single curation pass when executed directly.
if __name__ == "__main__":
    main()
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`#!/usr/bin/env python3`
			`"""`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`TrueRecall v2 - Timer Curator`
			`Runs every 5 minutes via cron`
			`Extracts gems from uncurated memories and stores them in gems_tr`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`REQUIRES: TrueRecall v1 (provides memories_tr via watcher)`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`"""`

			`import sys`
			`import json`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`import hashlib`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`import requests`
			`from datetime import datetime, timezone`
			`from typing import List, Dict, Any, Optional`

docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`# Configuration - EDIT THESE for your environment`
			`QDRANT_URL = "http://<QDRANT_IP>:6333"`
			`OLLAMA_URL = "http://<OLLAMA_IP>:11434"`
			`SOURCE_COLLECTION = "memories_tr"`
			`TARGET_COLLECTION = "gems_tr"`
			`EMBEDDING_MODEL = "snowflake-arctic-embed2"`
			`MAX_BATCH = 100`
			`USER_ID = "<USER_ID>"`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00

docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`def get_uncurated_memories(qdrant_url: str, collection: str, user_id: str, max_batch: int = 100) -> List[Dict[str, Any]]:`
			`"""Fetch uncurated memories from Qdrant."""`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`try:`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`response = requests.post(`
			`f"{qdrant_url}/collections/{collection}/points/scroll",`
			`json={`
			`"limit": max_batch,`
			`"filter": {`
			`"must": [`
			`{"key": "user_id", "match": {"value": user_id}},`
			`{"key": "curated", "match": {"value": False}}`
			`]`
			`},`
			`"with_payload": True`
			`},`
			`timeout=30`
			`)`
			`response.raise_for_status()`
			`data = response.json()`
			`return data.get("result", {}).get("points", [])`
			`except Exception as e:`
			`print(f"Error fetching memories: {e}", file=sys.stderr)`
			`return []`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00

docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`def extract_gems(memories: List[Dict[str, Any]], ollama_url: str) -> List[Dict[str, Any]]:`
			`"""Send memories to LLM for gem extraction."""`
			`if not memories:`
			`return []`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`SKIP_PATTERNS = [`
			`"gems extracted", "curator", "curation complete",`
			`"system is running", "validation round",`
			`]`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`conversation_lines = []`
			`for i, mem in enumerate(memories):`
			`payload = mem.get("payload", {})`
			`text = payload.get("text", "") or payload.get("content", "")`
			`role = payload.get("role", "")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`if not text:`
			`continue`
			`text = str(text)`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`if role == "assistant":`
			`continue`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`text_lower = text.lower()`
			`if len(text) < 20:`
			`continue`
			`if any(pattern in text_lower for pattern in SKIP_PATTERNS):`
			`continue`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`text = text[:500] if len(text) > 500 else text`
			`conversation_lines.append(f"[{i+1}] {text}")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`if not conversation_lines:`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`return []`

Update docs: watcher fix, plugin capture fix (2026-02-25) - Fixed watcher stuck on old session bug (restarted service) - Fixed plugin capture 0 exchanges (added extractMessageText for OpenAI content arrays) - Updated README, session.md, function_check.md, audit_checklist.md - Verified: 9 exchanges captured per session 2026-02-25 12:45:27 -06:00			`conversation_text = "\n\n".join(conversation_lines)`

			`prompt = """You are a memory curator. Extract atomic facts from the conversation below.`

			`For each distinct fact/decision/preference, output a JSON object with:`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`- "text": the atomic fact (1-2 sentences) - use FIRST PERSON ("I" not "User")`
Update docs: watcher fix, plugin capture fix (2026-02-25) - Fixed watcher stuck on old session bug (restarted service) - Fixed plugin capture 0 exchanges (added extractMessageText for OpenAI content arrays) - Updated README, session.md, function_check.md, audit_checklist.md - Verified: 9 exchanges captured per session 2026-02-25 12:45:27 -06:00			`- "category": one of [decision, preference, technical, project, knowledge, system]`
			`- "importance": "high" or "medium"`

			`Return ONLY a JSON array. Example:`
			`[`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`{"text": "I decided to use Redis for caching", "category": "decision", "importance": "high"},`
			`{"text": "I prefer dark mode", "category": "preference", "importance": "medium"}`
Update docs: watcher fix, plugin capture fix (2026-02-25) - Fixed watcher stuck on old session bug (restarted service) - Fixed plugin capture 0 exchanges (added extractMessageText for OpenAI content arrays) - Updated README, session.md, function_check.md, audit_checklist.md - Verified: 9 exchanges captured per session 2026-02-25 12:45:27 -06:00			`]`

			`If no extractable facts, return [].`

			`CONVERSATION:`
			`"""`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
Update docs: watcher fix, plugin capture fix (2026-02-25) - Fixed watcher stuck on old session bug (restarted service) - Fixed plugin capture 0 exchanges (added extractMessageText for OpenAI content arrays) - Updated README, session.md, function_check.md, audit_checklist.md - Verified: 9 exchanges captured per session 2026-02-25 12:45:27 -06:00			`full_prompt = f"{prompt}{conversation_text}\n\nJSON:"`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
			`try:`
			`response = requests.post(`
			`f"{ollama_url}/api/generate",`
			`json={`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`"model": "<CURATOR_MODEL>",`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`"system": prompt,`
Update docs: watcher fix, plugin capture fix (2026-02-25) - Fixed watcher stuck on old session bug (restarted service) - Fixed plugin capture 0 exchanges (added extractMessageText for OpenAI content arrays) - Updated README, session.md, function_check.md, audit_checklist.md - Verified: 9 exchanges captured per session 2026-02-25 12:45:27 -06:00			`"prompt": full_prompt,`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`"stream": False,`
			`"options": {`
			`"temperature": 0.1,`
			`"num_predict": 4000`
			`}`
			`},`
			`timeout=120`
			`)`
			`response.raise_for_status()`
			`except Exception as e:`
			`print(f"Error calling Ollama: {e}", file=sys.stderr)`
			`return []`

			`result = response.json()`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`response_text = result.get("response", "")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
			`try:`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`start = response_text.find('[')`
			`end = response_text.rfind(']')`
			`if start == -1 or end == -1:`
			`return []`
			`json_str = response_text[start:end+1]`
			`gems = json.loads(json_str)`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`if not isinstance(gems, list):`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`return []`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`return gems`
			`except json.JSONDecodeError as e:`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print(f"JSON parse error: {e}", file=sys.stderr)`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`return []`


			`def get_embedding(text: str, ollama_url: str) -> Optional[List[float]]:`
			`"""Get embedding from Ollama."""`
			`try:`
			`response = requests.post(`
			`f"{ollama_url}/api/embeddings",`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`json={`
			`"model": EMBEDDING_MODEL,`
			`"prompt": text`
			`},`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`timeout=30`
			`)`
			`response.raise_for_status()`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`data = response.json()`
			`return data.get("embedding")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`except Exception as e:`
			`print(f"Error getting embedding: {e}", file=sys.stderr)`
			`return None`


docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`def store_gem(gem: Dict[str, Any], vector: List[float], qdrant_url: str, target_collection: str, user_id: str) -> bool:`
			`"""Store a gem in Qdrant."""`
			`embedding_text = gem.get("text", "") or gem.get("gem", "")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`hash_content = f"{user_id}:{embedding_text[:100]}"`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`hash_bytes = hashlib.sha256(hash_content.encode()).digest()[:8]`
			`gem_id = int.from_bytes(hash_bytes, byteorder='big') % (2**63)`

			`payload = {`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`"text": embedding_text,`
			`"category": gem.get("category", "fact"),`
			`"importance": gem.get("importance", "medium"),`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`"user_id": user_id,`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`"created_at": datetime.now(timezone.utc).isoformat()`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`}`

			`try:`
			`response = requests.put(`
			`f"{qdrant_url}/collections/{target_collection}/points",`
			`json={`
			`"points": [{`
			`"id": abs(gem_id),`
			`"vector": vector,`
			`"payload": payload`
			`}]`
			`},`
			`timeout=30`
			`)`
			`response.raise_for_status()`
			`return True`
			`except Exception as e:`
			`print(f"Error storing gem: {e}", file=sys.stderr)`
			`return False`


			`def mark_curated(memory_ids: List, qdrant_url: str, collection: str) -> bool:`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`"""Mark memories as curated."""`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`if not memory_ids:`
			`return True`

			`try:`
			`response = requests.post(`
			`f"{qdrant_url}/collections/{collection}/points/payload",`
			`json={`
			`"points": memory_ids,`
			`"payload": {`
			`"curated": True,`
			`"curated_at": datetime.now(timezone.utc).isoformat()`
			`}`
			`},`
			`timeout=30`
			`)`
			`response.raise_for_status()`
			`return True`
			`except Exception as e:`
			`print(f"Error marking curated: {e}", file=sys.stderr)`
			`return False`


			`def main():`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print("TrueRecall v2 - Timer Curator")`
			`print(f"User: {USER_ID}")`
			`print(f"Source: {SOURCE_COLLECTION}")`
			`print(f"Target: {TARGET_COLLECTION}")`
			`print(f"Max batch: {MAX_BATCH}\n")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print("Fetching uncurated memories...")`
			`memories = get_uncurated_memories(QDRANT_URL, SOURCE_COLLECTION, USER_ID, MAX_BATCH)`
			`print(f"Found {len(memories)} uncurated memories\n")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
			`if not memories:`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print("Nothing to curate. Exiting.")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`return`

docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print("Sending memories to curator...")`
			`gems = extract_gems(memories, OLLAMA_URL)`
			`print(f"Extracted {len(gems)} gems\n")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
			`if not gems:`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print("No gems extracted. Exiting.")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`return`

docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print("Gems preview:")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`for i, gem in enumerate(gems[:3], 1):`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`text = gem.get("text", "N/A")[:50]`
			`print(f" {i}. {text}...")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`if len(gems) > 3:`
			`print(f" ... and {len(gems) - 3} more")`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print()`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print("Storing gems...")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`stored = 0`
			`for gem in gems:`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`text = gem.get("text", "") or gem.get("gem", "")`
			`if not text:`
			`continue`

			`vector = get_embedding(text, OLLAMA_URL)`
			`if vector:`
			`if store_gem(gem, vector, QDRANT_URL, TARGET_COLLECTION, USER_ID):`
			`stored += 1`

			`print(f"Stored: {stored}/{len(gems)}\n")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print("Marking memories as curated...")`
			`memory_ids = [mem.get("id") for mem in memories if mem.get("id")]`
			`if mark_curated(memory_ids, QDRANT_URL, SOURCE_COLLECTION):`
			`print(f"Marked {len(memory_ids)} memories as curated\n")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00			`else:`
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print("Failed to mark memories\n")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00
docs: simplify README, update validation and curator docs 2026-03-10 12:08:53 -05:00			`print("Curation complete!")`
Initial commit: TrueRecall v2.2 with 30b curator and timer-based curation 2026-02-24 20:27:44 -06:00

			`if __name__ == "__main__":`
			`main()`