riteshverma
diff --git a/‎config/settings.defaults.json‎
Lines changed: 57 additions & 1 deletion b/‎config/settings.defaults.json‎
Lines changed: 57 additions & 1 deletion
diff --git a/‎config/settings.json‎
Lines changed: 58 additions & 2 deletions b/‎config/settings.json‎
Lines changed: 58 additions & 2 deletions
diff --git a/‎config/settings_loader.py‎
Lines changed: 47 additions & 0 deletions b/‎config/settings_loader.py‎
Lines changed: 47 additions & 0 deletions
@@ -29,7 +29,16 @@
         "chunk_overlap": 40,
         "max_chunk_length": 512,
         "semantic_word_limit": 1024,
-        "top_k": 3
+        "top_k": 3,
+        "rerank": {
+            "enabled": false,
+            "provider": "local_oss",
+            "model": "",
+            "candidate_k": 40,
+            "top_k": null,
+            "timeout_seconds": 8.0,
+            "batch_size": 8
+        }
     },
     "agent": {
         "model_provider": "gemini",
@@ -63,6 +72,53 @@
             "read_from_bridge": false,
             "mirror_dir": "memory/gbrain_bridge",
             "server_id": "gbrain"
+        },
+        "policy": {
+            "enabled": true,
+            "write": {
+                "max_text_length": 2000,
+                "blocked_patterns": [],
+                "allowed_sources": [],
+                "denied_sources": [],
+                "allowed_categories": [],
+                "denied_categories": [],
+                "default_ttl_seconds": null,
+                "source_ttl_overrides": {
+                    "run_*": 1209600,
+                    "manual_scan_*": 604800,
+                    "backfill_*": 259200
+                }
+            },
+            "read": {
+                "allowed_sources": [],
+                "denied_sources": [],
+                "allowed_categories": [],
+                "denied_categories": [],
+                "exclude_expired": true,
+                "requester_overrides": {
+                    "run_context": {
+                        "allowed_sources": [
+                            "manual",
+                            "run_*"
+                        ],
+                        "denied_sources": [
+                            "manual_scan_*",
+                            "backfill_*"
+                        ],
+                        "allowed_categories": [],
+                        "denied_categories": []
+                    },
+                    "smart_scan": {
+                        "allowed_sources": [
+                            "manual",
+                            "run_*"
+                        ],
+                        "denied_sources": [],
+                        "allowed_categories": [],
+                        "denied_categories": []
+                    }
+                }
+            }
         }
     },
     "gemini": {
 
@@ -17,7 +17,16 @@
     "chunk_overlap": 40,
     "max_chunk_length": 512,
     "semantic_word_limit": 1024,
-    "top_k": 3
+    "top_k": 3,
+    "rerank": {
+      "enabled": true,
+      "provider": "local_oss",
+      "model": "",
+      "candidate_k": 40,
+      "top_k": null,
+      "timeout_seconds": 8.0,
+      "batch_size": 8
+    }
   },
   "agent": {
     "model_provider": "ollama",
@@ -44,7 +53,54 @@
     "test_agent_model": "gemma3:4b"
   },
   "remme": {
-    "extraction_prompt": "You are a Contextual Memory Management AI.\nYour job is to update the \"Memory Vault\" based on the latest conversation.\n\nRULES:\n1. ANTI-FRAGMENTATION: NEVER split related items into separate facts. Merge them into ONE rich, coherent memory entry.\n2. NO REDUNDANCY: If info is already captured, do nothing unless you have NEW details (use \"update\").\n3. CONTEXTUAL HUBS: Prefer a single \"Hub\" memory over separate atomic facts; emit it as one entry in \"memories\" (see OUTPUT FORMAT).\n4. NO NEGATIVE FACTS: NEVER store \"not found\" or \"missing\" info.\n5. NO META-LOGS: Do not store internal reasoning or agent traces.\n6. HIGH SALIENCE ONLY: Focus on project decisions, user preferences, architectural details.\n7. ACTIONS: \"add\" for new facts, \"update\" to expand existing, \"delete\" if proven false.\n\nOUTPUT FORMAT: Respond with JSON only: {\"memories\": [{\"action\": \"add\"|\"update\"|\"delete\", \"text\": \"...\", \"id\": \"...\" only for update/delete}], \"preferences\": {...}}. If nothing to store: {\"memories\": [], \"preferences\": {}}."
+    "extraction_prompt": "You are a Contextual Memory Management AI.\nYour job is to update the \"Memory Vault\" based on the latest conversation.\n\nRULES:\n1. ANTI-FRAGMENTATION: NEVER split related items into separate facts. Merge them into ONE rich, coherent memory entry.\n2. NO REDUNDANCY: If info is already captured, do nothing unless you have NEW details (use \"update\").\n3. CONTEXTUAL HUBS: Prefer a single \"Hub\" memory over separate atomic facts; emit it as one entry in \"memories\" (see OUTPUT FORMAT).\n4. NO NEGATIVE FACTS: NEVER store \"not found\" or \"missing\" info.\n5. NO META-LOGS: Do not store internal reasoning or agent traces.\n6. HIGH SALIENCE ONLY: Focus on project decisions, user preferences, architectural details.\n7. ACTIONS: \"add\" for new facts, \"update\" to expand existing, \"delete\" if proven false.\n\nOUTPUT FORMAT: Respond with JSON only: {\"memories\": [{\"action\": \"add\"|\"update\"|\"delete\", \"text\": \"...\", \"id\": \"...\" only for update/delete}], \"preferences\": {...}}. If nothing to store: {\"memories\": [], \"preferences\": {}}.",
+    "policy": {
+      "enabled": true,
+      "write": {
+        "max_text_length": 2000,
+        "blocked_patterns": [],
+        "allowed_sources": [],
+        "denied_sources": [],
+        "allowed_categories": [],
+        "denied_categories": [],
+        "default_ttl_seconds": null,
+        "source_ttl_overrides": {
+          "run_*": 1209600,
+          "manual_scan_*": 604800,
+          "backfill_*": 259200
+        }
+      },
+      "read": {
+        "allowed_sources": [],
+        "denied_sources": [],
+        "allowed_categories": [],
+        "denied_categories": [],
+        "exclude_expired": true,
+        "requester_overrides": {
+          "run_context": {
+            "allowed_sources": [
+              "manual",
+              "run_*"
+            ],
+            "denied_sources": [
+              "manual_scan_*",
+              "backfill_*"
+            ],
+            "allowed_categories": [],
+            "denied_categories": []
+          },
+          "smart_scan": {
+            "allowed_sources": [
+              "manual",
+              "run_*"
+            ],
+            "denied_sources": [],
+            "allowed_categories": [],
+            "denied_categories": []
+          }
+        }
+      }
+    }
   },
   "gemini": {
     "api_key_env": "GEMINI_API_KEY"
 
@@ -403,6 +403,53 @@ def get_embedding_provider() -> str:
     return provider or "ollama"
 
 
def get_rag_rerank_settings(settings: "dict | None" = None) -> dict:
    """Get normalized RAG reranker settings with safe defaults.

    Reads the ``rag.rerank`` section of the settings and coerces every field
    to a predictable type, falling back to a default whenever the configured
    value is missing or unusable.

    Args:
        settings: Optional already-loaded settings mapping. When ``None``
            (the default) the settings are obtained from ``load_settings()``.

    Returns:
        A dict with the keys ``enabled`` (bool), ``provider`` (str),
        ``model`` (str), ``candidate_k`` (int > 0), ``top_k`` (int > 0 or
        ``None``), ``timeout_seconds`` (finite float > 0) and ``batch_size``
        (int > 0).
    """
    import math

    if settings is None:
        settings = load_settings()
    rag_settings = settings.get("rag", {}) if isinstance(settings, dict) else {}
    rerank = rag_settings.get("rerank", {}) if isinstance(rag_settings, dict) else {}
    if not isinstance(rerank, dict):
        rerank = {}

    def _as_bool(value, default: bool) -> bool:
        # bool("false") is True, so string flags must be parsed explicitly.
        if value is None:
            return default
        if isinstance(value, str):
            token = value.strip().lower()
            if token in {"1", "true", "yes", "on"}:
                return True
            if token in {"", "0", "false", "no", "off"}:
                return False
            # Unrecognized text: fall back rather than guess.
            return default
        return bool(value)

    def _optional_positive_int(value):
        # A JSON boolean is not a count; int(True) == 1 would hide the typo.
        if value is None or isinstance(value, bool):
            return None
        if isinstance(value, str) and not value.strip():
            return None
        try:
            parsed = int(value)
        except (TypeError, ValueError, OverflowError):
            # OverflowError: int(float("inf")), reachable via JSON `Infinity`.
            return None
        return parsed if parsed > 0 else None

    def _positive_int(value, default: int) -> int:
        parsed = _optional_positive_int(value)
        return default if parsed is None else parsed

    def _positive_float(value, default: float) -> float:
        if isinstance(value, bool):
            return default
        try:
            parsed = float(value)
        except (TypeError, ValueError, OverflowError):
            # OverflowError: float() of an integer too large to represent.
            return default
        # Reject inf/nan so the result is always a usable finite timeout.
        if math.isfinite(parsed) and parsed > 0:
            return parsed
        return default

    provider = str(rerank.get("provider", "local_oss") or "local_oss").strip().lower()
    if not provider:
        # Whitespace-only value: treat it the same as a missing provider.
        provider = "local_oss"
    if provider in {"none", "disabled", "off"}:
        provider = "noop"

    return {
        "enabled": _as_bool(rerank.get("enabled"), False),
        "provider": provider,
        "model": str(rerank.get("model", "") or "").strip(),
        "candidate_k": _positive_int(rerank.get("candidate_k"), 40),
        "top_k": _optional_positive_int(rerank.get("top_k")),
        "timeout_seconds": _positive_float(rerank.get("timeout_seconds"), 8.0),
        "batch_size": _positive_int(rerank.get("batch_size"), 8),
    }
+
+
 def get_timeout() -> int:
     """Return the Ollama timeout, in seconds, from the loaded settings."""
     ollama_section = load_settings()["ollama"]
     return ollama_section["timeout"]