bug-ops
diff --git a/CHANGELOG.md b/CHANGELOG.md
Lines changed: 3 additions & 0 deletions
diff --git a/crates/zeph-config/src/memory.rs b/crates/zeph-config/src/memory.rs
Lines changed: 95 additions & 1 deletion
diff --git a/crates/zeph-config/src/root.rs b/crates/zeph-config/src/root.rs
Lines changed: 1 addition & 0 deletions
diff --git a/crates/zeph-core/src/bootstrap/mod.rs b/crates/zeph-core/src/bootstrap/mod.rs
Lines changed: 39 additions & 1 deletion
@@ -19,6 +19,9 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/).
 - feat(skills): ERL experiential reflective learning — `spawn_erl_reflection()` fires a background LLM call after each successful skill+tool turn to extract transferable heuristics; heuristics are stored in `skill_heuristics` table with Jaccard deduplication; at skill matching time `build_erl_heuristics_prompt()` prepends a `## Learned Heuristics` section to the skill context; controlled by `[skills.learning] erl_enabled = false`, `erl_max_heuristics_per_skill = 3`, `erl_min_confidence = 0.5` (closes #2463)
 - feat(db): migrations 057 (`skill_usage_log`) and 058 (`skill_heuristics`) for STEM and ERL storage; both SQLite and Postgres variants
 - feat(config): `LearningConfig` extended with 14 new fields for ARISE/STEM/ERL (all disabled by default); new fields registered in `config/default.toml` as commented-out entries
+- feat(testing): memory benchmarking harness — `.local/testing/bench-memory.py` seeds N facts via agent CLI `--pipe` mode, recalls them, and reports `hit_rate`, `avg_recall_latency_ms`, `p50_ms`, `p99_ms`, `compression_ratio`, `interference_rate` as JSON; token-level hit matching tolerates LLM paraphrase; optional CSV append for longitudinal tracking; stdlib-only Python, no external dependencies (closes #2419)
+- feat(memory): cost-sensitive store routing — new `[memory.store_routing]` config section with `enabled`, `strategy` (`heuristic`/`llm`/`hybrid`), `routing_classifier_provider`, `confidence_threshold`, `fallback_route`; `RoutingDecision` struct carries route + confidence + reasoning; `LlmRouter` calls the configured provider with a quoted query (injection hardening) and parses a structured JSON response; `HybridRouter` runs the heuristic first and escalates to the LLM only when confidence < `confidence_threshold`; `HeuristicRouter::route_with_confidence()` returns granular confidence (`1.0 / matched_count` for ambiguous queries); `AsyncMemoryRouter` trait for async callers; all LLM paths fall back to the heuristic on failure (closes #2444)
+- feat(memory): CraniMem goal-conditioned write gate — `goal_utility` sixth factor added to `AdmissionFactors` and `AdmissionWeights`; new config fields `goal_conditioned_write`, `goal_utility_provider`, `goal_utility_threshold` (default 0.4), `goal_utility_weight` (default 0.25) in `[memory.admission]`; `GoalGateConfig` and `AdmissionControl::with_goal_gate()`; embedding-first scoring with optional LLM refinement for borderline cases; minimum goal text length check (goal text shorter than 10 chars is treated as absent, W3.1 fix); soft floor of 0.1 ensures that memories which clear the threshold never score zero; zero regression when `goal_conditioned_write = false` (closes #2408)
 - feat(core): `/new` slash command — resets conversation context (messages, compaction state, tool caches, focus/sidequest, pending plans) while preserving memory, MCP connections, providers, and skills; creates a new `ConversationId` in SQLite for audit trail; generates a session digest for the outgoing conversation fire-and-forget unless `--no-digest` is passed; active sub-agents and background compression tasks are cancelled; `--keep-plan` preserves a pending plan graph; available in all channels (CLI, TUI, Telegram) via the unified `handle_builtin_command` path (closes #2451)
 - feat(memory): Kumiho AGM-inspired belief revision for graph edges — new `BeliefRevisionConfig` with `similarity_threshold`; `find_superseded_edges()` uses contradiction heuristic (same relation domain + high cosine similarity = supersession); `superseded_by` column added to `graph_edges` for audit trail; `invalidate_edge_with_supersession()` in `GraphStore`; `resolve_edge_typed` accepts optional `BeliefRevisionConfig`; controlled by `[memory.graph.belief_revision] enabled = false` (migration 056, closes #2441)
 - feat(memory): D-MEM RPE-based tiered graph extraction routing — `RpeRouter` computes heuristic surprise score from context similarity and entity novelty; low-RPE turns skip the MAGMA LLM extraction pipeline; `consecutive_skips` safety valve forces extraction after `max_skip_turns` consecutive skips; `extract_candidate_entities()` helper for cheap regex+keyword entity detection; controlled by `[memory.graph.rpe] enabled = false, threshold = 0.3, max_skip_turns = 5` (closes #2442)
 
@@ -775,6 +775,12 @@ pub struct MemoryConfig {
     /// Default: `None` (uses `sqlite_path` instead).
     #[serde(default)]
     pub database_url: Option<String>,
+    /// Cost-sensitive store routing (#2444).
+    ///
+    /// When `store_routing.enabled = true`, query intent is classified and routed to
+    /// the cheapest sufficient backend instead of querying all stores on every turn.
+    #[serde(default)]
+    pub store_routing: StoreRoutingConfig,
 }
 
 fn default_crossover_turn_threshold() -> u32 {
@@ -1419,6 +1425,11 @@ pub struct AdmissionWeights {
     /// Content type prior based on role. Default: `0.15`.
     #[serde(deserialize_with = "validate_admission_weight")]
     pub content_type_prior: f32,
+    /// Goal-conditioned utility (#2408). `0.0` when `goal_conditioned_write = false`.
+    /// When enabled, set this alongside reducing `future_utility` so total sums remain stable.
+    /// Normalized automatically at runtime. Default: `0.0`.
+    #[serde(deserialize_with = "validate_admission_weight")]
+    pub goal_utility: f32,
 }
 
 impl Default for AdmissionWeights {
@@ -1429,6 +1440,7 @@ impl Default for AdmissionWeights {
             semantic_novelty: 0.30,
             temporal_recency: 0.10,
             content_type_prior: 0.15,
+            goal_utility: 0.0,
         }
     }
 }
@@ -1443,7 +1455,8 @@ impl AdmissionWeights {
             + self.factual_confidence
             + self.semantic_novelty
             + self.temporal_recency
-            + self.content_type_prior;
+            + self.content_type_prior
+            + self.goal_utility;
         if sum <= f32::EPSILON {
             return Self::default();
         }
@@ -1453,6 +1466,7 @@ impl AdmissionWeights {
             semantic_novelty: self.semantic_novelty / sum,
             temporal_recency: self.temporal_recency / sum,
             content_type_prior: self.content_type_prior / sum,
+            goal_utility: self.goal_utility / sum,
         }
     }
 }
@@ -1489,6 +1503,32 @@ pub struct AdmissionConfig {
     /// Background RL model retraining interval in seconds. Default: `3600`.
     #[serde(default = "default_rl_retrain_interval_secs")]
     pub rl_retrain_interval_secs: u64,
+    /// Enable goal-conditioned write gate (#2408). When `true`, memories are scored
+    /// against the current task goal and rejected if relevance is below `goal_utility_threshold`.
+    /// Zero regression when `false`. Default: `false`.
+    #[serde(default)]
+    pub goal_conditioned_write: bool,
+    /// Provider name from `[[llm.providers]]` for goal-utility LLM refinement, used only for
+    /// borderline cases (similarity within 0.1 of threshold). When empty, bootstrap passes no
+    /// provider; NOTE(review): confirm this falls back to the primary provider. Default: `""`.
+    #[serde(default)]
+    pub goal_utility_provider: String,
+    /// Minimum cosine similarity between goal embedding and candidate memory
+    /// to consider it goal-relevant. Below this, `goal_utility = 0.0`. Default: `0.4`.
+    #[serde(default = "default_goal_utility_threshold")]
+    pub goal_utility_threshold: f32,
+    /// Weight of the `goal_utility` factor in the composite admission score.
+    /// Set to `0.0` to disable (equivalent to `goal_conditioned_write = false`). Default: `0.25`.
+    #[serde(default = "default_goal_utility_weight")]
+    pub goal_utility_weight: f32,
+}
+
+fn default_goal_utility_threshold() -> f32 {
+    0.4 // serde default for `goal_utility_threshold` (minimum goal/candidate cosine similarity)
+}
+
+fn default_goal_utility_weight() -> f32 {
+    0.25 // serde default for `goal_utility_weight` (weight in the composite admission score)
 }
 
 impl Default for AdmissionConfig {
@@ -1502,6 +1542,58 @@ impl Default for AdmissionConfig {
             admission_strategy: AdmissionStrategy::default(),
             rl_min_samples: default_rl_min_samples(),
             rl_retrain_interval_secs: default_rl_retrain_interval_secs(),
+            goal_conditioned_write: false,
+            goal_utility_provider: String::new(),
+            goal_utility_threshold: default_goal_utility_threshold(),
+            goal_utility_weight: default_goal_utility_weight(),
+        }
+    }
+}
+
+/// Routing strategy for `[memory.store_routing]`; variants (de)serialize as `snake_case` names.
+#[derive(Debug, Clone, Copy, Default, PartialEq, Eq, Deserialize, Serialize)]
+#[serde(rename_all = "snake_case")]
+pub enum StoreRoutingStrategy {
+    /// `heuristic` (default): pure heuristic pattern matching, zero LLM calls.
+    #[default]
+    Heuristic,
+    /// `llm`: LLM-based classification via `routing_classifier_provider`.
+    Llm,
+    /// `hybrid`: heuristic first; escalates to the LLM only when confidence < `confidence_threshold`.
+    Hybrid,
+}
+
+/// Configuration for cost-sensitive store routing (`[memory.store_routing]`).
+///
+/// Controls how each query is classified and routed to the appropriate memory backend(s),
+/// avoiding unnecessary store queries for simple lookups. Omitted keys use the `Default` impl.
+#[derive(Debug, Clone, Deserialize, Serialize)]
+#[serde(default)]
+pub struct StoreRoutingConfig {
+    /// Enable configurable store routing. When `false`, `HeuristicRouter` is used
+    /// directly (existing behavior). Default: `false`.
+    pub enabled: bool,
+    /// Routing strategy: `heuristic`, `llm`, or `hybrid`. Default: `heuristic`.
+    pub strategy: StoreRoutingStrategy,
+    /// Provider name from `[[llm.providers]]` for LLM-based classification.
+    /// Falls back to the primary provider when empty. Default: `""`.
+    pub routing_classifier_provider: String,
+    /// Route to use when the classifier is uncertain (confidence < threshold).
+    /// NOTE(review): presumably a route name, not a `strategy` value — confirm. Default: `"hybrid"`.
+    pub fallback_route: String,
+    /// Confidence threshold below which `HybridRouter` escalates to LLM.
+    /// Expected range: `[0.0, 1.0]` (no serde validator on this field). Default: `0.7`.
+    pub confidence_threshold: f32,
+}
+
+impl Default for StoreRoutingConfig {
+    fn default() -> Self {
+        Self {
+            enabled: false, // routing is opt-in
+            strategy: StoreRoutingStrategy::Heuristic, // same variant as the enum's `#[default]`
+            routing_classifier_provider: String::new(), // empty: no dedicated classifier provider
+            fallback_route: "hybrid".into(), // matches the documented default `"hybrid"`
+            confidence_threshold: 0.7, // matches the documented default `0.7`
         }
     }
 }
@@ -1648,6 +1740,7 @@ mod tests {
             semantic_novelty: 3.0,
             temporal_recency: 1.0,
             content_type_prior: 3.0,
+            goal_utility: 0.0,
         };
         let n = w.normalized();
         let sum = n.future_utility
@@ -1686,6 +1779,7 @@ mod tests {
             semantic_novelty: 0.0,
             temporal_recency: 0.0,
             content_type_prior: 0.0,
+            goal_utility: 0.0,
         };
         let n = w.normalized();
         let default = AdmissionWeights::default();
 
@@ -206,6 +206,7 @@ impl Default for Config {
                 crossover_turn_threshold: 20,
                 consolidation: crate::memory::ConsolidationConfig::default(),
                 database_url: None,
+                store_routing: crate::memory::StoreRoutingConfig::default(),
             },
             telegram: None,
             discord: None,
 
@@ -363,14 +363,52 @@ impl AppBuilder {
             semantic_novelty: w.semantic_novelty,
             temporal_recency: w.temporal_recency,
             content_type_prior: w.content_type_prior,
+            goal_utility: w.goal_utility,
         };
-        let control = zeph_memory::AdmissionControl::new(
+        let mut control = zeph_memory::AdmissionControl::new(
             self.config.memory.admission.threshold,
             self.config.memory.admission.fast_path_margin,
             weights,
         )
         .with_provider(admission_provider);
 
+        if self.config.memory.admission.goal_conditioned_write {
+            let goal_provider = if self
+                .config
+                .memory
+                .admission
+                .goal_utility_provider
+                .is_empty()
+            {
+                None
+            } else {
+                match create_named_provider(
+                    &self.config.memory.admission.goal_utility_provider,
+                    &self.config,
+                ) {
+                    Ok(p) => Some(p),
+                    Err(e) => {
+                        tracing::warn!(
+                            provider = %self.config.memory.admission.goal_utility_provider,
+                            error = %e,
+                            "goal_utility_provider not found, LLM refinement disabled"
+                        );
+                        None
+                    }
+                }
+            };
+            control = control.with_goal_gate(zeph_memory::GoalGateConfig {
+                threshold: self.config.memory.admission.goal_utility_threshold,
+                provider: goal_provider,
+                weight: self.config.memory.admission.goal_utility_weight,
+            });
+            tracing::info!(
+                threshold = self.config.memory.admission.goal_utility_threshold,
+                weight = self.config.memory.admission.goal_utility_weight,
+                "A-MAC: goal-conditioned write gate enabled"
+            );
+        }
+
         if self.config.memory.admission.admission_strategy == zeph_config::AdmissionStrategy::Rl {
             tracing::warn!(
                 "admission_strategy = \"rl\" is configured but the RL model is not yet wired \