knowledge: agent self-correction with audit + per-persona gate + revert
Bundles three coupled changes so agent-side mutations stay
auditable and reversible:
1. Audit columns on entity_facts —
`last_modified_by_model` / `last_modified_by_backend` /
`last_modified_at`. Stamped on every mutation path
(update_fact, supersede_fact, manual PATCH, manual supersede,
the new revert). NULL on rows never touched since creation.
Partial index on `last_modified_at WHERE NOT NULL` keeps the
"show me recent edits" feed fast without bloating from legacy
rows.
2. Per-persona gate `personas.allow_agent_corrections` (BOOLEAN,
default 0). Defense in depth at two layers:
- build_tool_definitions: when off, `update_fact` and
`supersede_fact` aren't in the catalog at all, so even a
hallucinated tool call by the model fails fast.
- tool_update_fact / tool_supersede_fact: re-checks the persona
flag at call time and returns an explicit "corrections
disabled" error if it's somehow off (e.g. flag flipped mid-
loop).
ToolGateOpts grows the flag; current_gate_opts splits into
`current_gate_opts` (no persona context, defaults closed) +
`current_gate_opts_for_persona` for chat callers that have a
persona id. Both call sites in insight_chat are updated.
3. Revert action — new DAO method `revert_supersession` +
`POST /knowledge/facts/{id}/restore`. Flips status back to
'active', clears `superseded_by`, clears `valid_until` (we
don't track whether it was hand-set vs auto-stamped, so the
safe reset is to drop it — user can re-bound after). Stamps
`last_modified_*` so the revert itself is attributable.
Manual paths (PATCH / supersede via HTTP, plus restore) stamp the
audit columns with `("manual", "manual")`. Agent paths stamp the
loop-time chat model and backend (mirroring the existing
created_by_* convention).
FactDetail in the HTTP response now carries the audit triple
alongside the existing provenance. Apollo wires the new field set
in the matching commit.
PersonaView / UpdatePersonaRequest grow `allowAgentCorrections`;
the PersonaPatch + InsertPersona + bulk_import paths thread it.
317 lib tests pass, including unchanged update_fact / supersede
DAO tests (now passing audit=None — None means "no provenance
context to attribute", legacy semantics).
Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
This commit is contained in:
@@ -108,6 +108,12 @@ pub struct ToolGateOpts {
|
||||
pub calendar_present: bool,
|
||||
pub location_history_present: bool,
|
||||
pub faces_present: bool,
|
||||
/// Per-persona toggle from migration 2026-05-10-000500. When
|
||||
/// false the agent's update_fact / supersede_fact tools aren't
|
||||
/// in the catalog at all — defense-in-depth so a hallucinated
|
||||
/// tool name still 404s, and the agent doesn't waste iterations
|
||||
/// trying corrections it isn't allowed to do.
|
||||
pub allow_agent_corrections: bool,
|
||||
}
|
||||
|
||||
impl InsightGenerator {
|
||||
@@ -164,6 +170,20 @@ impl InsightGenerator {
|
||||
/// supplied by the caller because it depends on the model selected
|
||||
/// for this turn, not on persistent state.
|
||||
pub fn current_gate_opts(&self, has_vision: bool) -> ToolGateOpts {
|
||||
self.current_gate_opts_for_persona(has_vision, None)
|
||||
}
|
||||
|
||||
/// Same as `current_gate_opts` but resolves the per-persona
|
||||
/// `allow_agent_corrections` flag too. Pass `Some((user_id,
|
||||
/// persona_id))` when generating in a persona context (every chat
|
||||
/// turn does); pass `None` for callers that don't have one yet
|
||||
/// (cold paths, populate_knowledge bin), which defaults the gate
|
||||
/// to closed — the conservative posture.
|
||||
pub fn current_gate_opts_for_persona(
|
||||
&self,
|
||||
has_vision: bool,
|
||||
persona: Option<(i32, &str)>,
|
||||
) -> ToolGateOpts {
|
||||
let cx = opentelemetry::Context::new();
|
||||
let calendar_present = {
|
||||
let mut dao = self
|
||||
@@ -190,6 +210,16 @@ impl InsightGenerator {
|
||||
let mut dao = self.face_dao.lock().expect("Unable to lock FaceDao");
|
||||
dao.has_any_faces(&cx).unwrap_or(false)
|
||||
};
|
||||
let allow_agent_corrections = persona
|
||||
.and_then(|(uid, pid)| {
|
||||
let mut pdao = self
|
||||
.persona_dao
|
||||
.lock()
|
||||
.expect("Unable to lock PersonaDao");
|
||||
pdao.get_persona(&cx, uid, pid).ok().flatten()
|
||||
})
|
||||
.map(|p| p.allow_agent_corrections)
|
||||
.unwrap_or(false);
|
||||
ToolGateOpts {
|
||||
has_vision,
|
||||
apollo_enabled: self.apollo_enabled(),
|
||||
@@ -197,6 +227,7 @@ impl InsightGenerator {
|
||||
calendar_present,
|
||||
location_history_present,
|
||||
faces_present,
|
||||
allow_agent_corrections,
|
||||
}
|
||||
}
|
||||
|
||||
@@ -1592,6 +1623,14 @@ Return ONLY the summary, nothing else."#,
|
||||
)
|
||||
.await
|
||||
}
|
||||
"update_fact" => {
|
||||
self.tool_update_fact(arguments, user_id, persona_id, model, backend, cx)
|
||||
.await
|
||||
}
|
||||
"supersede_fact" => {
|
||||
self.tool_supersede_fact(arguments, user_id, persona_id, model, backend, cx)
|
||||
.await
|
||||
}
|
||||
"get_current_datetime" => Self::tool_get_current_datetime(),
|
||||
unknown => format!("Unknown tool: {}", unknown),
|
||||
};
|
||||
@@ -2761,6 +2800,12 @@ Return ONLY the summary, nothing else."#,
|
||||
superseded_by: None,
|
||||
created_by_model: Some(model.to_string()),
|
||||
created_by_backend: Some(backend.to_string()),
|
||||
// Initial write — no modification yet; last_modified_*
|
||||
// intentionally NULL so the audit feed only shows real
|
||||
// post-creation changes.
|
||||
last_modified_by_model: None,
|
||||
last_modified_by_backend: None,
|
||||
last_modified_at: None,
|
||||
};
|
||||
|
||||
let mut kdao = self
|
||||
@@ -2800,6 +2845,151 @@ Return ONLY the summary, nothing else."#,
|
||||
)
|
||||
}
|
||||
|
||||
/// Tool: update_fact — patch a fact's mutable fields. Gated by the
|
||||
/// active persona's `allow_agent_corrections` flag at the schema /
|
||||
/// catalog layer (build_tool_definitions); rechecked here as a
|
||||
/// defense in depth in case a hallucinated tool call slips
|
||||
/// through.
|
||||
async fn tool_update_fact(
|
||||
&self,
|
||||
args: &serde_json::Value,
|
||||
user_id: i32,
|
||||
persona_id: &str,
|
||||
model: &str,
|
||||
backend: &str,
|
||||
cx: &opentelemetry::Context,
|
||||
) -> String {
|
||||
use crate::database::FactPatch;
|
||||
|
||||
// Defense-in-depth gate check.
|
||||
let allowed = {
|
||||
let mut pdao = self.persona_dao.lock().expect("Unable to lock PersonaDao");
|
||||
pdao.get_persona(cx, user_id, persona_id)
|
||||
.ok()
|
||||
.flatten()
|
||||
.map(|p| p.allow_agent_corrections)
|
||||
.unwrap_or(false)
|
||||
};
|
||||
if !allowed {
|
||||
return "Error: agent corrections are disabled for this persona. Ask the operator to flip allow_agent_corrections.".to_string();
|
||||
}
|
||||
|
||||
let fact_id = match args.get("fact_id").and_then(|v| v.as_i64()) {
|
||||
Some(id) => id as i32,
|
||||
None => return "Error: missing required parameter 'fact_id'".to_string(),
|
||||
};
|
||||
|
||||
// Build the patch from any fields present on `args`. valid_*
|
||||
// are tri-state — JSON null → Some(None) → clear back to NULL,
|
||||
// omitted → None → leave alone, value → Some(Some(value)) →
|
||||
// set. The match-on-presence pattern below mirrors the HTTP
|
||||
// PATCH path's serde-helper behaviour.
|
||||
let parse_optional_i64 =
|
||||
|v: Option<&serde_json::Value>| -> Option<Option<i64>> {
|
||||
v.map(|val| {
|
||||
if val.is_null() {
|
||||
None
|
||||
} else {
|
||||
val.as_i64()
|
||||
}
|
||||
})
|
||||
};
|
||||
|
||||
let patch = FactPatch {
|
||||
predicate: args
|
||||
.get("predicate")
|
||||
.and_then(|v| v.as_str())
|
||||
.map(|s| s.to_string()),
|
||||
object_value: args
|
||||
.get("object_value")
|
||||
.and_then(|v| v.as_str())
|
||||
.map(|s| s.to_string()),
|
||||
status: args
|
||||
.get("status")
|
||||
.and_then(|v| v.as_str())
|
||||
.filter(|s| matches!(*s, "active" | "reviewed" | "rejected"))
|
||||
.map(|s| s.to_string()),
|
||||
confidence: args
|
||||
.get("confidence")
|
||||
.and_then(|v| v.as_f64())
|
||||
.map(|f| f.clamp(0.0, 0.95) as f32),
|
||||
valid_from: parse_optional_i64(args.get("valid_from")),
|
||||
valid_until: parse_optional_i64(args.get("valid_until")),
|
||||
};
|
||||
|
||||
log::info!("tool_update_fact: fact_id={}", fact_id);
|
||||
|
||||
let mut kdao = self
|
||||
.knowledge_dao
|
||||
.lock()
|
||||
.expect("Unable to lock KnowledgeDao");
|
||||
|
||||
match kdao.update_fact(cx, fact_id, patch, Some((model, backend))) {
|
||||
Ok(Some(f)) => format!(
|
||||
"Updated fact ID:{} (status={}, confidence={:.2})",
|
||||
f.id, f.status, f.confidence
|
||||
),
|
||||
Ok(None) => format!("Error: fact ID:{} not found", fact_id),
|
||||
Err(e) => format!("Error updating fact: {:?}", e),
|
||||
}
|
||||
}
|
||||
|
||||
/// Tool: supersede_fact — replace one fact with another. Same
|
||||
/// gating as update_fact.
|
||||
async fn tool_supersede_fact(
|
||||
&self,
|
||||
args: &serde_json::Value,
|
||||
user_id: i32,
|
||||
persona_id: &str,
|
||||
model: &str,
|
||||
backend: &str,
|
||||
cx: &opentelemetry::Context,
|
||||
) -> String {
|
||||
let allowed = {
|
||||
let mut pdao = self.persona_dao.lock().expect("Unable to lock PersonaDao");
|
||||
pdao.get_persona(cx, user_id, persona_id)
|
||||
.ok()
|
||||
.flatten()
|
||||
.map(|p| p.allow_agent_corrections)
|
||||
.unwrap_or(false)
|
||||
};
|
||||
if !allowed {
|
||||
return "Error: agent corrections are disabled for this persona.".to_string();
|
||||
}
|
||||
|
||||
let old_fact_id = match args.get("old_fact_id").and_then(|v| v.as_i64()) {
|
||||
Some(id) => id as i32,
|
||||
None => return "Error: missing required parameter 'old_fact_id'".to_string(),
|
||||
};
|
||||
let new_fact_id = match args.get("new_fact_id").and_then(|v| v.as_i64()) {
|
||||
Some(id) => id as i32,
|
||||
None => return "Error: missing required parameter 'new_fact_id'".to_string(),
|
||||
};
|
||||
if old_fact_id == new_fact_id {
|
||||
return "Error: old_fact_id and new_fact_id must differ".to_string();
|
||||
}
|
||||
|
||||
log::info!(
|
||||
"tool_supersede_fact: old={}, new={}",
|
||||
old_fact_id,
|
||||
new_fact_id
|
||||
);
|
||||
|
||||
let mut kdao = self
|
||||
.knowledge_dao
|
||||
.lock()
|
||||
.expect("Unable to lock KnowledgeDao");
|
||||
|
||||
match kdao.supersede_fact(cx, old_fact_id, new_fact_id, Some((model, backend))) {
|
||||
Ok(Some(f)) => format!(
|
||||
"Superseded fact ID:{} (now status={}, valid_until={:?})",
|
||||
f.id, f.status, f.valid_until
|
||||
),
|
||||
Ok(None) => "Error: old or new fact not found".to_string(),
|
||||
Err(e) => format!("Error superseding fact: {:?}", e),
|
||||
}
|
||||
}
|
||||
|
||||
/// Tool: get_current_datetime — returns the current local date and time
|
||||
fn tool_get_current_datetime() -> String {
|
||||
let now = Local::now();
|
||||
@@ -3049,6 +3239,55 @@ Return ONLY the summary, nothing else."#,
|
||||
}),
|
||||
));
|
||||
|
||||
// Self-correction tools — only exposed when the active persona
|
||||
// has allow_agent_corrections=true. Gating happens here AND in
|
||||
// the tool method itself (the runtime check is the load-bearing
|
||||
// one; this just keeps the tool out of the model's catalog so
|
||||
// it doesn't waste iterations trying calls it can't make).
|
||||
if opts.allow_agent_corrections {
|
||||
tools.push(Tool::function(
|
||||
"update_fact",
|
||||
"Correct an existing fact in the knowledge memory. Use sparingly — only when you have \
|
||||
stronger evidence than the original write justified (e.g. a clearer photo, a \
|
||||
contradicting timestamp on a related fact, or explicit user correction). Common \
|
||||
patches: tighten `valid_from` / `valid_until` to a known interval, downgrade \
|
||||
`confidence` after seeing contradicting evidence, or flip `status` to 'reviewed' if \
|
||||
you've verified the fact independently. Cannot change subject / object — supersede \
|
||||
instead. Pass `fact_id` plus any subset of patchable fields.",
|
||||
serde_json::json!({
|
||||
"type": "object",
|
||||
"required": ["fact_id"],
|
||||
"properties": {
|
||||
"fact_id": { "type": "integer", "description": "ID of the fact to patch (from recall_facts_for_photo or list)." },
|
||||
"predicate": { "type": "string", "description": "New predicate string. Rare." },
|
||||
"object_value": { "type": "string", "description": "New free-text object. Use for typed-fact corrections." },
|
||||
"status": { "type": "string", "description": "'active' | 'reviewed' | 'rejected'. 'superseded' is for the supersede_fact tool." },
|
||||
"confidence": { "type": "number", "description": "0.0–0.95. Lower when you've seen contradicting evidence." },
|
||||
"valid_from": { "type": "integer", "description": "Unix-seconds lower bound on when the fact began being true. Null clears." },
|
||||
"valid_until": { "type": "integer", "description": "Unix-seconds upper bound on when the fact stopped being true. Null clears." }
|
||||
}
|
||||
}),
|
||||
));
|
||||
|
||||
tools.push(Tool::function(
|
||||
"supersede_fact",
|
||||
"Mark an old fact as replaced by a newer one. Use when the new fact contradicts the \
|
||||
old AND the contradiction is a *time-bounded change* (relationship changed, address \
|
||||
changed, role changed), not a correction of a mistake — for mistakes, set the old \
|
||||
fact's status to 'rejected' via update_fact. Atomically: flips old.status to \
|
||||
'superseded', points old.superseded_by at the new fact, and stamps old.valid_until \
|
||||
from new.valid_from (when not already set) so the two intervals are disjoint.",
|
||||
serde_json::json!({
|
||||
"type": "object",
|
||||
"required": ["old_fact_id", "new_fact_id"],
|
||||
"properties": {
|
||||
"old_fact_id": { "type": "integer", "description": "The fact being replaced." },
|
||||
"new_fact_id": { "type": "integer", "description": "The fact that replaces it. Must already exist (use store_fact first if you're recording a new one)." }
|
||||
}
|
||||
}),
|
||||
));
|
||||
}
|
||||
|
||||
tools.push(Tool::function(
|
||||
"get_current_datetime",
|
||||
"Get the current date and time. Useful when reasoning about how long ago a photo was taken.",
|
||||
@@ -4008,6 +4247,7 @@ mod tests {
|
||||
calendar_present: false,
|
||||
location_history_present: false,
|
||||
faces_present: false,
|
||||
allow_agent_corrections: false,
|
||||
};
|
||||
let tools = InsightGenerator::build_tool_definitions(opts);
|
||||
let names: Vec<&str> = tools.iter().map(|t| t.function.name.as_str()).collect();
|
||||
@@ -4030,6 +4270,9 @@ mod tests {
|
||||
assert!(!names.contains(&"get_calendar_events"));
|
||||
assert!(!names.contains(&"get_location_history"));
|
||||
assert!(!names.contains(&"get_faces_in_photo"));
|
||||
// Agent-correction tools are absent without the gate.
|
||||
assert!(!names.contains(&"update_fact"));
|
||||
assert!(!names.contains(&"supersede_fact"));
|
||||
}
|
||||
|
||||
#[test]
|
||||
@@ -4041,6 +4284,7 @@ mod tests {
|
||||
calendar_present: true,
|
||||
location_history_present: true,
|
||||
faces_present: true,
|
||||
allow_agent_corrections: true,
|
||||
};
|
||||
let tools = InsightGenerator::build_tool_definitions(opts);
|
||||
let names: Vec<&str> = tools.iter().map(|t| t.function.name.as_str()).collect();
|
||||
@@ -4050,6 +4294,8 @@ mod tests {
|
||||
assert!(names.contains(&"get_calendar_events"));
|
||||
assert!(names.contains(&"get_location_history"));
|
||||
assert!(names.contains(&"get_faces_in_photo"));
|
||||
assert!(names.contains(&"update_fact"));
|
||||
assert!(names.contains(&"supersede_fact"));
|
||||
}
|
||||
|
||||
fn place(name: &str, description: &str) -> ApolloPlace {
|
||||
|
||||
Reference in New Issue
Block a user