Merge pull request 'feat(truth): add scoring pipeline module (#34)' (#48) from feature/truth-scorer into main

Merge truth scoring pipeline module (#34)
2026-06-15 22:07:08 +00:00 · 2026-04-04 03:57:59 +00:00
parent 075d06a2ec a7a070024a
commit 50d0a944b5
2 changed files with 397 additions and 0 deletions
--- a/src/truth/mod.rs
+++ b/src/truth/mod.rs
@@ -13,3 +13,4 @@

 pub mod ecan;
 pub mod pln;
+pub mod scorer;
--- a/src/truth/scorer.rs
+++ b/src/truth/scorer.rs
@@ -0,0 +1,396 @@
+//! Truth scoring pipeline — orchestrates PLN, ECAN, and cross-referencing
+//! to produce truth scores for memories.
+//!
+//! This is the core intelligence module that evaluates each memory by:
+//! 1. Finding related memories via vector similarity (cross-referencing)
+//! 2. Classifying related memories as confirmations or contradictions
+//! 3. Applying PLN evidence-based scoring
+//! 4. Computing ECAN attention values (STI/LTI)
+//! 5. Categorizing the result
+
+use crate::truth::ecan::EcanParams;
+use crate::truth::pln::{self, TruthValue};
+
+/// Truth category assigned after scoring.
+#[derive(Debug, Clone, PartialEq, Eq)]
+pub enum TruthCategory {
+    /// TV ≥ verification_threshold AND has confirmations
+    Verified,
+    /// TV ≥ 0.5
+    Plausible,
+    /// TV < 0.5 AND no contradictions
+    Unverified,
+    /// Contradictions detected
+    Contradicted,
+}
+
+impl TruthCategory {
+    pub fn as_str(&self) -> &'static str {
+        match self {
+            TruthCategory::Verified => "verified",
+            TruthCategory::Plausible => "plausible",
+            TruthCategory::Unverified => "unverified",
+            TruthCategory::Contradicted => "contradicted",
+        }
+    }
+}
+
+impl std::fmt::Display for TruthCategory {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.write_str(self.as_str())
+    }
+}
+
+/// Configuration for the scoring pipeline.
+#[derive(Debug, Clone)]
+pub struct ScorerConfig {
+    /// Base confidence for PLN scoring when no prior exists.
+    pub pln_base_confidence: f32,
+    /// Similarity threshold above which two memories are considered related.
+    pub contradiction_threshold: f32,
+    /// Truth value threshold for "verified" category.
+    pub verification_threshold: f32,
+    /// ECAN parameters.
+    pub ecan: EcanParams,
+}
+
+impl Default for ScorerConfig {
+    fn default() -> Self {
+        Self {
+            pln_base_confidence: 0.85,
+            contradiction_threshold: 0.85,
+            verification_threshold: 0.8,
+            ecan: EcanParams::default(),
+        }
+    }
+}
+
+/// A related memory found during cross-referencing.
+#[derive(Debug, Clone)]
+pub struct RelatedMemory {
+    /// Cosine similarity to the candidate memory.
+    pub similarity: f32,
+    /// Content of the related memory.
+    pub content: String,
+    /// Existing truth value of the related memory (if scored).
+    pub truth_value: Option<f32>,
+    /// Existing confidence of the related memory (if scored).
+    pub truth_confidence: Option<f32>,
+}
+
+/// Result of scoring a single memory.
+#[derive(Debug, Clone)]
+pub struct ScoringResult {
+    pub truth_value: f32,
+    pub truth_confidence: f32,
+    pub category: TruthCategory,
+    pub ecan_sti: f32,
+    pub ecan_lti: f32,
+    pub confirmation_count: usize,
+    pub contradiction_count: usize,
+}
+
+/// Determine whether two pieces of content are contradictory.
+///
+/// This uses a heuristic approach: if two memories are semantically similar
+/// (high cosine similarity) but contain negation patterns, they likely
+/// contradict each other.
+///
+/// A more sophisticated implementation could use an NLI model, but this
+/// provides a reasonable baseline.
+fn is_contradiction(candidate_content: &str, related_content: &str, similarity: f32) -> bool {
+    // High similarity is required — unrelated content can't contradict
+    if similarity < 0.6 {
+        return false;
+    }
+
+    let negation_markers = [
+        "not ", "never ", "no ", "false", "incorrect", "wrong",
+        "isn't", "aren't", "wasn't", "weren't", "don't", "doesn't",
+        "didn't", "won't", "wouldn't", "shouldn't", "couldn't",
+        "cannot", "can't", "unlikely", "impossible", "untrue",
+    ];
+
+    let candidate_lower = candidate_content.to_lowercase();
+    let related_lower = related_content.to_lowercase();
+
+    let candidate_negations = negation_markers
+        .iter()
+        .filter(|m| candidate_lower.contains(*m))
+        .count();
+    let related_negations = negation_markers
+        .iter()
+        .filter(|m| related_lower.contains(*m))
+        .count();
+
+    // If one has significantly more negation markers than the other,
+    // and they're semantically similar, it suggests contradiction.
+    let negation_diff = (candidate_negations as i32 - related_negations as i32).unsigned_abs();
+
+    // Contradiction if: high similarity + asymmetric negation
+    negation_diff >= 1 && similarity >= 0.7
+}
+
+/// Score a memory against its related memories.
+///
+/// This is the core scoring function that:
+/// 1. Classifies related memories as confirmations or contradictions
+/// 2. Builds PLN truth values for each
+/// 3. Applies evidence-based scoring
+/// 4. Computes ECAN attention values
+/// 5. Categorizes the result
+pub fn score_memory(
+    config: &ScorerConfig,
+    candidate_content: &str,
+    related: &[RelatedMemory],
+    existing_sti: Option<f32>,
+    existing_lti: Option<f32>,
+) -> ScoringResult {
+    // Build base truth value from config
+    let base_tv = TruthValue::new(config.pln_base_confidence, config.pln_base_confidence);
+
+    // Classify related memories
+    let mut confirmations: Vec<TruthValue> = Vec::new();
+    let mut contradictions: Vec<TruthValue> = Vec::new();
+
+    for related_mem in related {
+        let strength = related_mem.truth_value.unwrap_or(0.5);
+        let confidence = related_mem.truth_confidence.unwrap_or(0.3);
+
+        // Scale confidence by similarity — closer matches are stronger evidence
+        let scaled_confidence = confidence * related_mem.similarity;
+
+        let tv = TruthValue::new(strength, scaled_confidence);
+
+        if is_contradiction(candidate_content, &related_mem.content, related_mem.similarity) {
+            contradictions.push(tv);
+        } else if related_mem.similarity >= config.contradiction_threshold {
+            // High similarity + not contradiction = confirmation
+            confirmations.push(tv);
+        }
+        // Memories below contradiction_threshold similarity are ignored
+        // (not similar enough to be meaningful evidence)
+    }
+
+    // Apply PLN evidence-based scoring
+    let scored_tv = pln::score_with_evidence(base_tv, &confirmations, &contradictions);
+
+    // Compute ECAN values
+    let (ecan_sti, ecan_lti) = if let (Some(sti), Some(lti)) = (existing_sti, existing_lti) {
+        // Re-scoring: run ECAN cycle on existing values
+        config.ecan.cycle(sti, lti, scored_tv.strength)
+    } else {
+        // First scoring: initialize from truth value
+        config.ecan.initialize(scored_tv.strength, scored_tv.confidence)
+    };
+
+    // Categorize
+    let category = categorize(
+        scored_tv.strength,
+        &confirmations,
+        &contradictions,
+        config.verification_threshold,
+    );
+
+    ScoringResult {
+        truth_value: scored_tv.strength,
+        truth_confidence: scored_tv.confidence,
+        category,
+        ecan_sti,
+        ecan_lti,
+        confirmation_count: confirmations.len(),
+        contradiction_count: contradictions.len(),
+    }
+}
+
+/// Categorize a scored memory based on its truth value and evidence.
+fn categorize(
+    truth_value: f32,
+    confirmations: &[TruthValue],
+    contradictions: &[TruthValue],
+    verification_threshold: f32,
+) -> TruthCategory {
+    if !contradictions.is_empty() {
+        return TruthCategory::Contradicted;
+    }
+    if truth_value >= verification_threshold && !confirmations.is_empty() {
+        return TruthCategory::Verified;
+    }
+    if truth_value >= 0.5 {
+        return TruthCategory::Plausible;
+    }
+    TruthCategory::Unverified
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    fn default_config() -> ScorerConfig {
+        ScorerConfig::default()
+    }
+
+    #[test]
+    fn score_no_related_memories() {
+        let config = default_config();
+        let result = score_memory(&config, "test claim", &[], None, None);
+
+        // With no evidence, should get base confidence as plausible
+        assert!(result.truth_value > 0.0);
+        assert!(result.truth_confidence > 0.0);
+        assert_eq!(result.category, TruthCategory::Plausible);
+        assert_eq!(result.confirmation_count, 0);
+        assert_eq!(result.contradiction_count, 0);
+    }
+
+    #[test]
+    fn score_with_confirmations_boosts_truth() {
+        let config = default_config();
+        let related = vec![
+            RelatedMemory {
+                similarity: 0.92,
+                content: "supporting evidence".to_string(),
+                truth_value: Some(0.9),
+                truth_confidence: Some(0.8),
+            },
+            RelatedMemory {
+                similarity: 0.88,
+                content: "more support".to_string(),
+                truth_value: Some(0.85),
+                truth_confidence: Some(0.7),
+            },
+        ];
+
+        let result = score_memory(&config, "verified claim", &related, None, None);
+
+        assert!(result.confirmation_count >= 1);
+        assert_eq!(result.contradiction_count, 0);
+        assert_eq!(result.category, TruthCategory::Verified);
+    }
+
+    #[test]
+    fn score_with_contradiction_detected() {
+        let config = default_config();
+        let related = vec![RelatedMemory {
+            similarity: 0.85,
+            content: "This is not true and incorrect".to_string(),
+            truth_value: Some(0.8),
+            truth_confidence: Some(0.7),
+        }];
+
+        let result = score_memory(
+            &config,
+            "This is true and correct",
+            &related,
+            None,
+            None,
+        );
+
+        assert!(result.contradiction_count >= 1);
+        assert_eq!(result.category, TruthCategory::Contradicted);
+    }
+
+    #[test]
+    fn score_with_existing_ecan_runs_cycle() {
+        let config = default_config();
+        let result = score_memory(
+            &config,
+            "existing memory",
+            &[],
+            Some(0.8),
+            Some(0.5),
+        );
+
+        // ECAN cycle should decay STI
+        assert!(result.ecan_sti < 0.8, "STI should decay: {}", result.ecan_sti);
+        assert!(result.ecan_sti > 0.0);
+        assert!(result.ecan_lti > 0.0);
+    }
+
+    #[test]
+    fn score_first_time_initializes_ecan() {
+        let config = default_config();
+        let result = score_memory(&config, "new memory", &[], None, None);
+
+        // ECAN should be initialized from truth value
+        assert!(result.ecan_sti > 0.0, "STI should be initialized");
+        assert!(result.ecan_lti >= 0.0, "LTI should be initialized");
+    }
+
+    #[test]
+    fn categorize_verified() {
+        let cat = categorize(
+            0.9,
+            &[TruthValue::new(0.8, 0.7)],
+            &[],
+            0.8,
+        );
+        assert_eq!(cat, TruthCategory::Verified);
+    }
+
+    #[test]
+    fn categorize_plausible() {
+        let cat = categorize(0.6, &[], &[], 0.8);
+        assert_eq!(cat, TruthCategory::Plausible);
+    }
+
+    #[test]
+    fn categorize_unverified() {
+        let cat = categorize(0.3, &[], &[], 0.8);
+        assert_eq!(cat, TruthCategory::Unverified);
+    }
+
+    #[test]
+    fn categorize_contradicted_takes_priority() {
+        // Even with high truth value, contradictions = contradicted
+        let cat = categorize(
+            0.95,
+            &[TruthValue::new(0.9, 0.8)],
+            &[TruthValue::new(0.7, 0.6)],
+            0.8,
+        );
+        assert_eq!(cat, TruthCategory::Contradicted);
+    }
+
+    #[test]
+    fn is_contradiction_negation_asymmetry() {
+        assert!(is_contradiction(
+            "The sky is blue",
+            "The sky is not blue",
+            0.85,
+        ));
+        assert!(!is_contradiction(
+            "The sky is blue",
+            "The ocean is blue",
+            0.80,
+        ));
+    }
+
+    #[test]
+    fn is_contradiction_low_similarity_returns_false() {
+        assert!(!is_contradiction(
+            "Apples are healthy",
+            "Cars are not fast",
+            0.3,
+        ));
+    }
+
+    #[test]
+    fn scoring_result_bounded() {
+        let config = default_config();
+        let result = score_memory(&config, "test", &[], None, None);
+
+        assert!(result.truth_value >= 0.0 && result.truth_value <= 1.0);
+        assert!(result.truth_confidence >= 0.0 && result.truth_confidence <= 1.0);
+        assert!(result.ecan_sti >= 0.0 && result.ecan_sti <= 1.0);
+        assert!(result.ecan_lti >= 0.0 && result.ecan_lti <= 1.0);
+    }
+
+    #[test]
+    fn truth_category_display() {
+        assert_eq!(TruthCategory::Verified.as_str(), "verified");
+        assert_eq!(TruthCategory::Plausible.as_str(), "plausible");
+        assert_eq!(TruthCategory::Unverified.as_str(), "unverified");
+        assert_eq!(TruthCategory::Contradicted.as_str(), "contradicted");
+    }
+}