{
  "model": "x-ai/grok-4.1-fast",
  "date": "2026-05-13",
  "run_id": "2026-05-13T10-10-56-382Z",
  "judge_model": "google/gemini-2.5-flash:online",
  "specificity_judge": "google/gemini-2.5-flash",
  "overall": {
    "verifiability": 78,
    "specificity": 75,
    "currency": 70,
    "coverage": 96,
    "composite": 79,
    "n_signals_total": 192,
    "n_briefs": 12
  },
  "briefs": [
    {
      "brief_id": "healthcare-regulated-ai",
      "scores": {
        "verifiability": 76,
        "specificity": 69,
        "currency": 83,
        "coverage": 97,
        "composite": 78,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Clinical",
          "title": "AI Diagnostic Bias Exposed",
          "summary": "Clinical trials expose racial bias in AI diagnostic tools at 18% error rate. Indicates inequities in patient care outcomes.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2026-02-02",
          "judge_comments": "While racial bias in AI diagnostic tools is a well-documented concern, a specific, quantifiable 18% error rate exposed in clinical trials was not found.",
          "spec_comments": "Concrete actor and event (clinical trials, AI tools, 18%), but 'racial bias' is an interpretation, not a directly observed shift.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Clinical",
          "title": "AI Triage Errors Increase",
          "summary": "Emergency studies record 22% error rates in AI triage systems. Signals reliance risks on automated assessments.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-03-16",
          "judge_comments": "Multiple sources confirm AI triage error rates, particularly undertriage of urgent cases, raising safety concerns for regulated healthcare.",
          "spec_comments": "Concrete actor, event, and quantifiable anchor present. Minor fill word deduction.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Clinical",
          "title": "Adverse Events from AI Rx",
          "summary": "US hospitals report adverse events tied to AI prescriptions in 12% cases. Indicates oversight gaps in treatment plans.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-04-21",
          "judge_comments": "No evidence found to support '12% cases' of adverse events from AI prescriptions in US hospitals. Sources indicate early pilots with strict oversight.",
          "spec_comments": "Concrete actor US hospitals and event adverse events, with quantitative anchor 12%.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Clinical",
          "title": "AI Tool Validation Fails",
          "summary": "Audits reveal 28% failure in post-market AI clinical validations. Signals demands for real-time monitoring.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 70,
          "newest_source_date": "2025-11-06",
          "judge_comments": "No direct audit finding of '28% failure' in post-market AI clinical validations was found. The signal for real-time monitoring is grounded.",
          "spec_comments": "Concrete actor, event, and quantitative anchor. Passive language in first sentence.",
          "sources": []
        },
        {
          "index": 4,
          "category": "Regulatory",
          "title": "EU AI Act Device Rules",
          "summary": "EU AI Act mandates pre-market assessments for high-risk medical AI. Indicates prolonged approval timelines.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-05-07",
          "judge_comments": "The EU AI Act mandates pre-market assessment for high-risk medical AI, layering on top of existing MDR requirements, delaying timelines.",
          "spec_comments": "Concrete actor, event, and shift. Lacks quantitative/temporal anchor, uses some vague phrasing.",
          "sources": []
        },
        {
          "index": 5,
          "category": "Regulatory",
          "title": "FDA AI Lifecycle Guidance",
          "summary": "FDA issues guidance requiring ongoing AI/ML performance monitoring. Signals shift from static approvals.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 75,
          "currency_score": 50,
          "newest_source_date": "2025-01-07",
          "judge_comments": "FDA draft guidance emphasizes ongoing performance monitoring for AI-enabled medical devices throughout their lifecycle. This signals a shift toward dynamic oversight.",
          "spec_comments": "Concrete actor/event, active voice. Lacks quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Regulatory",
          "title": "US State AI Restrictions",
          "summary": "Five states pass laws limiting AI in clinical decisions. Indicates patchwork compliance burdens.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-26",
          "judge_comments": "Multiple sources confirm at least six states have enacted laws prohibiting AI as the sole basis for healthcare claim denials, with more pending. This creates a compliance patchwork.",
          "spec_comments": "Concrete actor, event, and quantitative anchor. Lacks present tense active voice in second sentence.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Regulatory",
          "title": "EMA Algorithm Disclosures",
          "summary": "EMA enforces full disclosure of AI algorithms in approvals. Signals transparency over proprietary tech.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2026-01-14",
          "judge_comments": "EMA/FDA established principles for AI in medicine. Disclosure isn't explicitly 'full disclosure of algorithms' but points towards transparency and adherence to standards.",
          "spec_comments": "Names actor and product, but 'full disclosure' and 'signals transparency' are somewhat vague and lack quantitative or temporal anchors.",
          "sources": []
        },
        {
          "index": 8,
          "category": "Operational",
          "title": "AI Integration Budget Overruns",
          "summary": "Networks exceed AI integration budgets by 35% on average. Indicates strain on resource allocation.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 75,
          "currency_score": 0,
          "judge_comments": "No direct evidence found for 'AI Integration Budget Overruns by 35% on average' in healthcare systems within the provided search results. Budget increases are noted, but not specific overruns.",
          "spec_comments": "Concrete actor ('Networks'), event ('exceed AI integration budgets'), and quantitative anchor (35% on average). No hype or vague forecasts.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Operational",
          "title": "Clinician Resistance to AI",
          "summary": "Surveys capture 55% clinician pushback against AI tools. Signals workflow disruption potentials.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 75,
          "currency_score": 100,
          "newest_source_date": "2026-03-12",
          "judge_comments": "No source directly states 55% clinician pushback. Some surveys indicate hesitancy/reservations regarding AI, but not outright 'pushback' at this level.",
          "spec_comments": "Concrete actor, quantitative anchor, active voice. Lacks specific product/event.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Operational",
          "title": "AI System Outage Impacts",
          "summary": "Pilot hospitals log 12% operational downtime from AI failures. Indicates dependency vulnerabilities.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 100,
          "newest_source_date": "2026-03-10",
          "judge_comments": "No specific reports of AI system outages causing EHR downtime found in reputable sources. Broader trend of AI integration in EHRs is documented.",
          "spec_comments": "Concrete actors, events, and a temporal anchor are present. Excellent specificity.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Operational",
          "title": "Single Vendor AI Lock-in",
          "summary": "Hospitals commit to one AI vendor in 70% implementations. Signals reduced operational agility.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 20,
          "currency_score": 100,
          "newest_source_date": "2026-03-24",
          "judge_comments": "While single-vendor dominance is discussed for EHRs and AI is growing, the 70% figure for AI lock-in is not confirmed.",
          "spec_comments": "No specific actor, event, or anchor. Uses general terms like 'hospitals' and 'single AI vendors'.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Patient Trust",
          "title": "AI Platform Data Breaches",
          "summary": "Breaches from AI systems expose 400k patient records yearly. Indicates privacy protection shortfalls.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-04-23",
          "judge_comments": "The signal states 400k records yearly. While multiple sources show AI-related breaches, one incident alone impacted 3.1M individuals, making 400k yearly an unlikely specific number.",
          "spec_comments": "Concrete actor and event (AI systems, data breaches) with a quantitative and temporal anchor.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Patient Trust",
          "title": "Patient AI Trust Decline",
          "summary": "Surveys show 32% drop in patient confidence in AI care. Signals consent requirement escalations.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-03-04",
          "judge_comments": "No source indicates a 32% *drop* in patient confidence in AI care. Some surveys show lower trust in AI vs. human care, but not a significant recent decline.",
          "spec_comments": "Concrete actors implied (patients, AI-based diagnostics), quantitative and temporal anchors present.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Patient Trust",
          "title": "Lawsuits on AI Harms",
          "summary": "Courts process 45 claims of harm from AI decisions. Indicates accountability pressures on providers.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-25",
          "judge_comments": "Multiple lawsuits concerning AI-led denial of care are surfacing in the US, indicating growing accountability pressures. Exact count of 45 claims is unverified by the provided sources.",
          "spec_comments": "Concrete actor (courts), quantifiable event (45 claims), but lacks specific companies or types of AI harm.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Patient Trust",
          "title": "AI Consent Rejections Rise",
          "summary": "Patients decline 27% of AI-involved consent forms. Signals trust barriers in adoption.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 30,
          "newest_source_date": "2024-05-13",
          "judge_comments": "No evidence found to support the specific claim of 27% rejections. Public trust is a concern, but the figure is unverified.",
          "spec_comments": "Concrete actors implied (patients, AI-based diagnostics), quantitative and temporal anchors present.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "fintech-stablecoin-rails",
      "scores": {
        "verifiability": 84,
        "specificity": 84,
        "currency": 70,
        "coverage": 94,
        "composite": 83,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Regulatory",
          "title": "EU MiCA Stablecoin Rules",
          "summary": "EU applies MiCA regulation to stablecoins since June 2024. Issuers hold 1:1 reserves and obtain authorization. Signals heightened compliance for euro stablecoins in payments.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 30,
          "newest_source_date": "2024-06-30",
          "judge_comments": "MiCA mandates 1:1 liquid, segregated reserves for EU stablecoins, requiring authorization for issuance and distribution. Compliance for cross-border settlement is operational reality.",
          "spec_comments": "Concrete actor (EU, MiCA), specific mandates, and a temporal anchor ('now mandates').",
          "sources": []
        },
        {
          "index": 1,
          "category": "Regulatory",
          "title": "Hong Kong Stablecoin Sandbox",
          "summary": "Hong Kong Monetary Authority launches stablecoin issuer sandbox in 2024. Participants meet reserve and disclosure standards. Indicates regulatory paths for Asia-Pacific cross-border rails.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 90,
          "currency_score": 10,
          "newest_source_date": "2024-03-12",
          "judge_comments": "HKMA launched a stablecoin issuer sandbox on March 12, 2024. Participants must have a reasonable business plan and operate within limited, risk-controllable scope.",
          "spec_comments": "Concrete actor, event, and temporal anchor. No vague language or hype. Strong specificity.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Regulatory",
          "title": "Singapore MAS Payment Licenses",
          "summary": "MAS grants major payment institution licenses to stablecoin platforms in 2024. Licensees comply with AML and reserve rules. Signals approved fiat-backed tokens for settlements.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-01",
          "judge_comments": "MAS has granted licenses to stablecoin issuers (e.g., Paxos) and is actively developing a regulatory framework for stablecoins.",
          "spec_comments": "Concrete actor (MAS), event (grants licenses), and implies temporal (now). Lacks specific company names or numbers.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Regulatory",
          "title": "UK FCA Crypto Asset Rules",
          "summary": "UK FCA finalizes rules for crypto asset promotions and stablecoins in 2024. Firms register and segregate client assets. Indicates structured oversight for sterling payment rails.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 85,
          "newest_source_date": "2026-02-06",
          "judge_comments": "The FCA has not finalized stablecoin rules in 2024. They published proposals, and final rules are expected in 2026. The claim of finalization is incorrect.",
          "spec_comments": "Concrete actor (UK FCA), event (finalizes rules), and temporal anchor (2024), active voice.",
          "sources": []
        },
        {
          "index": 4,
          "category": "Infrastructure",
          "title": "Swift CBDC Interlink Pilot",
          "summary": "Swift tests CBDC interoperability with over 30 central banks since 2024. Platform links tokenized deposits across ledgers. Signals unified settlement layers for cross-border flows.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 30,
          "newest_source_date": "2024-11-05",
          "judge_comments": "Swift has conducted multiple phases of CBDC interlinking pilots, with over 30 institutions participating, demonstrating technical feasibility and exploring use cases.",
          "spec_comments": "Concrete actor, event, and temporal anchor. Good use of active voice.",
          "sources": []
        },
        {
          "index": 5,
          "category": "Infrastructure",
          "title": "Visa USDC Settlement Network",
          "summary": "Visa enables USDC settlements on Solana and Ethereum blockchains in 2024. Merchants receive fiat conversions instantly. Indicates blockchain integration into card rails.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 85,
          "newest_source_date": "2025-12-16",
          "judge_comments": "Visa is settling USDC on Solana for issuer/acquirer partners and merchant payments. Public blockchain integration is happening.",
          "spec_comments": "Concrete actor (Visa), event (settlement), specific tech (USDC, Solana). Active voice. No hype.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Infrastructure",
          "title": "JPM Onyx Blockchain Expansion",
          "summary": "JPMorgan scales Onyx platform to $1B daily tokenized deposit volume in 2024. Network supports 24/7 cross-border payments. Signals bank-led alternatives to legacy systems.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-05-13",
          "judge_comments": "JPMorgan's Kinexys (formerly Onyx) is actively expanding its tokenization platform with cross-border settlement features, as evidenced by multiple collaborative initiatives and new product filings.",
          "spec_comments": "Concrete actor, product, and action with a clear signal. 'Established banks' is slightly vague.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Infrastructure",
          "title": "Ripple XRP Ledger Upgrades",
          "summary": "Ripple upgrades XRP Ledger with automated market makers in 2024. Features enable stablecoin liquidity pools. Indicates efficient rails for unbundled settlements.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-03-16",
          "judge_comments": "XLS-30 AMM launched on XRPL in March 2024. This enables stablecoin liquidity pools for efficient, unbundled cross-border settlement.",
          "spec_comments": "Concrete actor (Ripple), event (upgrades), product (XRPL), and temporal anchor (2024).",
          "sources": []
        },
        {
          "index": 8,
          "category": "Competitive",
          "title": "PayPal PYUSD Stablecoin Launch",
          "summary": "PayPal issues PYUSD stablecoin on Ethereum since 2023 with $200M circulation. Users redeem via app for remittances. Signals fintech entry into dollar-pegged rails.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-17",
          "judge_comments": "PayPal launched PYUSD in 2023, expanding its availability globally by March 2026. It's integrated into Xoom and Arbitrum for payments and cross-border transfers. PYUSDx allows developers to build PYUSD-backed stablecoins.",
          "spec_comments": "Concrete actor (PayPal), event (introduces PYUSD stablecoin), and purpose (payments and transfers on its platform).",
          "sources": []
        },
        {
          "index": 9,
          "category": "Competitive",
          "title": "Stripe Bridge Acquisition",
          "summary": "Stripe acquires Bridge stablecoin platform in 2024. Acquisition accelerates USDC payouts to developers. Indicates payment processors building crypto settlement stacks.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 95,
          "currency_score": 50,
          "newest_source_date": "2025-02-04",
          "judge_comments": "Stripe acquired Bridge for $1.1B. Bridge's tech enables stablecoin-based cross-border payments, unbundling traditional bank settlement.",
          "spec_comments": "Concrete actor, event, amount, date; active voice. \"Signals that\" is a slight deduction.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Competitive",
          "title": "Circle USDC Enterprise Adoption",
          "summary": "Circle signs 100 enterprises for USDC cross-border payments in 2024. Volume reaches $500B annually. Signals stablecoin dominance in B2B transfers.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 70,
          "newest_source_date": "2025-08-06",
          "judge_comments": "While Circle's USDC is actively integrated into major payment networks and cross-border solutions, the specific claim of 100 enterprise sign-ups in 2024 and $500B annual volume is not directly verified by the provided sources.",
          "spec_comments": "Concrete actor, event, quantitative/temporal anchors. Active voice. 'Dominance' is a soft claim.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Competitive",
          "title": "Revolut Crypto Payment Rails",
          "summary": "Revolut integrates stablecoins for instant EEA transfers since 2024. Service processes 1M monthly transactions. Indicates neobank challenge to bank wires.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 90,
          "currency_score": 85,
          "newest_source_date": "2025-11-18",
          "judge_comments": "Revolut services in UK/EEA use Polygon since Dec 2024 for stablecoin remittances; processed over $1.2B by Nov 2025. This challenges traditional bank wires with low fees and instant settlement.",
          "spec_comments": "Concrete actor, product, temporal anchor, and quantitative data. Minimal filler.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Consumer Behavior",
          "title": "Stablecoin Remittance Surge",
          "summary": "Argentinians transact $100B in stablecoins yearly via exchanges. Users bypass inflation with dollar pegs. Signals preference for crypto rails in high-inflation zones.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 75,
          "currency_score": 70,
          "newest_source_date": "2025-09-01",
          "judge_comments": "No source supports $100B in yearly stablecoin transactions in Argentina. Multiple sources indicate significant, but lower, transaction volumes and preference for stablecoins.",
          "spec_comments": "Concrete actor, quantitative anchor, and effect, but lacks specific timeframe for 'yearly' and uses some filler.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Consumer Behavior",
          "title": "USDC P2P Transfer Growth",
          "summary": "USDC peer-to-peer volume doubles to $300B in 2024 on wallets. Senders favor instant global sends. Indicates shift from apps to blockchain wallets.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 50,
          "newest_source_date": "2025-01-14",
          "judge_comments": "The signal claims USDC P2P volume doubled to $300B in 2024. While overall USDC transaction volume is high, there's no specific mention of P2P volume or the $300B figure in the provided sources. The growth of USDC and its accessibility, particularly in payment applications, suggests this is plausible, but the specific claim is unverified.",
          "spec_comments": "Concrete actor, event, quantitative/temporal anchor, active voice. 'Wallets' could be more specific.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Consumer Behavior",
          "title": "DeFi Lending Stablecoin Use",
          "summary": "Users lock $50B USDT and USDC in DeFi protocols monthly. Borrowers access yields without banks. Signals demand for programmable payment alternatives.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-04-07",
          "judge_comments": "$50B monthly specific figure not found, but broader trend of stablecoins in DeFi lending is well-documented.",
          "spec_comments": "Concrete actors (USDT, USDC, DeFi protocols), quantitative anchor ($50B), and active voice support a high score.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Consumer Behavior",
          "title": "Venmo Crypto Remittance Trial",
          "summary": "Venmo users send PYUSD for cross-border gifts since 2024. Feature logs 500K transactions monthly. Indicates social app evolution into global rails.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 50,
          "newest_source_date": "2024-11-19",
          "judge_comments": "No evidence of a Venmo cross-border remittance trial. PYUSD is available on Venmo, but for transfers, not specifically for cross-border remittances via Venmo.",
          "spec_comments": "Concrete actor, event, and quantifiable data are strong. Active voice used.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "defense-autonomous-systems",
      "scores": {
        "verifiability": 82,
        "specificity": 71,
        "currency": 77,
        "coverage": 100,
        "composite": 81,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Doctrine",
          "title": "USAF Human-on-Loop Guidelines",
          "summary": "USAF publishes guidelines allowing supervised autonomous target engagement by drones. Signals doctrinal shift toward semi-autonomous systems in air operations.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-02-25",
          "judge_comments": "DoD Directive 3000.09 and AFDN 25-1 both outline policies for autonomous weapon systems and human-machine teaming in air operations, indicating a doctrinal shift.",
          "spec_comments": "Concrete actor, event, and shift. Lacks quantitative/temporal anchor, uses 'signals doctrinal shift'.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Doctrine",
          "title": "PLA Swarm Tactics Manual",
          "summary": "PLA releases manual detailing drone swarm deployment in anti-access scenarios. Indicates incorporation of swarm tactics into core warfighting doctrine.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-03-26",
          "judge_comments": "PLA strategic documents laud uncrewed systems but lack specific details on swarm tactics or MUM-T. No manual found.",
          "spec_comments": "Concrete actor and event, active voice, measurable shift, but lacks quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Doctrine",
          "title": "NATO LAWS Policy Framework",
          "summary": "NATO updates framework for lethal autonomous weapons system oversight. Signals harmonization of alliance rules on drone autonomy employment.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-02-17",
          "judge_comments": "While NATO is actively exploring autonomous systems, there's no direct evidence of a newly updated framework for lethal autonomous weapons system oversight or harmonized alliance rules on drone autonomy employment mentioned as of late 2025/early 2026.",
          "spec_comments": "Concrete actor (NATO), event (updates framework), and product (LAWS). Lacks a quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Doctrine",
          "title": "IDF Drone ROE Revisions",
          "summary": "IDF revises rules of engagement to permit autonomous drone loitering munitions. Indicates evolution in urban warfare doctrine for high-threat zones.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-01-08",
          "judge_comments": "While Israel is developing autonomous loitering munitions and AI for drone warfare, no sources specifically confirm revised IDF ROE permitting autonomous loitering munitions.",
          "spec_comments": "Concrete actor (IDF); concrete event (revises ROE); specific product type (loitering munitions).",
          "sources": []
        },
        {
          "index": 4,
          "category": "Technology",
          "title": "Shield AI Hivemind Swarm Software",
          "summary": "Shield AI deploys Hivemind software enabling collaborative drone autonomy. Signals advancement in multi-agent AI for contested airspace control.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-24",
          "judge_comments": "Multiple sources confirm Shield AI's Hivemind enables autonomous, collaborative drone operations. It is also selected for the US Air Force CCA program.",
          "spec_comments": "Good actor and product, but 'advancement' is vague. Needs a quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 5,
          "category": "Technology",
          "title": "DARPA Gremlins Air Recovery Tech",
          "summary": "DARPA demonstrates Gremlins system recovering and reusing drone swarms mid-mission. Indicates maturation of expendable swarm recovery capabilities.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 10,
          "newest_source_date": "2021-11-15",
          "judge_comments": "DARPA successfully demonstrated airborne recovery of a Gremlins drone to a C-130, and the drone was refurbished and flown again within 24 hours. This marks a critical step towards reusable drone swarms.",
          "spec_comments": "Concrete actor, product, and measurable shift. Minimal hype.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Technology",
          "title": "Skydio X10 Autonomy Kit",
          "summary": "Skydio releases X10 kit with AI for fully autonomous drone navigation. Signals commercial viability of obstacle-avoiding drone tech.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 10,
          "newest_source_date": "2024-02-27",
          "judge_comments": "Skydio X10 and X10D feature onboard AI for autonomous flight and obstacle avoidance, including NightSense for zero-light environments.",
          "spec_comments": "Concrete actor, product, and active voice. 'Commercial viability' lacks a timeline or quantitative anchor.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Technology",
          "title": "Teledyne FLIR Prism AI Sensor",
          "summary": "Teledyne FLIR integrates Prism AI into drone sensors for target identification. Indicates fusion of edge AI with electro-optical systems.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-04-28",
          "judge_comments": "Multiple reputable sources confirm Teledyne FLIR's Prism AI, including SKR and C-UAS, integrates edge AI for target recognition in various drone systems.",
          "spec_comments": "Concrete actor/product. Lacks quantitative/temporal anchor. Uses present tense, active voice. No deductions.",
          "sources": []
        },
        {
          "index": 8,
          "category": "Geopolitical",
          "title": "BIS Tightens Drone AI Exports",
          "summary": "US BIS amends export rules restricting drone AI algorithms to adversaries. Signals escalation in controls over dual-use autonomy software.",
          "verdict": "fabricated",
          "verifiability_score": 20,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-02-19",
          "judge_comments": "The Bureau of Industry and Security (BIS) recently *eased* export controls on certain civil UAVs, not tightened them regarding AI.",
          "spec_comments": "Concrete actor, action, and target. 'Escalation' is slightly vague but overall strong.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Geopolitical",
          "title": "China Wing Loong Sales to UAE",
          "summary": "China delivers Wing Loong II armed drones to UAE military. Indicates expansion of Chinese drone influence in Middle East alliances.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-04-15",
          "judge_comments": "The UAE has operated Wing Loong I and II UAVs. China's drone influence in the Middle East is well-documented.",
          "spec_comments": "Concrete actor/event/product, but lacks temporal and quantitative anchors beyond 'sales'.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Geopolitical",
          "title": "EU Proposals for Drone Bans",
          "summary": "EU Commission proposes bans on high-risk drone exports to non-allies. Signals emerging transatlantic consensus on dual-use restrictions.",
          "verdict": "future",
          "verifiability_score": 75,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2026-02-11",
          "judge_comments": "The EU is strengthening export controls on dual-use items, including drones. This reflects a trend towards restricting sensitive technologies from non-allies. The specific proposal for 'bans' hasn't been codified yet, making it future-looking.",
          "spec_comments": "Concrete actor, action, and subject. 'Emerging consensus' is a very mild deduction.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Geopolitical",
          "title": "Iran Shahed Drone Transfers",
          "summary": "Iran supplies Shahed-136 drones to proxy forces in multiple theaters. Indicates proliferation of low-cost autonomous loitering munitions.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-11",
          "judge_comments": "Iran has supplied Shahed drones to various actors, including Russia, and now Russia is sending upgraded variants back to Iran. The widespread use across multiple theaters is well-documented.",
          "spec_comments": "Names actor and product, but 'proxy forces' and 'multiple theaters' lack specificity. 'Indicates' is weak.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Industrial Base",
          "title": "Anduril Roadrunner Production Scale",
          "summary": "Anduril doubles Roadrunner drone production lines for US customers. Signals ramp-up in domestic reusable autonomous munition capacity.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-03-28",
          "judge_comments": "Anduril is planning Roadrunner production at Arsenal-1 by year-end, which includes 500 units for DoD, but a 'doubling of production lines' is not explicitly confirmed.",
          "spec_comments": "Concrete actor, product, and specific action with a quantitative anchor. Avoids hype.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Industrial Base",
          "title": "Ukraine FPV Drone Factories",
          "summary": "Ukraine opens new factories producing FPV guidance kits for drones. Indicates localization of drone component manufacturing amid conflict.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-03-16",
          "judge_comments": "No direct evidence of new 'factories' specifically for FPV guidance kits. Localization of drone component manufacturing is underway.",
          "spec_comments": "Concrete actor, event. Lacks specific quantity or exact time. Active voice for the most part.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Industrial Base",
          "title": "AeroVironment Switchblade Contracts",
          "summary": "AeroVironment secures contracts expanding Switchblade loitering munition output. Signals surge in US industrial output for tube-launched autonomy.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-02-26",
          "judge_comments": "AeroVironment has secured multiple contracts for Switchblade systems, expanding its U.S. Army commitments and production capacity.",
          "spec_comments": "Concrete actor/product. Lacks quantitative/temporal anchor. 'Surge' is vague.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Industrial Base",
          "title": "DJI Dual-Use Component Shift",
          "summary": "DJI reallocates civilian drone components to defense-qualified production. Indicates pivot in commercial base toward military autonomous systems.",
          "verdict": "fabricated",
          "verifiability_score": 20,
          "specificity_score": 65,
          "currency_score": 30,
          "newest_source_date": "2024-07-31",
          "judge_comments": "DJI explicitly states its products are for civilian use only and has never designed or sold military-grade equipment. It complies with export controls to prevent military use.",
          "spec_comments": "Concrete actor and shift mentioned. Lacks a temporal or quantitative anchor, and uses some vague terms like 'pivot'.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "climate-adaptation-capital",
      "scores": {
        "verifiability": 55,
        "specificity": 86,
        "currency": 66,
        "coverage": 100,
        "composite": 73,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Policy",
          "title": "California Rate Hike Approvals",
          "summary": "California regulators approve average 20% property insurance rate increases. Increases address wildfire and flood claim surges.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-05-12",
          "judge_comments": "The signal states an average 20% increase, which contradicts the information from the web search that shows a 1.5% average increase for Farmers and a 17% increase for State Farm, and rate reductions for some policy types.",
          "spec_comments": "Concrete actor, event, and quantitative anchor. No hype or vague quantifiers.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Policy",
          "title": "Florida Non-Renewal Caps",
          "summary": "Florida legislature enacts law limiting annual policy non-renewals to 10%. Law counters 1 million dropped homeowner policies.",
          "verdict": "fabricated",
          "verifiability_score": 20,
          "specificity_score": 90,
          "currency_score": 30,
          "newest_source_date": "2024-05-13",
          "judge_comments": "Florida legislation (HB 1611) limits non-renewals for hurricane damage, but does not cap overall non-renewals at 10%. Insurer-initiated non-renewals are much higher.",
          "spec_comments": "Concrete actor, specific event, and quantitative anchors are strong. 'Dropped policies' is slightly past tense.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Policy",
          "title": "EU Adaptation Funding Rule",
          "summary": "EU mandates 40% of climate finance targets adaptation measures. Rule applies to national recovery and resilience plans.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2026-01-27",
          "judge_comments": "No direct evidence of a *mandated 40% target for adaptation measures* in EU climate finance, though adaptation finance is increasing.",
          "spec_comments": "Concrete actor and measurable shift, but lacks a temporal anchor beyond \"applies\".",
          "sources": []
        },
        {
          "index": 3,
          "category": "Policy",
          "title": "World Bank Adaptation Loans",
          "summary": "World Bank disburses $10 billion in loans for adaptation infrastructure. Loans prioritize vulnerable developing countries.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 75,
          "currency_score": 100,
          "newest_source_date": "2026-03-04",
          "judge_comments": "The World Bank actively funds climate adaptation projects, especially in vulnerable countries, but a specific $10 billion disbursement for this purpose is not explicitly stated in the provided documents.",
          "spec_comments": "Concrete actor, quantitative anchor, and specific action. 'Vulnerable developing countries' is a slight deduction.",
          "sources": []
        },
        {
          "index": 4,
          "category": "Capital Markets",
          "title": "Adaptation Green Bond Surge",
          "summary": "Market issues $5 billion in bonds financing coastal defenses and water systems. Bonds attract institutional investors.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 90,
          "currency_score": 70,
          "newest_source_date": "2025-10-10",
          "judge_comments": "While a specific $5 billion bond issue isn't found, the trend of adaptation-focused bonds, especially for water infrastructure and coastal protection, is well-documented and growing.",
          "spec_comments": "Concrete actor (market, institutional investors), specific event (issues), temporal anchor ($5 billion).",
          "sources": []
        },
        {
          "index": 5,
          "category": "Capital Markets",
          "title": "Munich Re Stock Drop",
          "summary": "Munich Re shares decline 15% after Q2 catastrophe losses exceed $2 billion. Losses include US storms and floods.",
          "verdict": "fabricated",
          "verifiability_score": 20,
          "specificity_score": 95,
          "currency_score": 100,
          "newest_source_date": "2026-05-13",
          "judge_comments": "Munich Re's Q1 2026 results show significantly lower major loss expenditure, contradicting a Q2 $2 billion catastrophe loss, and the stock did not drop 15%.",
          "spec_comments": "Concrete actor, quantitative anchored event in active voice. Minor deduction for 'US storms and floods' not fully specific.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Capital Markets",
          "title": "Physical Risk Premium Index",
          "summary": "S&P Global launches index measuring climate risk premiums across 500 insurers. Index benchmarks repricing trends.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-02-17",
          "judge_comments": "S&P Global and Verisk collaborate. No mention of an 'S&P Global Physical Risk Premium Index' specifically.",
          "spec_comments": "Concrete actor (S&P Global), concrete event (launches index), and a quantitative anchor (500 insurers) are present.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Capital Markets",
          "title": "Coastal Investment Withdrawals",
          "summary": "Pension funds pull $2 billion from coastal real estate funds. Pullouts cite FEMA flood map updates.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 90,
          "currency_score": 85,
          "newest_source_date": "2026-02-01",
          "judge_comments": "No evidence found to support the specific claim of pension funds pulling $2 billion from coastal real estate funds due to FEMA flood map updates. The concept of withdrawal from at-risk areas is mentioned in relation to insurance, not specifically pension fund real estate investments.",
          "spec_comments": "Concrete actors, specific amount, clear event, and reason for the withdrawal.",
          "sources": []
        },
        {
          "index": 8,
          "category": "Physical Risk",
          "title": "US Flood Claims Increase",
          "summary": "NFIP reports 30% rise in flood claims during 2023 season. Storms drive payouts over $10 billion.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 90,
          "currency_score": 100,
          "newest_source_date": "2026-03-26",
          "judge_comments": "No source verified a 30% rise or $10 billion in NFIP payouts for 2023. One source indicates $8 billion in 2024 damages.",
          "spec_comments": "Concrete actor, specific event, quantitative and temporal anchors, active voice.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Physical Risk",
          "title": "Global Wildfire Area Doubles",
          "summary": "Satellite data show wildfire burned area doubles since 2000 baseline. Canada 2023 season burns 45 million acres.",
          "verdict": "fabricated",
          "verifiability_score": 20,
          "specificity_score": 85,
          "currency_score": 10,
          "newest_source_date": "2024-04-04",
          "judge_comments": "Global burned area is slightly below average (3.9 million km² vs. 2001-2022 average of 384 Mha, which is 3.84 million km²). Canada's 2023 season burned 15 million hectares (37 million acres), not 45 million acres.",
          "spec_comments": "Concrete data (NASA, 2000, 2023, 45m acres), but 'global' could be more precise.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Physical Risk",
          "title": "Sea Level Rise Acceleration",
          "summary": "NASA satellites record 5.2mm annual sea level rise globally. Rise erodes 1,000 km of US coastlines.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 95,
          "currency_score": 10,
          "newest_source_date": "2024-03-26",
          "judge_comments": "Global mean sea level rise was 4.5 mm/year in 2023, doubling since 1993. The US coastlines are facing accelerated rise and increased flooding.",
          "spec_comments": "Concrete actor, specific measurement, temporal anchor, active voice. The 'erodes' part is a bit of a leap.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Physical Risk",
          "title": "Heatwave Excess Deaths Rise",
          "summary": "Europe registers 70,000 excess deaths from 2022 heatwaves per WHO. Mortality rates climb 20% over decade.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 90,
          "currency_score": 70,
          "newest_source_date": "2025-09-22",
          "judge_comments": "The WHO states over 175,000 heat-related deaths annually in the European Region from 2000-2019, not specifically 70,000 in 2022. Other sources cite around 60k-70k for 2022, but not from WHO.",
          "spec_comments": "Concrete actor, event, quantitative/temporal anchors, active voice. Lacks a specific present-tense observation.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Technology",
          "title": "AI Flood Risk Models",
          "summary": "Google AI achieves 90% accuracy in flood forecasting via satellite data. Model covers Southeast Asia rivers.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-03-12",
          "judge_comments": "While Google extensively uses AI and satellite imagery for flood forecasting with reported high accuracy, the specific 90% accuracy figure for Southeast Asia rivers isn't directly stated across sources.",
          "spec_comments": "Concrete actor, specific product/event, quantitative and temporal anchors. Active voice. High specificity.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Technology",
          "title": "Satellite Adaptation Monitoring",
          "summary": "Planet Labs imagery tracks sea wall construction in 20 cities. Data verifies $500 million in projects.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 10,
          "newest_source_date": "2023-05-25",
          "judge_comments": "While Planet Labs uses satellite imagery to monitor climate risks and urban development, there is no specific evidence of them tracking sea wall construction in 20 cities or verifying $500M in projects.",
          "spec_comments": "Concrete actor and event, quantitative anchors, active voice. Lacks specific dates or project names.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Technology",
          "title": "Drone Post-Storm Assessments",
          "summary": "Insurers use drones to survey Hurricane Idalia damage in 48 hours. Surveys cut claims processing time 70%.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 95,
          "currency_score": 10,
          "newest_source_date": "2023-09-04",
          "judge_comments": "Drones used for Idalia damage assessment, but no mention of 70% claims processing time reduction.",
          "spec_comments": "Concrete actor, event, quantitative data, active voice. Excellent specificity.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Technology",
          "title": "Blockchain Finance Tracking",
          "summary": "UN blockchain platform traces $100 million adaptation funds in Kenya. Platform logs disbursements to projects.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 90,
          "currency_score": 70,
          "newest_source_date": "2025-09-26",
          "judge_comments": "The World Bank Group is piloting a blockchain tool, FundsChain, for tracking project funds, not specifically UN or adaptation funds in Kenya.",
          "spec_comments": "Concrete actor, amount, location, and action. \"logs disbursements\" is good specificity.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "retail-genai-commerce",
      "scores": {
        "verifiability": 84,
        "specificity": 60,
        "currency": 78,
        "coverage": 97,
        "composite": 78,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Channels",
          "title": "Google AI Overviews Shopping",
          "summary": "Google embeds shopping actions in AI-generated overviews for product queries. Signals channels consolidate search and purchase in AI interfaces.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2026-02-11",
          "judge_comments": "Google is embedding shopping actions and direct checkout in AI overviews in Search and Gemini, consolidating search and purchase within AI interfaces.",
          "spec_comments": "Concrete actor and action, but 'Signals channels consolidate' is vague and slightly future-tense.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Channels",
          "title": "Amazon Rufus AI Shopper",
          "summary": "Amazon deploys Rufus generative AI to assist product discovery in app. Signals channels integrate conversational AI for direct sales.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-04-01",
          "judge_comments": "Amazon has widely deployed Rufus, its generative AI shopping assistant, which aids product discovery and integrates conversational AI for direct sales and agentic actions.",
          "spec_comments": "Concrete actor (Amazon), product (Rufus), and event (deploys). Lacks a temporal or quantitative anchor.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Channels",
          "title": "TikTok Shop AI Tabs",
          "summary": "TikTok activates AI-curated tabs within Shop for video-based browsing. Signals channels fuse entertainment and commerce via AI.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 65,
          "currency_score": 0,
          "spec_comments": "Concrete actor, event. Lacks a quantitative/temporal anchor or active voice. \"Signals channels fuse\" is generic.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Channels",
          "title": "Pinterest AI Shopping Lenses",
          "summary": "Pinterest launches AI lenses that link pins to instant purchases. Signals channels transform visual search into transactional paths.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 70,
          "newest_source_date": "2025-10-30",
          "judge_comments": "Pinterest has integrated AI-powered visual search tools enabling users to find and purchase look-alike items directly from Pins.",
          "spec_comments": "Names actor (Pinterest), product (AI lenses), and event (launches). Lacks specific quantitative/temporal anchors.",
          "sources": []
        },
        {
          "index": 4,
          "category": "Brand",
          "title": "Nike AI Custom Discovery",
          "summary": "Nike deploys AI agents to generate personalized product narratives. Signals brands control discovery beyond ad platforms.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-05-07",
          "judge_comments": "Nike has deployed AI in its app for personalized search and recommendations. Marqo's Sibbi and Microsoft's Brand Agents also illustrate similar trends in agentic commerce.",
          "spec_comments": "Concrete actor (Nike), event (deploys AI agents), specific action (generate personalized product narratives). Lacks temporal anchor.",
          "sources": []
        },
        {
          "index": 5,
          "category": "Brand",
          "title": "Coca-Cola AI Brand Agents",
          "summary": "Coca-Cola tests AI agents that pitch products in chat interfaces. Signals brands engage consumers directly via AI.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 70,
          "newest_source_date": "2025-08-18",
          "judge_comments": "Coca-Cola uses AI for customer interaction and content creation, but no direct evidence of 'AI brand agents pitching products in chat interfaces'.",
          "spec_comments": "Concrete actor, specific event, and active voice. Lacks a temporal/quantitative anchor.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Brand",
          "title": "Unilever Generative Brand Twins",
          "summary": "Unilever creates digital twins of brands using generative AI. Signals brands redefine identity through AI simulations.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 40,
          "currency_score": 100,
          "newest_source_date": "2026-02-17",
          "judge_comments": "Unilever uses generative AI to create digital twins of products for marketing, improving efficiency and consistency. The partnership with Google will expand this scope.",
          "spec_comments": "No concrete actor beyond company, no quantifiable/temporal anchor. 'Redefine' is subjective, lacks active voice for the core action of the signal.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Brand",
          "title": "Patagonia AI Storytelling Bots",
          "summary": "Patagonia builds AI bots that narrate brand stories on demand. Signals brands bypass media for direct narratives.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 75,
          "currency_score": 85,
          "newest_source_date": "2026-01-08",
          "judge_comments": "While no direct mention of Patagonia AI bots, the trend of brands using AI for storytelling and direct engagement is widespread.",
          "spec_comments": "Concrete actor, specific product/event. Lacks temporal anchor or quantitative insight.",
          "sources": []
        },
        {
          "index": 8,
          "category": "Technology",
          "title": "OpenAI GPT-4o Vision Commerce",
          "summary": "OpenAI's GPT-4o processes images to recommend and compare products. Signals technology enables visual agentic shopping.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-24",
          "judge_comments": "ChatGPT now allows visual browsing, image uploads for similar items, and side-by-side product comparisons to facilitate shopping.",
          "spec_comments": "Concrete actor, product, and function. Lacks explicit quantitative/temporal anchor; 'agentic shopping' is slightly generic.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Technology",
          "title": "Anthropic Claude Tool Use",
          "summary": "Anthropic's Claude integrates APIs for autonomous purchase execution. Signals technology advances agentic commerce capabilities.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-05-12",
          "judge_comments": "Anthropic's Project Deal and Shoppable's MCP server demonstrate Claude's integration with APIs for autonomous purchase execution in real-world scenarios.",
          "spec_comments": "Good actor and function; could benefit from a temporal anchor or specific API examples.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Technology",
          "title": "Perplexity AI Shopping Links",
          "summary": "Perplexity AI appends buy links to conversational product answers. Signals technology merges search with e-commerce.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 70,
          "newest_source_date": "2025-05-14",
          "judge_comments": "Perplexity AI explicitly integrates shopping features, including \"Buy with Pro\" and PayPal checkout, directly into its conversational search, merging discovery and e-commerce.",
          "spec_comments": "Concrete actor, action, and product. Lacks quantitative/temporal anchor, uses some hype.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Technology",
          "title": "xAI Grok Image Shopping",
          "summary": "xAI's Grok analyzes images to source and price similar items. Signals technology supports generative product matching.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 65,
          "currency_score": 70,
          "newest_source_date": "2025-05-20",
          "judge_comments": "No evidence of xAI Grok's image shopping capabilities or 'agentic checkout' features. Other AI models have similar features.",
          "spec_comments": "Names actor (xAI, Grok), concrete event (analyzes images to source/price items), and current function. Lacks quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Consumer Behavior",
          "title": "ChatGPT Custom Shopping GPTs",
          "summary": "Users build GPTs in ChatGPT for personalized deal hunting. Signals consumers delegate discovery to AI agents.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-24",
          "judge_comments": "While ChatGPT is evolving into a shopping platform with agentic commerce, dedicated custom GPTs for 'deal hunting' are not explicitly mentioned yet as a core feature.",
          "spec_comments": "Names actors (ChatGPT, GPTs), and a measurable shift (users building). Lacks quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Consumer Behavior",
          "title": "Consumers Query AI for Outfits",
          "summary": "Shoppers prompt AI with photos for styled purchase lists. Signals consumers adopt agentic workflows for fashion.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 40,
          "currency_score": 85,
          "newest_source_date": "2026-01-29",
          "judge_comments": "AI platforms like FindGPT allow users to upload photos for personalized shopping suggestions and instant purchases. Google also offers virtual try-on with uploaded photos.",
          "spec_comments": "No concrete actor, event, or anchor. \"Shoppers\" is generic. \"Agentic workflows\" is vague.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Consumer Behavior",
          "title": "Reddit Users AI Purchase Agents",
          "summary": "Reddit threads document AI agents completing grocery orders. Signals consumers entrust routine buys to AI.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 10,
          "newest_source_date": "2023-11-20",
          "judge_comments": "Reddit integrates AI answers into its search bar, but there's no evidence of users specifically tasking AI agents within Reddit to complete grocery orders. Instacart has launched an AI integration with ChatGPT, not Reddit.",
          "spec_comments": "Concrete actor (Reddit users), event (document AI agents), but 'signals consumers' is a generic forecast.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Consumer Behavior",
          "title": "X Users Delegate Travel Booking",
          "summary": "X platform users share AI-handled flight and hotel bookings. Signals consumers shift to agentic travel planning.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 30,
          "currency_score": 100,
          "newest_source_date": "2026-04-01",
          "judge_comments": "While specific \"X users\" data isn't available, multiple sources confirm the broader trend of AI handling travel planning and booking, with platforms like Expedia, Booking.com, and eDreams ODIGEO integrating such features. The shift toward agentic commerce in travel is well-documented.",
          "spec_comments": "Vague actors (X platform users), passive voice, generic shift, no quantitative/temporal anchor.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "biotech-platform-shifts",
      "scores": {
        "verifiability": 66,
        "specificity": 84,
        "currency": 76,
        "coverage": 97,
        "composite": 78,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Discovery",
          "title": "AI-Generated GLP-1 Dual Agonists",
          "summary": "Generate:Biomed announces AI platform produces GLP-1/GIP dual agonists with sub-nanomolar potency. Candidates advance to lead optimization phase. Signals expanded tractability of multi-target peptide design.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 85,
          "newest_source_date": "2026-01-20",
          "judge_comments": "While AI is generating GLP-1 candidates, specific mention of Generate:Biomed's dual agonists or lead optimization status is lacking.",
          "spec_comments": "Concrete actor, product, and measurable shift with quantitative anchors. \"Expanded tractability\" is slightly abstract.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Discovery",
          "title": "Absci AI GLP-1 Receptor Antibodies",
          "summary": "Absci designs antibodies targeting GLP-1 receptor using generative AI. Constructs exhibit 10-fold stability improvement over baselines. Indicates biologics potential in GLP-1 therapeutics.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-05-13",
          "judge_comments": "Absci's press release mentions AI-designed biologics but focuses on an anti-TL1A antibody, not GLP-1R antibodies. No specific mention of 10-fold stability improvement.",
          "spec_comments": "Concrete actor and event; includes quantitative anchor, but uses vague 'indicates potential'.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Discovery",
          "title": "Recursion AI GLP-1 Pathway Hits",
          "summary": "Recursion applies AI phenotypic screens to identify GLP-1 modulators. Hits confirm activity in human iPSC-derived cells. Signals unbiased mechanism discovery for follow-ons.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2025-12-08",
          "judge_comments": "No evidence links Recursion's AI platform to GLP-1 modulators or iPSC-derived cells. Their focus is REC-4881 for FAP.",
          "spec_comments": "Concrete actor (Recursion AI), product (GLP-1), measurable shift (hits confirm activity). Future tense for follow-ons is a minor deduction.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Discovery",
          "title": "Isomorphic GLP-1 Structure Predictions",
          "summary": "Isomorphic Labs generates AI predictions of GLP-1 receptor structures at 0.5Å RMSD accuracy. Predictions guide novel ligand synthesis. Indicates precision engineering of GPCR binders.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 85,
          "newest_source_date": "2026-02-10",
          "judge_comments": "While Isomorphic Labs demonstrates advanced AI for drug design and protein structure prediction (including GPCRs), there's no specific mention of GLP-1 receptor structure predictions at 0.5Å RMSD or guiding novel ligand synthesis.",
          "spec_comments": "Concrete actor, product, and quantitative anchor. 'Precision engineering' is slightly interpretive but still grounded.",
          "sources": []
        },
        {
          "index": 4,
          "category": "Clinical",
          "title": "AI-Driven Adaptive GLP-1 Trials",
          "summary": "Sponsors deploy AI algorithms to adapt Phase 2 GLP-1 dosing in real-time. Trials complete enrollment four months early. Signals timeline compression in metabolic trials.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 100,
          "newest_source_date": "2026-02-25",
          "judge_comments": "While AI is used in drug *discovery* and specific GLP-1 trials show impressive speed, real-time AI-driven adaptive dosing in GLP-1 Phase 2 trials with a four-month early enrollment completion is not explicitly mentioned across two independent sources.",
          "spec_comments": "Concrete actors, event, quantitative/temporal anchor. Active voice. Minor deduction for 'timeline compression' as slightly generic.",
          "sources": []
        },
        {
          "index": 5,
          "category": "Clinical",
          "title": "Decentralized GLP-1 Trial Platforms",
          "summary": "Medable hosts decentralized GLP-1 study with 4,000 remote participants. Site costs fall 35% below benchmarks. Indicates scalable economics for large cohorts.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-02-26",
          "judge_comments": "The general trend of DCTs in GLP-1 trials is documented, but the specific claim about Medable hosting a 4,000-participant decentralized GLP-1 study with 35% site cost reduction is not verified.",
          "spec_comments": "Concrete actor, event, and quantitative anchors. 'Indicates scalable economics' is a slight forecast without a direct anchor.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Clinical",
          "title": "Wearable Data in GLP-1 Trials",
          "summary": "Trials incorporate continuous glucose monitoring from wearables for GLP-1 efficacy. Endpoint analysis accelerates by 20%. Signals digital endpoint integration.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-05-13",
          "judge_comments": "While GLP-1 trials are progressing with new drugs and methods, the direct integration of CGM data from wearables to accelerate endpoint analysis by 20% is not mentioned in these sources. The broader trend of digital endpoint integration is plausible.",
          "spec_comments": "Concrete actor (wearables) and event (trials) are named, along with a quantitative anchor.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Clinical",
          "title": "AI Trial Failure Prediction Models",
          "summary": "Owkin model predicts GLP-1 Phase 2 futility with 82% accuracy from interim data. Two studies terminate early. Indicates capital preservation in portfolios.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 95,
          "currency_score": 100,
          "newest_source_date": "2026-02-26",
          "judge_comments": "The signal points to a broader trend of AI being used in drug discovery and clinical trial optimization, including GLP-1 follow-ons. MindRank's success with MDR-001 showcases AI's potential in accelerating drug development with demonstrated efficacy and safety. The increasing rate of clinical trial terminations due to strategic business decisions further suggests a drive for capital preservation, a trend that AI-driven prediction models could support.",
          "spec_comments": "Concrete actor, product, and quantitative anchors. Active voice. Specific event and outcome.",
          "sources": []
        },
        {
          "index": 8,
          "category": "Regulatory",
          "title": "FDA AI Drug Guidance Release",
          "summary": "FDA issues guidance requiring AI model validation for discovery submissions. Document mandates reproducibility datasets. Signals oversight standardization for platforms.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 50,
          "newest_source_date": "2025-02-01",
          "judge_comments": "The FDA issued draft guidance on AI use in drug development, emphasizing model credibility and engagement with the agency.",
          "spec_comments": "Concrete actor, event, and specific requirements are present. \"Signal oversight standardization\" is a slight generalization.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Regulatory",
          "title": "EMA AI Candidate IND Acceptance",
          "summary": "EMA clears IND for Exscientia AI-designed oncology drug. Review verifies training data integrity. Indicates pathway for computational leads.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 30,
          "newest_source_date": "2024-05-21",
          "judge_comments": "The provided documents do not mention EMA clearing an IND for an Exscientia AI-designed oncology drug or any review of training data integrity. Exscientia primarily discusses IND/CTA submissions rather than EMA IND acceptances.",
          "spec_comments": "Concrete actor, event, and anchor. 'Indicates pathway' is a small generic inference.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Regulatory",
          "title": "USPTO AI Patent Expedited Reviews",
          "summary": "USPTO processes AI-generated drug patents in nine months average. Four GLP-1 compositions receive grants. Signals IP acceleration for outputs.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-04-01",
          "judge_comments": "No evidence was found to support the claim of USPTO expediting AI-generated drug patents or average nine-month process specifically for AI.",
          "spec_comments": "Concrete actor, event, and quantitative anchor. Uses active voice. No deductions.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Regulatory",
          "title": "FDA GLP-1 Digital Evidence Nod",
          "summary": "FDA incorporates AI-simulated PK data in three GLP-1 approvals. Guidance endorses surrogate modeling. Indicates data augmentation acceptance.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-04-28",
          "judge_comments": "No evidence of FDA accepting AI-simulated PK data for GLP-1 approvals or endorsing surrogate modeling. The referenced GLP-1 approval did not mention AI contributions to PK data.",
          "spec_comments": "Concrete actor (FDA), event (GLP-1 approvals), quantitative anchor (three), active voice. 'Indicates' is slightly weak.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Competitive",
          "title": "Pfizer Atomwise AI Licensing",
          "summary": "Pfizer pays $115M upfront to license Atomwise AI for GPCR hits. Deal includes GLP-1 targets. Signals big pharma AI integration.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 90,
          "currency_score": 50,
          "newest_source_date": "2025-01-07",
          "judge_comments": "No evidence of an Atomwise-Pfizer deal beyond early 2024. Pfizer has expanded its AI partnership with PostEra, not Atomwise, for drug discovery and ADCs.",
          "spec_comments": "Concrete actor, specific amount, measurable shift, active voice. 'Big pharma AI integration' is slightly abstract.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Competitive",
          "title": "Novo Oral Semaglutide NDA Filing",
          "summary": "Novo Nordisk submits NDA for oral GLP-1 with 45% bioavailability gain. Phase 3 reports 1.7% A1c reduction. Indicates formulation leadership.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 95,
          "currency_score": 85,
          "newest_source_date": "2025-12-22",
          "judge_comments": "Novo Nordisk filed an NDA for oral semaglutide. Bioavailability gain and A1c reduction claims are not directly supported by current sources.",
          "spec_comments": "Concrete actor, product, event, and quantitative anchors. Minimal fluff.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Competitive",
          "title": "Lilly Versanis Obesity Acquisition",
          "summary": "Eli Lilly acquires Versanis for $1.9B adding GLP-1 combo asset. Phase 2 data supports weight loss claims. Signals portfolio expansion.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 90,
          "currency_score": 10,
          "newest_source_date": "2023-08-14",
          "judge_comments": "Eli Lilly's acquisition of Versanis Bio for up to $1.925 billion is confirmed by multiple sources. The deal brings bimagrumab, an experimental antibody, into Lilly's pipeline, which is being assessed in combination with GLP-1s for obesity. This expands Lilly’s portfolio.",
          "spec_comments": "Concrete actor, action, and quantitative anchor. 'Signals' is slightly generic, but overall strong.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Competitive",
          "title": "Roche Recursion AI Partnership",
          "summary": "Roche invests $250M in Recursion AI alliance for metabolic targets. Collaboration targets GLP-1 pathways. Indicates alliance competition in discovery.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 85,
          "newest_source_date": "2026-01-27",
          "judge_comments": "Roche's Recursion AI alliance is for neuroscience and oncology, not metabolic targets or GLP-1 pathways, and predates recent GLP-1 developments.",
          "spec_comments": "Concrete actors, event, and quantitative anchor. 'Alliance competition' is a slight deduction.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "energy-grid-electrification",
      "scores": {
        "verifiability": 90,
        "specificity": 78,
        "currency": 58,
        "coverage": 91,
        "composite": 82,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Supply",
          "title": "NuScale VOYGR SMR Certification",
          "summary": "U.S. Nuclear Regulatory Commission certifies NuScale Power's VOYGR small modular reactor design. Signals baseload supply options for transmission-constrained data center regions.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 70,
          "newest_source_date": "2025-06-04",
          "judge_comments": "The NRC issued a Standard Design Approval for NuScale's US460 SMR on May 29, 2025, which is based on the VOYGR design. This enables reference in licensing applications.",
          "spec_comments": "Good concrete names for actor, event, and product. \"Baseload supply options for transmission-constrained data center regions\" is a generic forecast.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Supply",
          "title": "Constellation TMI Unit 1 Restart",
          "summary": "Constellation Energy restarts Three Mile Island Unit 1 under Microsoft power purchase agreement. Indicates nuclear supply reactivation addresses hyperscaler demand near PJM bottlenecks.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 90,
          "currency_score": 70,
          "newest_source_date": "2025-09-23",
          "judge_comments": "Constellation is restarting TMI Unit 1 as the Crane Clean Energy Center, with a 20-year PPA with Microsoft to meet data center demand, alleviating PJM grid strain. The restart is ahead of schedule.",
          "spec_comments": "Excellent specificity: names actor, event, product, and includes clear temporal and quantitative anchors. Minimal deductions.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Supply",
          "title": "X-energy TRISO Fuel Production",
          "summary": "X-energy starts TRISO-X fuel fabrication at Tennessee facility for Xe-100 SMRs. Signals domestic fuel chain supports SMR commercialization.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 90,
          "currency_score": 100,
          "newest_source_date": "2026-02-13",
          "judge_comments": "TRISO-X received its license in Feb 2026 for its TX-1 facility in Oak Ridge, TN. Production is expected to begin in early 2028.",
          "spec_comments": "Concrete actor, event, product, and anchors. Minor, unavoidable future-tense implication for SMR commercialization.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Supply",
          "title": "GE Hitachi BWRX-300 Progress",
          "summary": "Ontario Power Generation submits BWRX-300 SMR construction license to Canadian regulator. Indicates compact reactors expand supply near urban loads.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 50,
          "newest_source_date": "2025-05-08",
          "judge_comments": "OPG applied for a construction license in October 2022, which was granted in April 2025. Construction has now been approved. BWRX-300 could be operational by 2030.",
          "spec_comments": "Concrete actor, event, and temporal anchor. 'Expand supply' is slightly generic but the core is specific.",
          "sources": []
        },
        {
          "index": 4,
          "category": "Demand",
          "title": "Microsoft Nuclear Power Agreement",
          "summary": "Microsoft secures 835 MW nuclear power from Three Mile Island restart. Signals data center demand drives dedicated generation contracts.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 90,
          "currency_score": 30,
          "newest_source_date": "2024-09-20",
          "judge_comments": "Microsoft signed a 20-year PPA for 835 MW from the Three Mile Island Unit 1 restart in 2028, highlighting data center demand for dedicated carbon-free energy.",
          "spec_comments": "Concrete actor, specific event & product, quantitative and temporal anchors. Clear, active voice.",
          "sources": []
        },
        {
          "index": 5,
          "category": "Demand",
          "title": "Google Kairos SMR Commitment",
          "summary": "Google agrees to buy 500 MW from Kairos Hermes SMR by 2030. Indicates AI workloads spur hyperscaler nuclear procurement.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 95,
          "currency_score": 30,
          "newest_source_date": "2024-10-14",
          "judge_comments": "Google committed to purchasing 500 MW from Kairos by 2035, with the first SMR online by 2030, specifically for AI.",
          "spec_comments": "Concrete actors, event, and quantitative/temporal anchors. Active voice. Minimal filler.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Demand",
          "title": "Dominion Virginia Data Center Boom",
          "summary": "Dominion Energy interconnects 2 GW data center capacity in 2023. Signals transmission overload in largest U.S. data center cluster.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 30,
          "newest_source_date": "2024-11-04",
          "judge_comments": "Dominion Energy's IRP and earnings calls confirm significant data center load growth (21GW as of July 2024, 8GW additional demand studying) stressing grid infrastructure.",
          "spec_comments": "Concrete actor, specific projection with quantity, but 'strains' is a generic forecast.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Demand",
          "title": "PJM 50 GW Tech Load Queue",
          "summary": "PJM interconnection queue lists 50 GW data center and tech loads. Indicates demand surge overwhelms grid expansion capacity.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 75,
          "currency_score": 85,
          "newest_source_date": "2026-01-16",
          "judge_comments": "PJM's queue for all projects is 250 GW as of early 2024, with data centers accounting for 30-40% of future load growth. While 50GW specifically for 'tech load queue' isn't explicitly stated, the broader trend is documented across sources.",
          "spec_comments": "Concrete data point, actor, and quantity. Active, present tense. Lacks temporal anchor.",
          "sources": []
        },
        {
          "index": 8,
          "category": "Policy",
          "title": "FERC Order 1920 Planning Rule",
          "summary": "FERC requires transmission regions to plan 20-year capacity expansions with scenarios. Signals regulatory mandate targets grid bottlenecks from new loads.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2024-11-21",
          "judge_comments": "FERC Order 1920, effective May 2024 (with a follow-up in November), mandates 20-year long-term regional transmission planning.",
          "spec_comments": "Concrete actor (FERC), event (Order 1920), and quantitative anchor (20-year). 'Regulatory pressure' is a slight deduction.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Policy",
          "title": "DOE SMR Commercial Liftoff Report",
          "summary": "U.S. DOE publishes Pathways to Commercial Liftoff detailing SMR cost reductions. Indicates federal blueprint accelerates reactor supply deployment.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-03-24",
          "judge_comments": "The U.S. DOE has published a report titled 'Advanced Nuclear Commercial LiftOff' outlining a pathway to scaling nuclear capacity, including SMRs.",
          "spec_comments": "Concrete actor, event, and anchor present. 'Accelerates deployment' is a bit generic.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Policy",
          "title": "IRA Zero-Emission Credits Extension",
          "summary": "Inflation Reduction Act provides nuclear PTC at $18 per MWh zero-emission credit. Signals policy incentives sustain supply against data center growth.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-01-15",
          "judge_comments": "The IRA's clean electricity credits, including for nuclear, are confirmed by Treasury. They aim to meet growing demand, notably from data centers, despite grid concerns.",
          "spec_comments": "Names actor (IRA), event (PTC), and quantifies ($18/MWh). 'Sustain supply' is a bit vague.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Policy",
          "title": "ERCOT Large Load Integration Rules",
          "summary": "ERCOT approves framework for data centers to register as Large Flexible Loads. Indicates state policy enables demand response amid grid stress.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2025-12-01",
          "judge_comments": "ERCOT is working with the Public Utility Commission of Texas (PUCT) to implement Senate Bill 6 (SB6) [nationalacademies.org](https://www.nationalacademies.org/cdn/materials/a04b8423-3e67-4fb5-0074-655f10b88605). SB6 establishes an interconnection, operational, and cost-allocation framework for Large Loads [nationalacademies.org](https://www.nationalacademies.org/cdn/materials/a04b8423-3e67-4fb5-0074-655f10b88605). The state law also includes provisions for emergency curtailment of Large Loads with backup generation and a Large Load Demand Management Service to procure demand reductions [nationalacademies.org](https://www.nationalacademies.org/cdn/materials/a04b8423-3e67-4fb5-0074-655f10b88605). While the signal mentions \"approves framework,\" rulemakings to implement SB6 were ongoing as of late 2025 [nationalacademies.org](https://www.nationalacademies.org/cdn/materials/a04b8423-3e67-4fb5-0074-655f10b88605). However, the broader trend of enabling demand response from Large Loads, particularly data centers, is well-documented and actively being pursued [ercot.com](https://www.ercot.com/files/docs/2025/12/01/16.2-System-Planning-and-Weatherization-Update.pdf), [utilitydive.com](https://www.utilitydive.com/news/ercots-large-load-queue-jumped-almost-300-last-year-official/808820/). The specific phrasing of \"approves framework\" lacks direct confirmation, but the underlying policy direction is clear.",
          "spec_comments": "Concrete actor (ERCOT, data centers) and event (approves framework, register). Lacks quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Technology",
          "title": "Advanced Composite Conductor Installs",
          "summary": "U.S. utilities deploy 2,500 km high-capacity ACCC conductors since 2020. Signals reconductoring boosts transmission without new rights-of-way.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 90,
          "currency_score": 30,
          "newest_source_date": "2024-10-21",
          "judge_comments": "Utilities like NV Energy and SCE have deployed significant miles of ACCC conductors, confirming the signal's core claim of use for reconductoring and increased capacity.",
          "spec_comments": "Concrete actor, product, quantity, and timeframe. Strong, specific observation.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Technology",
          "title": "SMR Integral Passive Cooling",
          "summary": "NuScale SMR design uses natural circulation cooling without external power. Indicates technology enables siting near load centers.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 70,
          "newest_source_date": "2025-06-04",
          "judge_comments": "NuScale's SMR design incorporates passive safety via natural circulation, eliminating the need for active ECCS pumps. This feature is detailed in their SDA documents and reaffirmed in press releases.",
          "spec_comments": "Concrete actor (NuScale SMR), event (uses circulation). Missing quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Technology",
          "title": "Grid-Forming Battery Inverters",
          "summary": "GE Vernova ships 100 MW grid-forming inverters to California ISO. Signals inverter tech stabilizes grids with high data center penetration.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 50,
          "newest_source_date": "2025-03-26",
          "judge_comments": "While GE Vernova develops grid-forming battery systems for data centers to stabilize grids, there's no mention of shipping 100 MW specific units to CAISO. The broader trend of using GFMs for grid stability with high data center penetration is well-documented.",
          "spec_comments": "Concrete actor GE Vernova, specific event (ships 100 MW), and clear implication for grid tech.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Technology",
          "title": "Data Center Immersion Cooling Rollout",
          "summary": "Microsoft installs immersion cooling systems cutting data center power draw 20%. Indicates efficiency tech tempers grid demand intensity.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 85,
          "newest_source_date": "2025-11-12",
          "judge_comments": "Microsoft is *investigating* immersion cooling, but is not currently using it in datacenter operations, due to concerns about PFAS chemicals. Claims of 20% power draw reduction are from cold plates, not immersion cooling, and are across the full lifecycle.",
          "spec_comments": "Concrete actor, measurable shift, and quantitative anchor are strong. Minor deduction for 'indicates' future-tense implication.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "education-ai-tutors",
      "scores": {
        "verifiability": 74,
        "specificity": 87,
        "currency": 51,
        "coverage": 100,
        "composite": 78,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Pedagogy",
          "title": "University AI Tutor Pilots",
          "summary": "Harvard deploys AI tutor in CS50 course for 1000 students. Feedback reveals 20% reduction in problem-solving time.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 95,
          "currency_score": 10,
          "newest_source_date": "2024-03-07",
          "judge_comments": "Harvard integrated AI tools into CS50 for thousands of students. Students reported feeling like they had 'a personal tutor' which improved learning.",
          "spec_comments": "Concrete actor, product, event, and quantifiable results. Active voice & objective. Only minimal room for a perfect 100.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Pedagogy",
          "title": "AI Feedback in Writing Classes",
          "summary": "Stanford integrates Grammarly AI for essay grading in composition courses. Students complete revisions 30% faster.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 90,
          "currency_score": 100,
          "newest_source_date": "2026-05-13",
          "judge_comments": "Specifics unverified; broader trend of AI feedback in writing is well-documented by Stanford research and other studies, aligning with AI tutor concepts.",
          "spec_comments": "Concrete actor, product, event, and quantifiable shift. Missing a temporal anchor for the change.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Pedagogy",
          "title": "Personalized AI Learning Paths",
          "summary": "Duolingo Max delivers tailored language exercises to 5 million users. Completion rates increase by 15%. Signals customization of pedagogy at scale.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 50,
          "newest_source_date": "2025-04-30",
          "judge_comments": "Duolingo Max has AI features, but specific user numbers for tailored exercises and such a completion rate increase are not confirmed.",
          "spec_comments": "Concrete actor, product, users, and measurable shift. Minimal passive voice.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Pedagogy",
          "title": "Virtual AI Teaching Assistants",
          "summary": "MIT launches AI TA for simulated office hours. System handles 500 sessions weekly. Indicates supplementation of faculty support roles.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 70,
          "newest_source_date": "2025-07-21",
          "judge_comments": "MIT Learn offers AI assistants and tutors in select courses, but a specific AI TA for \"simulated office hours\" handling \"500 sessions weekly\" is not explicitly stated.",
          "spec_comments": "Concrete actor, event, and quantitative anchor. Passive voice in last sentence.",
          "sources": []
        },
        {
          "index": 4,
          "category": "Credentials",
          "title": "Rise of Micro-Credentials",
          "summary": "Coursera awards 10 million professional certificates since 2020. Employers accept 80% for hiring decisions.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 95,
          "currency_score": 50,
          "newest_source_date": "2025-05-02",
          "judge_comments": "While Coursera's specific 10 million certificates awarded figure isn't confirmed, the general trend of micro-credential adoption and employer acceptance for hiring is well-documented by multiple sources.",
          "spec_comments": "Concrete actor (Coursera), specific product/event (certificates), quantitative/temporal anchors (10M, 2020, 80%).",
          "sources": []
        },
        {
          "index": 5,
          "category": "Credentials",
          "title": "Blockchain Verified Degrees",
          "summary": "MIT issues blockchain diplomas to 2023 graduates. Credential verification completes in seconds.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 90,
          "currency_score": 10,
          "newest_source_date": "2018-04-25",
          "judge_comments": "MIT has been issuing blockchain-verified diplomas since 2017, confirming the existence of the technology and instant verification.",
          "spec_comments": "Concrete actor, event, and quantifiable outcome. Active voice and present tense used well.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Credentials",
          "title": "Employer-Led Skill Badges",
          "summary": "Google Career Certificates secure recognition from 150 firms. 75% recipients advance in jobs.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 90,
          "currency_score": 10,
          "newest_source_date": "2024-04-24",
          "judge_comments": "Google Career Certificates are recognized by an employer consortium of 150+ companies. 75% of graduates report positive career impact.",
          "spec_comments": "Concrete actor, specific event, and quantitative anchors provide strong specificity. No deductions needed.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Credentials",
          "title": "Unbundled Course Credits",
          "summary": "Western Governors credits MOOCs toward degrees. Modular program enrollment accelerates.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 10,
          "newest_source_date": "2024-04-16",
          "judge_comments": "WGU partners with edX to offer MicroBachelors programs, which are credit-backed and stackable towards degrees. WGU also partners with Udacity for Nanodegrees.",
          "spec_comments": "Concrete actor (Western Governors) and event (credits MOOCs toward degrees) named, active voice. 'Accelerates' is a vague qualifier.",
          "sources": []
        },
        {
          "index": 8,
          "category": "Economics",
          "title": "Subscription Learning Models",
          "summary": "MasterClass provides unlimited courses for $180 annually. Membership tops 2 million users.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 100,
          "newest_source_date": "2026-04-07",
          "judge_comments": "While MasterClass offers an annual membership, the specific price of $180 and the claim of 2 million users were not confirmed in the search results.",
          "spec_comments": "Concrete actor, product, price, and membership number. Clear and concise.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Economics",
          "title": "AI Reduces Tutoring Costs",
          "summary": "Chegg AI tutors cost $10 monthly versus $50 hourly human rate. Adoption exceeds legacy services.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 70,
          "newest_source_date": "2025-10-27",
          "judge_comments": "Chegg mentions AI reducing content creation costs and making learning affordable, but no specific comparison of AI tutor cost vs. human tutor cost, or adoption rates, is provided.",
          "spec_comments": "Concrete actors, products, costs, and a temporal anchor are present. 'Adoption exceeds' slightly vague, but still strong.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Economics",
          "title": "University Revenue from Certs",
          "summary": "edX earns $100M from verified certificates in 2023. Institutions launch branded programs.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 90,
          "currency_score": 50,
          "newest_source_date": "2024-12-13",
          "judge_comments": "The provided search results do not mention edX earning $100M from verified certificates in 2023. While they discuss growth in AI-related programs and overall learner numbers, specific revenue figures for verified certificates are not present.",
          "spec_comments": "Concrete actor (edX), event (earns $100M), quantitative/temporal anchor (2023).",
          "sources": []
        },
        {
          "index": 11,
          "category": "Economics",
          "title": "Decline in Full-Time Enrollment",
          "summary": "U.S. colleges record 5% drop in traditional enrollment since 2022. Lifelong learning options expand.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 85,
          "newest_source_date": "2026-01-15",
          "judge_comments": "Multiple sources indicate an *increase* in overall college enrollment, with total postsecondary enrollment up by 3.2% in Spring 2025 and 1.0% in Fall 2025.",
          "spec_comments": "Concrete actor, quantitative anchor, and clear event. \"Lifelong learning options expand\" is a bit generic.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Equity",
          "title": "AI Tutors for Underserved Areas",
          "summary": "Khan Academy AI serves 100M low-income users. Achievement gaps decrease 10%.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 100,
          "newest_source_date": "2026-04-21",
          "judge_comments": "Khan Academy works to serve underserved communities and reduce achievement gaps, but specific outcomes, especially 10% reductions, are not yet verified.",
          "spec_comments": "Concrete actor, product, users, and measurable shift with quantitative anchors. Uses present tense.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Equity",
          "title": "Bias Audits in Ed AI Tools",
          "summary": "UNESCO requires bias evaluations for learning AI. Half of tools exhibit demographic skews.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 10,
          "newest_source_date": "2024-01-16",
          "judge_comments": "The UNESCO documents discuss ethical AI and human-centered design but do not explicitly mention a requirement for bias evaluations in learning AI tools or statistics on tools exhibiting demographic skews.",
          "spec_comments": "Concrete actor, action, and quantitative anchor. 'Half' is slightly vague but acceptable here.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Equity",
          "title": "Free AI Tutoring Platforms",
          "summary": "IBM Watson Tutor supplies free STEM aid worldwide. Developing countries log highest usage.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2025-12-11",
          "judge_comments": "No evidence for an 'IBM Watson Tutor' offering free STEM aid, especially to developing countries. IBM's AI efforts are focused on broader training initiatives and partnerships.",
          "spec_comments": "Concrete actor, product, and observable trend, but 'worldwide' and 'highest usage' are vague quantifiers.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Equity",
          "title": "Inclusive AI for Disabilities",
          "summary": "Microsoft Reading Coach supports dyslexic learners with adaptive features. Special education adoption doubles.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 10,
          "newest_source_date": "2024-03-13",
          "judge_comments": "Microsoft Reading Coach offers personalized reading practice, including text-to-speech analysis, and adapts to learner needs. It is available in a standalone app, and an AI in Special Education course is launching.",
          "spec_comments": "Concrete actor, product, and measurable shift. Uses active voice. Specifics are well-defined.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "geopolitics-tech-blocs",
      "scores": {
        "verifiability": 90,
        "specificity": 58,
        "currency": 76,
        "coverage": 91,
        "composite": 78,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Trade",
          "title": "US Semiconductor Export Curbs",
          "summary": "US Bureau of Industry and Security tightens controls on advanced chips to China. Signals exclusive tech trade blocs amid sovereignty pushes.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2026-01-15",
          "judge_comments": "The US has imposed and continues to strengthen export controls on semiconductor technology to China, citing national security concerns and military applications. This confirms increased tech trade tensions.",
          "spec_comments": "Concrete actors and event, but 'increased trade tensions' is a bit generic.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Trade",
          "title": "EU Chips Act Investments",
          "summary": "EU commits €43 billion to boost domestic semiconductor manufacturing capacity. Indicates trade realignment toward bloc-based supply chains.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 75,
          "currency_score": 50,
          "newest_source_date": "2025-04-28",
          "judge_comments": "The EU Chips Act aims for semiconductor sovereignty with significant investment, fostering bloc-based supply chains.",
          "spec_comments": "Concrete actor, quantitative anchor, active voice. 'Trade realignment' is a bit generic.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Trade",
          "title": "India-US Chip Supply Pact",
          "summary": "India and US ink semiconductor supply chain cooperation agreement. Signals non-China alliance formation in trade flows.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-02-20",
          "judge_comments": "India joined the Pax Silica initiative, signing a declaration with the US to secure AI foundational technologies and strengthen supply chains. This forms a non-China focused tech-bloc.",
          "spec_comments": "Concrete actors (India, US), event (ink agreement), and shift (non-China alliance) noted. Lacks quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Trade",
          "title": "Japan Aligns Export Controls",
          "summary": "Japan restricts semiconductor equipment exports matching US rules. Indicates coordinated trade barriers in tech blocs.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-03-03",
          "judge_comments": "The US and Japan have substantially aligned export controls on advanced semiconductor manufacturing equipment, including tighter restrictions on various components and software, targeting China's indigenous chip production capabilities.",
          "spec_comments": "Concrete actors, event, and temporal anchor are good. \"tightening... limits\" is a bit generic.",
          "sources": []
        },
        {
          "index": 4,
          "category": "Security",
          "title": "CFIUS Blocks Chip Deals",
          "summary": "US CFIUS halts Chinese acquisitions of American semiconductor assets. Signals security screening intensification in alliance structures.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-13",
          "judge_comments": "US CFIUS ordered a Chinese-controlled firm to divest Emcore chip assets due to national security risks, specifically IP and supply chain. This reflects tightened scrutiny of foreign tech deals.",
          "spec_comments": "Concrete actor, specific event, but lacks quantitative/temporal anchor. 'Intensification' is vague.",
          "sources": []
        },
        {
          "index": 5,
          "category": "Security",
          "title": "DoD Secure Foundry Contracts",
          "summary": "US Defense Department funds domestic secure chip production facilities. Indicates militarized semiconductor sovereignty efforts.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 30,
          "newest_source_date": "2024-09-16",
          "judge_comments": "The DoD, in collaboration with the Department of Commerce, is funding domestic secure chip production, evidenced by Intel's Secure Enclave award and participation in RAMP-C.",
          "spec_comments": "Concrete actor (DoD), action (funds), and object (facilities) present. Lacks quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Security",
          "title": "AUKUS Semiconductor Sharing",
          "summary": "AUKUS pact extends to advanced semiconductor technology exchanges. Signals security alliances reshaping tech access.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 40,
          "currency_score": 85,
          "newest_source_date": "2025-12-12",
          "judge_comments": "AUKUS specifically includes AI and advanced capabilities. Pax Silica reinforces deeper tech cooperation among AUKUS nations on semiconductors.",
          "spec_comments": "No concrete actors, events, or anchors. Uses 'extends to', 'reshaping tech access' - general.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Security",
          "title": "Quad Critical Minerals Pact",
          "summary": "Quad nations agree on secure semiconductor minerals supply. Indicates bloc-level security for supply chain resilience.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2026-02-05",
          "judge_comments": "No direct mention of a 'Quad Critical Minerals Pact' was found. However, there are significant efforts by the US and its allies to secure critical mineral supply chains, indicating a broader trend.",
          "spec_comments": "Names actors (Quad), concrete event (pact), but lacks quantitative/temporal anchors.",
          "sources": []
        },
        {
          "index": 8,
          "category": "Standards",
          "title": "China National Chip Standards",
          "summary": "China enforces domestic standards for semiconductor design and production. Signals standards bifurcation between rival tech blocs.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 70,
          "newest_source_date": "2025-08-19",
          "judge_comments": "China has released and will implement national standards for chiplet interconnects, signaling a distinct semiconductor ecosystem, and has a broader action plan for technology standards to be in place by 2027. Multiple sources confirm China's aim for semiconductor sovereignty and a divergence in technical standards, such as chiplet interfaces like ACC 1.0 against UCIe 2.0. This is part of China's strategy for a two-tiered global technology landscape.",
          "spec_comments": "Names actor and event. Lacks specific product/standard/date. 'Bifurcation' is a bit of a forecast.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Standards",
          "title": "US Trusted Foundry Standards",
          "summary": "US government mandates standards for trusted semiconductor manufacturing. Indicates alliance-specific norms for secure chips.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 40,
          "currency_score": 85,
          "newest_source_date": "2025-12-29",
          "judge_comments": "The US is actively working to secure its semiconductor supply chain and promote domestic manufacturing; allied partnerships are a core part of its strategy.",
          "spec_comments": "No concrete actor, event, or temporal anchor. 'US government mandates' is somewhat vague.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Standards",
          "title": "RISC-V Adoption Surge",
          "summary": "US allies accelerate RISC-V open standard implementation in chips. Signals shift from proprietary standards in blocs.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 55,
          "currency_score": 100,
          "newest_source_date": "2026-03-20",
          "judge_comments": "Multiple reputable sources confirm US allies (EU, Hong Kong) are actively adopting RISC-V to foster self-reliance and innovation in semiconductors.",
          "spec_comments": "Good actor/event. 'Accelerate' is a vague quantifier, and 'blocs' is generic.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Standards",
          "title": "EU Digital Sovereignty Norms",
          "summary": "EU develops standards for sovereign semiconductor ecosystems. Indicates bloc-driven divergence in tech interoperability.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-05-27",
          "judge_comments": "The EU is actively developing frameworks and policies, including the Chips Act, to enhance its semiconductor ecosystem and technological sovereignty. This effort aims to reduce dependencies and strengthen its industrial base.",
          "spec_comments": "Concrete actor and event; lacks quantitative or temporal anchor. \"Divergence\" is slightly vague.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Talent Flows",
          "title": "US Visa Curbs on Talent",
          "summary": "US limits H-1B visas for Chinese semiconductor specialists. Signals talent restriction in competing tech blocs.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2024-12-02",
          "judge_comments": "While the US restricts China's access to semiconductor tech, and talent is a key component, there's no specific mention of H-1B visa curbs for Chinese semiconductor specialists in the provided sources.",
          "spec_comments": "Concrete actor, action, and target. 'Limits' is slightly vague. 'Talent restriction' is somewhat generic.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Talent Flows",
          "title": "Taiwan Engineers to Europe",
          "summary": "European nations recruit Taiwanese chip design experts aggressively. Indicates talent redirection for sovereignty goals.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 45,
          "currency_score": 70,
          "newest_source_date": "2025-05-28",
          "judge_comments": "Taiwan is actively establishing IC design training bases in Europe, specifically in the Czech Republic, and TSMC is opening a design center in Munich to address talent needs and strengthen European semiconductor capabilities.",
          "spec_comments": "No concrete actors, no quantitative/temporal anchor. 'Aggressively' is vague.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Talent Flows",
          "title": "India-US Talent Pipeline",
          "summary": "US chip firms expand training programs for Indian engineers. Signals allied bloc talent flow acceleration.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 55,
          "currency_score": 100,
          "newest_source_date": "2026-02-20",
          "judge_comments": "Purdue University has partnered with India for semiconductor workforce development. The Pax Silica Declaration also highlights shared workforce goals.",
          "spec_comments": "Concrete actors and event, but 'acceleration' and 'expand' are vague. Lacks quantitative/temporal anchor.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Talent Flows",
          "title": "China Chip Expert Exodus",
          "summary": "Prominent Chinese semiconductor researchers join US firms. Indicates brain drain reshaping alliance talent pools.",
          "verdict": "fabricated",
          "verifiability_score": 20,
          "specificity_score": 40,
          "currency_score": 50,
          "newest_source_date": "2025-04-09",
          "judge_comments": "The signal claims Chinese semiconductor experts are joining US firms, suggesting a 'brain drain' from China. However, all credible sources indicate the opposite trend: prominent Chinese-born semiconductor experts are returning to China from the US, driven by China's push for self-reliance and US export controls.",
          "spec_comments": "No specific firms, names, or quantifiable shift are provided, and no temporal anchor.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "ai-infrastructure-scaling",
      "scores": {
        "verifiability": 76,
        "specificity": 83,
        "currency": 60,
        "coverage": 97,
        "composite": 79,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Compute",
          "title": "Persistent H100 GPU Shortages",
          "summary": "NVIDIA reports H100 GPU supply lags demand by 50% in Q3 2024. Signals delays in AI training cluster expansions.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 95,
          "currency_score": 10,
          "newest_source_date": "2024-04-10",
          "judge_comments": "Sources indicate H100 lead times are decreasing, not increasing, and demand is being met through various channels. No mention of a 50% Q3 2024 lag.",
          "spec_comments": "Concrete actor, product, quantifiable shortage, and temporal anchor. Excellent specificity.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Compute",
          "title": "AI Data Center Power Rejections",
          "summary": "Utilities reject 2.9GW power requests for US AI data centers. Indicates energy infrastructure limits compute growth.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-04-01",
          "judge_comments": "Nearly half of planned US AI data centers (7GW of 12GW) are delayed/canceled due to power grid limitations and component shortages, exceeding the 2.9GW mentioned.",
          "spec_comments": "Concrete actor (Utilities, US AI data centers), specific action (reject), quantitative anchor (2.9GW).",
          "sources": []
        },
        {
          "index": 2,
          "category": "Compute",
          "title": "GPU Cluster Utilization at 45%",
          "summary": "Benchmarks show average GPU utilization reaches 45% in production clusters. Signals inefficiencies constrain scaling benefits.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-04-21",
          "judge_comments": "Multiple sources indicate average GPU utilization is significantly lower than 45% in production clusters, some as low as 5-11%.",
          "spec_comments": "Concrete actor and anchor, but lacks specific product/filing. 'Inefficiencies' is vague.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Compute",
          "title": "1.6Tbps Optical Interconnects Test",
          "summary": "Broadcom deploys 1.6Tbps optical Ethernet in AI superclusters. Indicates bandwidth pushes beyond electrical limits.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 100,
          "newest_source_date": "2026-03-12",
          "judge_comments": "Broadcom announced the availability of its 3nm 400G/lane optical PAM-4 DSP, the Taurus™ BCM83640, optimized for 1.6T transceiver solutions and sampling to early access customers.",
          "spec_comments": "Concrete actor, product, and quantitative anchor. 'Pushes beyond electrical limits' is a slight deduction.",
          "sources": []
        },
        {
          "index": 4,
          "category": "Models",
          "title": "4-Bit Quantized Llama 3.1",
          "summary": "Meta releases Llama 3.1 in 4-bit format for edge deployment. Signals reduced memory demands for inference.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 95,
          "currency_score": 30,
          "newest_source_date": "2024-07-23",
          "judge_comments": "Meta has released Llama 3.1, including 8-bit quantized versions for production inference. Earlier Llama 3.2 1B and 3B models were released in 4-bit versions for mobile edge devices, reducing memory and improving speed.",
          "spec_comments": "Concrete actor, event, and quantitative anchor. 'Signals reduced' is slightly passive.",
          "sources": []
        },
        {
          "index": 5,
          "category": "Models",
          "title": "Mixtral MoE Architecture Deployment",
          "summary": "Mistral Mixtral 8x22B serves at 70B dense model speed. Indicates sparse activation cuts inference compute.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 10,
          "newest_source_date": "2023-12-01",
          "judge_comments": "Mixtral 8x7B (a smaller version of Mixtral 8x22B) achieves 6x faster inference than Llama 2 70B, matching GPT-3.5 quality. This is due to its sparse MoE architecture where only a fraction of parameters are active per token, enabling a 47B parameter model to run at the speed of a 13B model.",
          "spec_comments": "Concrete actor, product, and specific metric. Lacks a temporal anchor for 'serves'.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Models",
          "title": "Distilled 7B Matches 70B",
          "summary": "Distillation compresses 70B models to 7B with 95% performance. Signals smaller models for cost-effective serving.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-01-30",
          "judge_comments": "Multiple sources confirm distillation of larger models (e.g., 70B) into smaller ones (e.g., 7B or 8B) with high performance retention, significantly reducing inference costs.",
          "spec_comments": "Concrete product, quantitative anchor, active voice. Lacks specific actors/companies.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Models",
          "title": "Speculative Decoding in vLLM",
          "summary": "vLLM integrates speculative decoding for 2x LLM throughput. Indicates latency reductions via parallel sampling.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 30,
          "newest_source_date": "2024-10-17",
          "judge_comments": "vLLM integrates speculative decoding, showing up to 2.8x speedups in specific scenarios, enhancing throughput and reducing latency.",
          "spec_comments": "Concrete actor (vLLM), event (integrates speculative decoding), quantitative anchor (2x, latency reductions).",
          "sources": []
        },
        {
          "index": 8,
          "category": "Tooling",
          "title": "vLLM PagedAttention Framework",
          "summary": "vLLM PagedAttention serves 10M tokens/sec on 8xH100. Signals high-throughput standard for LLM inference.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 90,
          "currency_score": 70,
          "newest_source_date": "2025-10-16",
          "judge_comments": "While vLLM with PagedAttention significantly boosts throughput and is a high-throughput standard, the specific claim of 10M tokens/sec on 8xH100 is not explicitly confirmed in the provided sources.",
          "spec_comments": "Concrete actor, product, quantity, and temporal anchor present. No major deductions.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Tooling",
          "title": "TensorRT-LLM H100 Optimizations",
          "summary": "NVIDIA TensorRT-LLM boosts Llama 70B inference 4x on H100. Indicates GPU-specific acceleration tooling.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 95,
          "currency_score": 10,
          "newest_source_date": "2023-09-09",
          "judge_comments": "TensorRT-LLM accelerates Llama 2 70B inference by 4.6x on H100 GPUs, reducing TCO and energy consumption.",
          "spec_comments": "Concrete actor, product, measurable shift (4x), and quantitative anchor (70B, H100).",
          "sources": []
        },
        {
          "index": 10,
          "category": "Tooling",
          "title": "SGLang Structured Generation",
          "summary": "SGLang accelerates LLM apps 4x with grammar constraints. Signals optimized execution for production pipelines.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-05-13",
          "judge_comments": "SGLang uses compressed finite state machines for faster constrained decoding, achieving up to 6.4x throughput over other systems on prefix-heavy workloads and 1.8x at low concurrency.",
          "spec_comments": "Names SGLang and LLM apps, states 4x acceleration. Lacks a temporal anchor or specific event.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Tooling",
          "title": "Triton Multi-Model Server",
          "summary": "NVIDIA Triton 24.09 supports MoE and dynamic batching. Indicates unified serving for diverse models.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 70,
          "newest_source_date": "2025-09-01",
          "judge_comments": "NVIDIA Triton supports dynamic batching and concurrent model execution (including MoE) to improve throughput and resource utilization.",
          "spec_comments": "Concrete actor, product, temporal anchor, active voice. Lacks specific measurable shift.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Economics",
          "title": "Grok API Price at 0.10/M",
          "summary": "xAI sets Grok-2 inference at $0.10 per million tokens. Signals downward pressure on API economics.",
          "verdict": "fabricated",
          "verifiability_score": 20,
          "specificity_score": 90,
          "currency_score": 100,
          "newest_source_date": "2026-05-06",
          "judge_comments": "Grok-2 inference is not $0.10/M. Current Grok models are $1.25/M (input) and $2.50/M (output), or $2.00/M (input) and $6.00/M (output), with cached input at $0.20/M.",
          "spec_comments": "Concrete actor, product, event, and quantitative anchor. 'Downward pressure' is a slight deduction.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Economics",
          "title": "Batch Inference 75% Discounts",
          "summary": "Together AI applies 75% discount to batch inference pricing. Indicates shift to cost-efficient async workloads.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 70,
          "newest_source_date": "2025-09-15",
          "judge_comments": "Together AI consistently states a 50% discount for batch inference on most serverless models, not 75%. This is explicitly mentioned in multiple blog posts and their pricing documentation.",
          "spec_comments": "Concrete actor, quantitative anchor, active voice. 'Indicates shift' is a minor deduction for future implication.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Economics",
          "title": "RunPod A100 Rentals at 0.20/hr",
          "summary": "RunPod lowers A100 GPU rental to $0.20 per hour. Signals accessible self-hosting for startups.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 95,
          "currency_score": 10,
          "newest_source_date": "2024-04-01",
          "judge_comments": "RunPod shows A100s at or above $0.76/hr for Flex workers and $1.69/hr for Secure Cloud as of April 2026. $0.20/hr appears to be for less powerful GPUs.",
          "spec_comments": "Concrete actor, product, price, and active voice. Clear, anchored observation.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Economics",
          "title": "Baseten Serverless at Sub-Cent",
          "summary": "Baseten charges under one cent per million input tokens. Indicates granular pay-per-use inference models.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-04-17",
          "judge_comments": "No direct mention of 'sub-cent per million input tokens' found. Baseten details discounted cache token pricing, but not overall input token pricing at that scale.",
          "spec_comments": "Concrete actor, product, and quantitative anchor. Passive voice for the implication.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "mobility-autonomous-fleets",
      "scores": {
        "verifiability": 83,
        "specificity": 69,
        "currency": 75,
        "coverage": 85,
        "composite": 78,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Technology",
          "title": "Waymo Phoenix Fleet Expansion",
          "summary": "Waymo operates 700 robotaxis in Phoenix daily. Signals robotaxi commercialization scale for OEM urban deployment.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 85,
          "newest_source_date": "2025-11-12",
          "judge_comments": "Waymo has expanded its robotaxi service in Phoenix, including freeway operations, which signals increased technical reliability and operational confidence in urban environments. They've also expanded to new cities such as Dallas, Houston, San Antonio, and Orlando simultaneously, showing a broader expansion of services.",
          "spec_comments": "Concrete actor and event, specific location named. The second sentence is slightly interpretative.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Technology",
          "title": "Aurora Driverless Truck Routes",
          "summary": "Aurora runs driverless trucks on 100-mile Texas routes. Indicates autonomous trucking economics through freight efficiency.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 90,
          "currency_score": 100,
          "newest_source_date": "2026-05-13",
          "judge_comments": "Aurora operates driverless trucks on routes, including Fort Worth to El Paso and Dallas to Houston. The economic benefits of efficiency are highlighted by Aurora and Texas officials [aurora.tech](https://ir.aurora.tech/news-events/press-releases/detail/132/aurora-triples-driverless-network-to-10-routes-and-prepares-to-expand-across-u-s-sun-belt), [businesswire.com](https://www.businesswire.com/news/home/20250501031863/en/Aurora-Begins-Commercial-Driverless-Trucking-in-Texas-Ushering-in-a-New-Era-of-Freight).",
          "spec_comments": "Concrete actor, specific route length, implies observable efficiency, active voice.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Technology",
          "title": "LiDAR Sensor Price Cuts",
          "summary": "Luminar delivers LiDAR units at $500 per sensor. Signals cost reductions enabling robotaxi fleet economics.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 50,
          "currency_score": 50,
          "newest_source_date": "2025-05-13",
          "judge_comments": "LiDAR unit costs below $500, and even $200, are repeatedly cited across multiple reputable sources due to mass production and chip integration.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Technology",
          "title": "Tesla FSD Compute Upgrades",
          "summary": "Tesla integrates HW4 into FSD vehicles for redundancy. Indicates technology maturity for robotaxi operations.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 60,
          "currency_score": 100,
          "newest_source_date": "2026-04-23",
          "judge_comments": "Tesla is integrating HW4 for FSD, but full redundancy for robotaxi operations isn't explicitly confirmed as completed or fully realized through this. HW3 cars require retrofits.",
          "spec_comments": "Concrete actor and event, but 'technology maturity' and 'robotaxi operations' are forecast-like, lacking specific anchors.",
          "sources": []
        },
        {
          "index": 4,
          "category": "Regulation",
          "title": "California AV Testing Permits",
          "summary": "California DMV issues 50 new AV testing permits. Signals regulatory easing for robotaxi commercialization.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-05-05",
          "judge_comments": "The signal claims 50 new AV testing permits. While regulations have changed, the provided sources don't support 50 'new' permits by the DMV for robotaxi commercialization specifically.",
          "spec_comments": "Concrete actor, number, and event. Easing is somewhat vague. No active voice for objective sentence.",
          "sources": []
        },
        {
          "index": 5,
          "category": "Regulation",
          "title": "FMCSA Remote Trucking Rules",
          "summary": "FMCSA approves remote monitoring for autonomous trucks. Indicates regulatory support for trucking economics.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 10,
          "newest_source_date": "2023-02-01",
          "judge_comments": "FMCSA has requested public comment on remote assistants for ADS-equipped CMVs, but has not yet approved rules.",
          "spec_comments": "Concrete actor, action, and implies a shift. Lacks quantitative/temporal anchor, uses 'indicates'.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Regulation",
          "title": "EU AV Data Sharing Mandate",
          "summary": "EU requires AV firms to share safety data. Signals harmonized rules impacting urban mobility.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-03",
          "judge_comments": "The EU has mandated technical specifications for type-approval of automated driving systems, including safety validation and management systems. This impacts urban mobility and autonomous vehicle deployment.",
          "spec_comments": "Names actor (EU), event (mandate). Lacks specific firms, dates, or measurable shift details.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Regulation",
          "title": "Texas Driverless Operations Law",
          "summary": "Texas enacts law allowing fully driverless vehicles. Indicates state-level push for robotaxi services.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-04-30",
          "judge_comments": "Texas's SB 2807 (effective Sept 2025, enforceable May 2026) establishes a regulatory framework for commercial driverless operation. Bot Auto completed a humanless commercial truckload in Texas, highlighting the law's impact. The law covers urban mobility and trucking.",
          "spec_comments": "Names a concrete actor (Texas) and event (enacts law). Lacks specific date or measurable shift in the summary itself.",
          "sources": []
        },
        {
          "index": 8,
          "category": "Business Model",
          "title": "Zoox Amazon Funding Boost",
          "summary": "Amazon invests $1 billion in Zoox robotaxi tech. Signals investor backing for AV business models.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-24",
          "judge_comments": "While Reuters mentions Amazon owns Zoox, no specific $1 billion investment from Amazon in Zoox is found in the search results.",
          "spec_comments": "Concrete actor, event, and quantitative anchor are present. 'Signals investor backing' is a generic forecast.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Business Model",
          "title": "Uber Waymo Partnership Growth",
          "summary": "Uber expands Waymo robotaxi integration in Austin. Indicates ride-hailing shift to autonomous fleets.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-03-04",
          "judge_comments": "Uber and Waymo expanded their partnership to Austin, TX, with robotaxis available on the Uber app since March 2025. Atlanta is next.",
          "spec_comments": "Concrete actors and event, but 'shift' is a bit generic and forecast-like.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Business Model",
          "title": "TuSimple Freight Contracts",
          "summary": "TuSimple secures contracts for autonomous trucking hauls. Signals economics viability via cost savings.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 55,
          "currency_score": 0,
          "judge_comments": "No recent direct evidence of TuSimple securing new contracts for autonomous trucking hauls or specific economic viability claims.",
          "spec_comments": "Concrete actor and event, but lacks quantitative/temporal anchors and uses 'signals' passively.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Business Model",
          "title": "Motional Hyundai Robotaxi Deal",
          "summary": "Hyundai licenses Motional tech for robotaxi production. Indicates OEM integration of AV business models.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 60,
          "currency_score": 100,
          "newest_source_date": "2026-03-13",
          "judge_comments": "Motional uses Hyundai-produced Ioniq 5 robotaxis, but there's no indication of a licensing deal or Hyundai integrating Motional's tech into its broader product line.",
          "spec_comments": "Concrete actors, event, but lacks quantitative/temporal anchors and uses some generic observations.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Cities",
          "title": "San Francisco Cruise Halt",
          "summary": "San Francisco suspends Cruise robotaxi permits post-incident. Signals urban safety concerns for AV rollout.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 50,
          "newest_source_date": "2024-12-10",
          "judge_comments": "DMV and CPUC suspended Cruise permits following incidents and safety concerns raised by San Francisco officials.",
          "spec_comments": "Concrete actor, action, and event with a clear temporal anchor. \"Signals\" is slightly passive.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Cities",
          "title": "Phoenix Waymo Rider Uptake",
          "summary": "Phoenix residents book 100,000 Waymo rides weekly. Indicates city acceptance of robotaxi services.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 95,
          "currency_score": 50,
          "newest_source_date": "2025-02-27",
          "judge_comments": "The claim of 100,000 rides specifically in Phoenix is not supported. Waymo's overall weekly rides are higher.",
          "spec_comments": "Concrete actor, quantitative anchor, active voice, present tense. Specific and sharp.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Cities",
          "title": "Singapore AV Shuttle Zones",
          "summary": "Singapore designates zones for driverless shuttles. Signals urban planning for autonomous mobility.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-04-07",
          "judge_comments": "Singapore's LTA has announced progressive deployment of autonomous shuttle services in Punggol, with specific routes and operators. Public rides have commenced for some routes, indicating designated zones.",
          "spec_comments": "Concrete actor and event named. Lacks quantitative/temporal anchor. Active voice and present tense used.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Cities",
          "title": "Austin Tesla Robotaxi Prep",
          "summary": "Austin approves Tesla robotaxi pilot sites. Indicates municipal support for AV commercialization.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-04-29",
          "judge_comments": "Tesla is operating a limited number of unsupervised robotaxis in Austin, but no sources indicate specific 'pilot sites' or municipal approval of such. The city's actions are focused on managing existing AV operations.",
          "spec_comments": "Concrete actor, event, and location given. Lacks quantitative/temporal anchor.",
          "sources": []
        }
      ]
    },
    {
      "brief_id": "food-agtech-shifts",
      "scores": {
        "verifiability": 72,
        "specificity": 76,
        "currency": 75,
        "coverage": 100,
        "composite": 78,
        "n_signals": 16
      },
      "signals": [
        {
          "index": 0,
          "category": "Technology",
          "title": "Precision Fermentation Yield Gains",
          "summary": "Engineered microbes produce casein at 100g/L titers in pilot plants. Signals cost reductions for dairy proteins in food formulations.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 50,
          "newest_source_date": "2025-05-07",
          "judge_comments": "While industrial production of precision fermentation casein is confirmed, no specific 100g/L titer has been publicly stated. Cost reduction is a stated goal, but not yet verified.",
          "spec_comments": "Concrete actor (engineered microbes), specific product (casein), quantitative anchor (100g/L), and present tense.",
          "sources": []
        },
        {
          "index": 1,
          "category": "Technology",
          "title": "CRISPR Drought-Tolerant Wheat",
          "summary": "Researchers release CRISPR-edited wheat varieties resisting 30% yield loss in droughts. Indicates resilient grain options for staple food production.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 65,
          "currency_score": 70,
          "newest_source_date": "2025-09-19",
          "judge_comments": "Multiple sources confirm field trials of gene-edited drought-tolerant wheat, showing promise for climate resilience.",
          "spec_comments": "Good actor, event, and quantifiable anchor; 'accelerating replacement' is generic forecast.",
          "sources": []
        },
        {
          "index": 2,
          "category": "Technology",
          "title": "AI-Driven Gene Editing Tools",
          "summary": "AI platforms accelerate discovery of climate-resilient crop traits by 5x. Signals faster development of adaptive seed varieties.",
          "verdict": "future",
          "verifiability_score": 75,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-05-08",
          "judge_comments": "AI is being used to accelerate gene discovery, aiming to reduce breeding timelines. No specific mention of a 5x acceleration, but implies significant speed-up.",
          "spec_comments": "Good anchor (5x), but lacks a named actor or specific event/product.",
          "sources": []
        },
        {
          "index": 3,
          "category": "Technology",
          "title": "Microbial Fat Production Scale",
          "summary": "Companies engineer yeasts to yield cocoa butter equivalents at 50g/L. Signals alternatives to imported tropical fats.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-04-15",
          "judge_comments": "Companies like Seminal Biosciences and Celleste Bio use engineered yeast (e.g., Yarrowia lipolytica) to produce cocoa butter alternatives. Some strains can produce ~60% of their body weight in fat, with Celleste aiming for significant production volumes.",
          "spec_comments": "Concrete actor (companies), event (engineer yeasts), product (cocoa butter equivalents), quantitative anchor (50g/L).",
          "sources": []
        },
        {
          "index": 4,
          "category": "Policy",
          "title": "Food Sovereignty Bill Passage",
          "summary": "Brazil enacts law mandating 30% local sourcing for public food procurement. Signals prioritization of domestic agriculture over imports.",
          "verdict": "grounded",
          "verifiability_score": 100,
          "specificity_score": 85,
          "currency_score": 70,
          "newest_source_date": "2025-09-30",
          "judge_comments": "The minimum percentage for family farm products in school meals increased to 45%, not 30%.",
          "spec_comments": "Concrete actor, event, and quantifiable anchor; uses active voice.",
          "sources": []
        },
        {
          "index": 5,
          "category": "Policy",
          "title": "Resilient Crop Subsidy Program",
          "summary": "US allocates $2B for breeding climate-adaptive corn and soy varieties. Indicates government support for supply stability.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-04-13",
          "judge_comments": "No mention of a $2 billion Resilient Crop Subsidy Program for corn and soy was found in USDA press releases, nor any focused on 'climate-adaptive' breeding.",
          "spec_comments": "Concrete actor, amount, and purpose. Weakness in 'indicates government support'.",
          "sources": []
        },
        {
          "index": 6,
          "category": "Policy",
          "title": "GMO Labeling Requirements",
          "summary": "EU mandates labels for precision-edited ingredients in processed foods. Signals transparency demands affecting product formulations.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-03-14",
          "judge_comments": "The EU is moving towards a two-tier system for New Genomic Techniques (NGTs) where NGT-1 plants, comparable to conventionally bred varieties, will generally NOT have mandatory labeling requirements for derived food products. NGT-2 plants will retain full GMO labeling and traceability. Therefore, a blanket mandate for precision-edited ingredients in processed foods is contradicted by recent proposals.",
          "spec_comments": "Concrete actor, event, and temporal anchor. 'Affecting' is a bit weak for active voice.",
          "sources": []
        },
        {
          "index": 7,
          "category": "Policy",
          "title": "Seed Sovereignty Initiatives",
          "summary": "India promotes farmer-saved seeds through national policy framework. Indicates pushback against patented crop technologies.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 65,
          "currency_score": 85,
          "newest_source_date": "2026-01-04",
          "judge_comments": "India's recent release of climate-resilient seeds and plans for genome-edited varieties show a complex interplay between promoting farmer-centric approaches and advanced agricultural technologies, not a singular push against patented crop technologies.",
          "spec_comments": "Concrete actor (India, farmers) and event (policy framework) are named. 'Promotes' is a bit general.",
          "sources": []
        },
        {
          "index": 8,
          "category": "Consumer",
          "title": "Fermented Protein Purchases Rise",
          "summary": "US consumers buy 20% more precision-fermented dairy alternatives in 2023. Signals acceptance of novel proteins in everyday diets.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 70,
          "newest_source_date": "2025-06-01",
          "judge_comments": "No specific data found for a 20% rise in US precision-fermented dairy alternative purchases in 2023. GFI data for 2024 shows low overall consumer awareness.",
          "spec_comments": "Concrete actor, event, and quantitative anchor. Uses active voice. Small deduction for 'novel proteins'.",
          "sources": []
        },
        {
          "index": 9,
          "category": "Consumer",
          "title": "Climate-Resilient Grain Demand",
          "summary": "Shoppers select drought-tolerant rice labels 15% more frequently. Indicates preference for stable-supply staple foods.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-05-13",
          "judge_comments": "Consumers value sustainably produced rice, including climate-resilient traits, but the specific 15% preference for drought-tolerant labels is unverified.",
          "spec_comments": "Concrete product, quantitative anchor, and active voice are good. Lacks a named actor.",
          "sources": []
        },
        {
          "index": 10,
          "category": "Consumer",
          "title": "Sovereignty Food Label Growth",
          "summary": "Local-sovereignty certified products capture 10% market share in Europe. Signals value placed on non-corporate sourcing.",
          "verdict": "dubious",
          "verifiability_score": 40,
          "specificity_score": 65,
          "currency_score": 100,
          "newest_source_date": "2026-03-25",
          "judge_comments": "While 'Ohne Gentechnik' and organic labels show growth, there's no evidence of a distinct 'local-sovereignty certified products' category reaching 10% market share in Europe. Food sovereignty is gaining political traction, but not yet as a widespread label.",
          "spec_comments": "Concrete actor, quantitative anchor. Vague 'signals value' and 'non-corporate sourcing' detract.",
          "sources": []
        },
        {
          "index": 11,
          "category": "Consumer",
          "title": "Alt-Fat Consumer Adoption",
          "summary": "Precision-fermented butter substitutes sell out in major retailers. Indicates shift from traditional animal fats.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 65,
          "currency_score": 50,
          "newest_source_date": "2025-03-20",
          "judge_comments": "Savor's butter is launching in select restaurants and bakeries, not yet major retailers. Melt&Marble and Clean Food Group are approved for sales, but not yet adopted by consumers.",
          "spec_comments": "Concrete product, event, and implies a shift, but lacks actor/brands, specific retailers, or temporal anchor.",
          "sources": []
        },
        {
          "index": 12,
          "category": "Supply Chain",
          "title": "Fermentation Facility Expansions",
          "summary": "Perfect Day doubles precision fermentation capacity to 1M liters annually. Signals integration of alt-proteins into dairy chains.",
          "verdict": "future",
          "verifiability_score": 75,
          "specificity_score": 85,
          "currency_score": 50,
          "newest_source_date": "2024-12-19",
          "judge_comments": "Perfect Day's new facility in India, set to open Q1 2026, will significantly increase capacity. The 'doubling to 1M liters annually' figure is not explicitly stated in provided sources, but substantial bookings indicate confidence in increased output.",
          "spec_comments": "Concrete actor, capacity increase, and temporal anchor are strong.",
          "sources": []
        },
        {
          "index": 13,
          "category": "Supply Chain",
          "title": "Resilient Seed Contracts Surge",
          "summary": "Food firms sign deals for 25% more climate-hardy corn seeds. Indicates hedging against weather variability.",
          "verdict": "indicative",
          "verifiability_score": 60,
          "specificity_score": 85,
          "currency_score": 100,
          "newest_source_date": "2026-05-05",
          "judge_comments": "Demand for climate-resilient crops is increasing. While a 25% increase in corn seed contracts specifically isn't confirmed, the trend of increased interest and partnerships for such seeds is evident.",
          "spec_comments": "Concrete actor, quantitative anchor, and event. 'Climate-hardy' is a slight vagueness, but well-supported.",
          "sources": []
        },
        {
          "index": 14,
          "category": "Supply Chain",
          "title": "Localized Ingredient Sourcing",
          "summary": "Nestlé sources 40% proteins from regional fermentation plants. Signals reduction in global import dependencies.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 70,
          "newest_source_date": "2025-05-20",
          "judge_comments": "Nestlé is investing in precision fermentation and sourcing initiatives, but there's no mention of 40% protein from regional fermentation plants or specific reduction in global import dependencies.",
          "spec_comments": "Concrete actor, quantitative anchor, and objective present-tense effect. Good specificity, avoids hype.",
          "sources": []
        },
        {
          "index": 15,
          "category": "Supply Chain",
          "title": "Sovereignty Trade Diversification",
          "summary": "Processors shift 15% soy procurement to domestic resilient varieties. Indicates response to geopolitical food controls.",
          "verdict": "speculative",
          "verifiability_score": 80,
          "specificity_score": 85,
          "currency_score": 85,
          "newest_source_date": "2026-02-04",
          "judge_comments": "While China aims for increased domestic soybean production and reduced reliance on imports, there's no specific mention of processors shifting 15% procurement to domestic, climate-resilient varieties. Policies support general increase.",
          "spec_comments": "Concrete actor, measurable shift, and present tense. Deducted for 'geopolitical food controls' being slightly vague.",
          "sources": []
        }
      ]
    }
  ]
}