{
  "run_id": "trace_real_20260319T200653",
  "generated_at_utc": "2026-03-20T00:10:40Z",
  "benchmark_mode": "blind",
  "current": {
    "exact_match": 5,
    "semantic_match": 5,
    "total_fields": 12,
    "evidence_quality": 0.9,
    "low_quality_source_urls": null,
    "grounded_fields": 3,
    "tokens_used": 37808,
    "tokens_per_grounded_field": 12602.6667,
    "runtime_evidence_gain_per_1k_tokens": 0.4315,
    "token_efficiency_metric": 0.4315,
    "token_efficiency_direction": "higher_is_better",
    "token_efficiency_source": "diagnostics.performance.evidence_gain_per_1k_tokens",
    "finalization_invariant_failures": 0,
    "quality_gate_failures": 5,
    "quality_gate_failed_current": false,
    "quality_gate_blocked_current": false,
    "quality_gate_reason_current": null,
    "all_required_terminalized_current": true,
    "all_required_concrete_current": false,
    "concrete_completion_status_current": "in_progress",
    "confidence_min_threshold_current": 0.55,
    "global_confidence_payload": 0.5594,
    "global_confidence_gate_score": 0.5594,
    "global_confidence_source": "completion_gate",
    "global_confidence": 0.5594
  },
  "baseline": {
    "exact_match": 5,
    "semantic_match": 5,
    "total_fields": 12,
    "evidence_quality": 0.9,
    "low_quality_source_urls": null,
    "grounded_fields": 3,
    "tokens_used": 51214,
    "tokens_per_grounded_field": 17071.3333,
    "runtime_evidence_gain_per_1k_tokens": 0.383,
    "token_efficiency_metric": 0.383,
    "token_efficiency_direction": "higher_is_better",
    "token_efficiency_source": "diagnostics.performance.evidence_gain_per_1k_tokens",
    "finalization_invariant_failures": 0,
    "quality_gate_failures": 7,
    "quality_gate_failed_current": false,
    "quality_gate_blocked_current": false,
    "quality_gate_reason_current": null,
    "all_required_terminalized_current": true,
    "all_required_concrete_current": false,
    "concrete_completion_status_current": "in_progress",
    "confidence_min_threshold_current": 0.55,
    "global_confidence_payload": 0.5594,
    "global_confidence_gate_score": 0.5594,
    "global_confidence_source": "completion_gate",
    "global_confidence": 0.5594
  },
  "delta": {
    "exact_match_delta": 0,
    "semantic_match_delta": 0,
    "evidence_quality_delta": 0,
    "global_confidence_delta": 0,
    "quality_gate_failures_delta": -2,
    "tokens_used_delta": -13406,
    "tokens_per_grounded_field_delta": -4468.6667,
    "token_efficiency_metric_delta": 0.0485,
    "invariant_failures_delta": 0
  }
}