[
  {
    "id": "eval-001",
    "input": "Claim CLM-101: Auto collision, claimant John Martinez. Documents: police report, photos, repair estimate, medical records. Completeness: 100%. Damage vs estimate match: 89%. Fraud risk score: 18. Policy coverage match: 97%. Analyze this claim.",
    "expected_output": {
      "classification": "normal",
      "action": "approve",
      "urgency": "low"
    }
  },
  {
    "id": "eval-002",
    "input": "Claim CLM-102: Property water damage, claimant Lisa Park. Documents: photos, plumber report. Completeness: 55%. Damage vs estimate match: N/A (no estimate provided). Fraud risk score: 22. Policy coverage match: 94%. Analyze this claim.",
    "expected_output": {
      "classification": "warning",
      "action": "request_documents",
      "urgency": "medium"
    }
  },
  {
    "id": "eval-003",
    "input": "Claim CLM-103: Auto collision, claimant Ahmed Farouk. Documents: police report, photos, repair estimate, medical records. Completeness: 100%. Damage vs estimate match: 45%. Fraud risk score: 79. Policy coverage match: 88%. Analyze this claim.",
    "expected_output": {
      "classification": "critical",
      "action": "investigate",
      "urgency": "high"
    }
  },
  {
    "id": "eval-004",
    "input": "Claim CLM-104: Property fire, claimant Nina Johansson. Documents: fire department report, photos, repair estimate, inventory list. Completeness: 100%. Damage vs estimate match: 92%. Fraud risk score: 8. Policy coverage match: 100%. Analyze this claim.",
    "expected_output": {
      "classification": "normal",
      "action": "approve",
      "urgency": "low"
    }
  },
  {
    "id": "eval-005",
    "input": "Claim CLM-105: Auto theft, claimant Derek Thompson. Documents: police report only. Completeness: 40%. Damage vs estimate match: N/A. Fraud risk score: 61. Policy coverage match: 75%. Analyze this claim.",
    "expected_output": {
      "classification": "critical",
      "action": "investigate",
      "urgency": "high"
    }
  },
  {
    "id": "eval-006",
    "input": "Claim CLM-106: Property water damage, claimant Rosa Gutierrez. Documents: photos, plumber report, repair estimate, inventory list. Completeness: 100%. Damage vs estimate match: 83%. Fraud risk score: 25. Policy coverage match: 91%. Analyze this claim.",
    "expected_output": {
      "classification": "normal",
      "action": "approve",
      "urgency": "low"
    }
  },
  {
    "id": "eval-007",
    "input": "Claim CLM-107: Auto collision, claimant Wei Zhang. Documents: police report, photos, repair estimate. Completeness: 85%. Damage vs estimate match: 61%. Fraud risk score: 53. Policy coverage match: 93%. Analyze this claim.",
    "expected_output": {
      "classification": "warning",
      "action": "review",
      "urgency": "medium"
    }
  },
  {
    "id": "eval-008",
    "input": "Claim CLM-108: Property fire, claimant Tom Nakamura. Documents: fire department report, photos. Completeness: 65%. Damage vs estimate match: N/A. Fraud risk score: 33. Policy coverage match: 100%. Analyze this claim.",
    "expected_output": {
      "classification": "warning",
      "action": "request_documents",
      "urgency": "medium"
    }
  },
  {
    "id": "eval-009",
    "input": "Claim CLM-109: Auto collision, claimant Priya Sharma. Documents: police report, photos, repair estimate, medical records. Completeness: 100%. Damage vs estimate match: 38%. Fraud risk score: 85. Policy coverage match: 60%. Analyze this claim.",
    "expected_output": {
      "classification": "critical",
      "action": "deny_or_investigate",
      "urgency": "high"
    }
  },
  {
    "id": "eval-010",
    "input": "Claim CLM-110: Auto collision, claimant Marcus Johnson. Documents: police report, photos, repair estimate, dashcam footage. Completeness: 100%. Damage vs estimate match: 94%. Fraud risk score: 5. Policy coverage match: 100%. Analyze this claim.",
    "expected_output": {
      "classification": "normal",
      "action": "approve",
      "urgency": "low"
    }
  }
]
