{
  "dataset_metadata": {
    "name": "AI OCR Performance & Accuracy Matrix 2026",
    "provider": "JpgToText AI Engine Research Lab",
    "last_updated": "2026-05-29",
    "license": "Creative Commons Attribution 4.0"
  },
  "benchmarks": [
    {
      "language": "English (Latin)",
      "client_side_accuracy": 0.994,
      "server_side_accuracy_comparison": 0.995,
      "average_processing_time_ms": 1120,
      "character_recognition_rate": "1500 chars/sec"
    },
    {
      "language": "Vietnamese (Diacritics)",
      "client_side_accuracy": 0.985,
      "server_side_accuracy_comparison": 0.987,
      "average_processing_time_ms": 1450,
      "character_recognition_rate": "1100 chars/sec"
    },
    {
      "language": "Spanish",
      "client_side_accuracy": 0.991,
      "server_side_accuracy_comparison": 0.992,
      "average_processing_time_ms": 1180,
      "character_recognition_rate": "1400 chars/sec"
    },
    {
      "language": "Chinese (Simplified)",
      "client_side_accuracy": 0.972,
      "server_side_accuracy_comparison": 0.978,
      "average_processing_time_ms": 2100,
      "character_recognition_rate": "750 chars/sec"
    },
    {
      "language": "Korean",
      "client_side_accuracy": 0.981,
      "server_side_accuracy_comparison": 0.984,
      "average_processing_time_ms": 1850,
      "character_recognition_rate": "890 chars/sec"
    },
    {
      "language": "Japanese",
      "client_side_accuracy": 0.969,
      "server_side_accuracy_comparison": 0.975,
      "average_processing_time_ms": 2300,
      "character_recognition_rate": "680 chars/sec"
    }
  ],
  "testing_environment": {
    "engine": "Tesseract.js v5 with JpgToText Auto-Preprocessors",
    "hardware_specs": "Client-side WebAssembly CPU Threading (Average core count: 4)",
    "sample_size": "5,000 standard-layout document pages (digital and physically scanned)"
  }
}
