{
  "assamese": {
    "top_substitutions": [
      {
        "ref": "অ",
        "hyp": "অঁ",
        "count": 13
      },
      {
        "ref": "অঁ",
        "hyp": "অ",
        "count": 8
      },
      {
        "ref": "চাগৈ",
        "hyp": "চাগে",
        "count": 4
      },
      {
        "ref": "লিখাৰ",
        "hyp": "লেখাৰ",
        "count": 4
      },
      {
        "ref": "ত",
        "hyp": "তো",
        "count": 4
      },
      {
        "ref": "আৰু",
        "hyp": "মই",
        "count": 4
      },
      {
        "ref": "ধৰি",
        "hyp": "লওক",
        "count": 4
      },
      {
        "ref": "লিখা",
        "hyp": "লেখা",
        "count": 4
      },
      {
        "ref": "সঁচাকৈয়ে",
        "hyp": "সঁচাকৈ",
        "count": 3
      },
      {
        "ref": "লৈ",
        "hyp": "যায়",
        "count": 3
      },
      {
        "ref": "পোৱা",
        "hyp": "যায়",
        "count": 3
      },
      {
        "ref": "অলপ",
        "hyp": "পিছত",
        "count": 3
      },
      {
        "ref": "জনসংখ্যা",
        "hyp": "জনসাংখ্যা",
        "count": 3
      },
      {
        "ref": "হয়",
        "hyp": "কৰা",
        "count": 3
      },
      {
        "ref": "unintelligible",
        "hyp": "হয়",
        "count": 3
      },
      {
        "ref": "যদি",
        "hyp": "মই",
        "count": 3
      },
      {
        "ref": "কথা",
        "hyp": "আছে",
        "count": 3
      },
      {
        "ref": "এই",
        "hyp": "সেই",
        "count": 3
      },
      {
        "ref": "হব",
        "hyp": "হবো",
        "count": 3
      },
      {
        "ref": "তাৰ",
        "hyp": "তাৰপিছত",
        "count": 3
      }
    ],
    "top_insertions": [
      {
        "word": "সেই",
        "count": 21
      },
      {
        "word": "অঁ",
        "count": 20
      },
      {
        "word": "এই",
        "count": 17
      },
      {
        "word": "আৰু",
        "count": 15
      },
      {
        "word": "পৰা",
        "count": 14
      },
      {
        "word": "হয়",
        "count": 13
      },
      {
        "word": "অ",
        "count": 12
      },
      {
        "word": "মই",
        "count": 11
      },
      {
        "word": "মানে",
        "count": 10
      },
      {
        "word": "কাৰণে",
        "count": 9
      },
      {
        "word": "আছে",
        "count": 9
      },
      {
        "word": "ন",
        "count": 9
      },
      {
        "word": "বা",
        "count": 9
      },
      {
        "word": "এনেকুৱা",
        "count": 9
      },
      {
        "word": "হৈ",
        "count": 8
      },
      {
        "word": "এটা",
        "count": 8
      },
      {
        "word": "লেখাৰ",
        "count": 8
      },
      {
        "word": "ভাল",
        "count": 8
      },
      {
        "word": "পিছত",
        "count": 7
      },
      {
        "word": "মোৰ",
        "count": 7
      }
    ],
    "top_deletions": [
      {
        "word": "অঁ",
        "count": 42
      },
      {
        "word": "unintelligible",
        "count": 28
      },
      {
        "word": "অ",
        "count": 19
      },
      {
        "word": "আৰু",
        "count": 15
      },
      {
        "word": "ভিডিঅ",
        "count": 14
      },
      {
        "word": "হয়",
        "count": 12
      },
      {
        "word": "এই",
        "count": 12
      },
      {
        "word": "হেৰি",
        "count": 10
      },
      {
        "word": "পৰা",
        "count": 9
      },
      {
        "word": "নাই",
        "count": 9
      },
      {
        "word": "জনসংখ্যা",
        "count": 9
      },
      {
        "word": "তাৰ",
        "count": 9
      },
      {
        "word": "লিখা",
        "count": 9
      },
      {
        "word": "কৰি",
        "count": 8
      },
      {
        "word": "সেই",
        "count": 8
      },
      {
        "word": "এতিয়া",
        "count": 7
      },
      {
        "word": "দাঁতৰ",
        "count": 7
      },
      {
        "word": "নে",
        "count": 7
      },
      {
        "word": "সমস্যা",
        "count": 7
      },
      {
        "word": "লিখাৰ",
        "count": 7
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 0,
      "punctuation_only_count": 2,
      "spacing_tokenization_count": 401,
      "entity_mismatch_count": 0,
      "script_confusion_count": 9,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "as_0026",
        "as_0094",
        "as_0354"
      ],
      "best_samples": [
        "as_0001",
        "as_0013",
        "as_0014"
      ],
      "numeric_mismatch_samples": [],
      "entity_mismatch_samples": []
    }
  },
  "bengali": {
    "top_substitutions": [
      {
        "ref": "মো",
        "hyp": "মৌ",
        "count": 8
      },
      {
        "ref": "দুই",
        "hyp": "দু",
        "count": 6
      },
      {
        "ref": "তাঁর",
        "hyp": "তার",
        "count": 5
      },
      {
        "ref": "এ",
        "hyp": "এই",
        "count": 5
      },
      {
        "ref": "অতিথি",
        "hyp": "অতি��ি",
        "count": 5
      },
      {
        "ref": "ড",
        "hyp": "ডগ",
        "count": 5
      },
      {
        "ref": "এক",
        "hyp": "একশো",
        "count": 4
      },
      {
        "ref": "বার",
        "hyp": "বারো",
        "count": 3
      },
      {
        "ref": "প্রাক্তন",
        "hyp": "প্রাপ্তন",
        "count": 3
      },
      {
        "ref": "অব",
        "hyp": "অফ",
        "count": 3
      },
      {
        "ref": "কোনও",
        "hyp": "কোনো",
        "count": 3
      },
      {
        "ref": "এক",
        "hyp": "উনিশশো",
        "count": 3
      },
      {
        "ref": "তিন",
        "hyp": "তিনশো",
        "count": 3
      },
      {
        "ref": "ডা",
        "hyp": "দা",
        "count": 3
      },
      {
        "ref": "মোহাম্মদ",
        "hyp": "মহাম্মদ",
        "count": 2
      },
      {
        "ref": "ভাল",
        "hyp": "ভালো",
        "count": 2
      },
      {
        "ref": "পনের",
        "hyp": "পনেরো",
        "count": 2
      },
      {
        "ref": "ত্রিশ",
        "hyp": "তিরিশ",
        "count": 2
      },
      {
        "ref": "এখনও",
        "hyp": "এখনো",
        "count": 2
      },
      {
        "ref": "একনজরে",
        "hyp": "এক",
        "count": 2
      }
    ],
    "top_insertions": [
      {
        "word": "মৌ",
        "count": 14
      },
      {
        "word": "এই",
        "count": 11
      },
      {
        "word": "বি",
        "count": 9
      },
      {
        "word": "সহ",
        "count": 7
      },
      {
        "word": "তার",
        "count": 7
      },
      {
        "word": "দু",
        "count": 7
      },
      {
        "word": "ডগ",
        "count": 7
      },
      {
        "word": "এ",
        "count": 7
      },
      {
        "word": "এস",
        "count": 7
      },
      {
        "word": "এন",
        "count": 7
      },
      {
        "word": "একশো",
        "count": 6
      },
      {
        "word": "প্রাপ্তন",
        "count": 6
      },
      {
        "word": "দা",
        "count": 6
      },
      {
        "word": "পি",
        "count": 6
      },
      {
        "word": "ম",
        "count": 6
      },
      {
        "word": "থেকে",
        "count": 5
      },
      {
        "word": "অতি��ি",
        "count": 5
      },
      {
        "word": "করোনা",
        "count": 5
      },
      {
        "word": "করে",
        "count": 5
      },
      {
        "word": "কোনো",
        "count": 5
      }
    ],
    "top_deletions": [
      {
        "word": "মো",
        "count": 37
      },
      {
        "word": "শো",
        "count": 21
      },
      {
        "word": "ড",
        "count": 17
      },
      {
        "word": "ডা",
        "count": 16
      },
      {
        "word": "দুই",
        "count": 11
      },
      {
        "word": "এক",
        "count": 9
      },
      {
        "word": "নয়",
        "count": 8
      },
      {
        "word": "এ",
        "count": 7
      },
      {
        "word": "প্রাক্তন",
        "count": 7
      },
      {
        "word": "জন",
        "count": 6
      },
      {
        "word": "ও",
        "count": 6
      },
      {
        "word": "তাঁর",
        "count": 6
      },
      {
        "word": "অতিথি",
        "count": 6
      },
      {
        "word": "বার",
        "count": 5
      },
      {
        "word": "হাজার",
        "count": 5
      },
      {
        "word": "তিন",
        "count": 5
      },
      {
        "word": "আহ্বায়ক",
        "count": 5
      },
      {
        "word": "ত্রিশ",
        "count": 4
      },
      {
        "word": "দশ",
        "count": 4
      },
      {
        "word": "এর",
        "count": 4
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 5,
      "punctuation_only_count": 5,
      "spacing_tokenization_count": 445,
      "entity_mismatch_count": 0,
      "script_confusion_count": 0,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "844424932447916-1175-f",
        "844424930527582-789-m",
        "844424931098749-952-f"
      ],
      "best_samples": [
        "844424932351458-1005-f",
        "844424931519963-711-f",
        "844424930661655-1175-f"
      ],
      "numeric_mismatch_samples": [
        "844424931387503-1038-m",
        "844424932372663-1005-f",
        "844424931144609-647-f"
      ],
      "entity_mismatch_samples": []
    }
  },
  "english": {
    "top_substitutions": [
      {
        "ref": "the",
        "hyp": "and",
        "count": 7
      },
      {
        "ref": "of",
        "hyp": "the",
        "count": 7
      },
      {
        "ref": "centres",
        "hyp": "centers",
        "count": 6
      },
      {
        "ref": "the",
        "hyp": "of",
        "count": 5
      },
      {
        "ref": "rs",
        "hyp": "rupees",
        "count": 4
      },
      {
        "ref": "wow",
        "hyp": "now",
        "count": 3
      },
      {
        "ref": "are",
        "hyp": "there",
        "count": 3
      },
      {
        "ref": "the",
        "hyp": "by",
        "count": 3
      },
      {
        "ref": "my",
        "hyp": "in",
        "count": 3
      },
      {
        "ref": "of",
        "hyp": "a",
        "count": 3
      },
      {
        "ref": "the",
        "hyp": "in",
        "count": 3
      },
      {
        "ref": "my",
        "hyp": "from",
        "count": 3
      },
      {
        "ref": "the",
        "hyp": "to",
        "count": 3
      },
      {
        "ref": "to",
        "hyp": "the",
        "count": 3
      },
      {
        "ref": "one",
        "hyp": "is",
        "count": 3
      },
      {
        "ref": "a",
        "hyp": "it",
        "count": 3
      },
      {
        "ref": "then",
        "hyp": "i",
        "count": 3
      },
      {
        "ref": "well",
        "hyp": "as",
        "count": 3
      },
      {
        "ref": "to",
        "hyp": "one",
        "count": 2
      },
      {
        "ref": "to",
        "hyp": "a",
        "count": 2
      }
    ],
    "top_insertions": [
      {
        "word": "two",
        "count": 41
      },
      {
        "word": "four",
        "count": 38
      },
      {
        "word": "three",
        "count": 33
      },
      {
        "word": "five",
        "count": 31
      },
      {
        "word": "the",
        "count": 30
      },
      {
        "word": "nine",
        "count": 25
      },
      {
        "word": "a",
        "count": 25
      },
      {
        "word": "six",
        "count": 25
      },
      {
        "word": "eight",
        "count": 23
      },
      {
        "word": "one",
        "count": 23
      },
      {
        "word": "i",
        "count": 22
      },
      {
        "word": "and",
        "count": 21
      },
      {
        "word": "seven",
        "count": 19
      },
      {
        "word": "okay",
        "count": 18
      },
      {
        "word": "thousand",
        "count": 15
      },
      {
        "word": "in",
        "count": 15
      },
      {
        "word": "we",
        "count": 15
      },
      {
        "word": "o",
        "count": 15
      },
      {
        "word": "can",
        "count": 13
      },
      {
        "word": "m",
        "count": 13
      }
    ],
    "top_deletions": [
      {
        "word": "a",
        "count": 12
      },
      {
        "word": "centres",
        "count": 10
      },
      {
        "word": "in",
        "count": 9
      },
      {
        "word": "is",
        "count": 8
      },
      {
        "word": "the",
        "count": 8
      },
      {
        "word": "rs",
        "count": 7
      },
      {
        "word": "and",
        "count": 6
      },
      {
        "word": "wow",
        "count": 5
      },
      {
        "word": "are",
        "count": 5
      },
      {
        "word": "skip",
        "count": 4
      },
      {
        "word": "i",
        "count": 4
      },
      {
        "word": "cat",
        "count": 4
      },
      {
        "word": "for",
        "count": 4
      },
      {
        "word": "it",
        "count": 4
      },
      {
        "word": "list",
        "count": 4
      },
      {
        "word": "of",
        "count": 4
      },
      {
        "word": "agree",
        "count": 4
      },
      {
        "word": "to",
        "count": 4
      },
      {
        "word": "has",
        "count": 3
      },
      {
        "word": "forward",
        "count": 3
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 57,
      "punctuation_only_count": 109,
      "spacing_tokenization_count": 308,
      "entity_mismatch_count": 0,
      "script_confusion_count": 0,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "en_0064",
        "en_0227",
        "en_0373"
      ],
      "best_samples": [
        "en_0003",
        "en_0004",
        "en_0015"
      ],
      "numeric_mismatch_samples": [
        "en_0006",
        "en_0013",
        "en_0019"
      ],
      "entity_mismatch_samples": []
    }
  },
  "gujarati": {
    "top_substitutions": [
      {
        "ref": "તેમ",
        "hyp": "મજૂરી",
        "count": 6
      },
      {
        "ref": "જ",
        "hyp": "તેમજ",
        "count": 5
      },
      {
        "ref": "ખેતમજૂરી",
        "hyp": "ખેત",
        "count": 5
      },
      {
        "ref": "હતાં",
        "hyp": "હતા",
        "count": 4
      },
      {
        "ref": "એક",
        "hyp": "ઓગણીસો",
        "count": 3
      },
      {
        "ref": "ખેતમજૂરી",
        "hyp": "ખેતી",
        "count": 3
      },
      {
        "ref": "શકો",
        "hyp": "છો",
        "count": 3
      },
      {
        "ref": "થઇ",
        "hyp": "થઈ",
        "count": 3
      },
      {
        "ref": "છે",
        "hyp": "આવે",
        "count": 3
      },
      {
        "ref": "અને",
        "hyp": "છે",
        "count": 3
      },
      {
        "ref": "કહ્યુ",
        "hyp": "કહ્યું",
        "count": 2
      },
      {
        "ref": "છે",
        "hyp": "હોય",
        "count": 2
      },
      {
        "ref": "જોઇએ",
        "hyp": "જોઈએ",
        "count": 2
      },
      {
        "ref": "તેનાં",
        "hyp": "તેના",
        "count": 2
      },
      {
        "ref": "નહિ",
        "hyp": "નહીં",
        "count": 2
      },
      {
        "ref": "છે",
        "hyp": "રહે",
        "count": 2
      },
      {
        "ref": "લોકોનો",
        "hyp": "ગામના",
        "count": 2
      },
      {
        "ref": "વ્યવસાય",
        "hyp": "મુખ્ય",
        "count": 2
      },
      {
        "ref": "તેમ",
        "hyp": "ખેત",
        "count": 2
      },
      {
        "ref": "જ",
        "hyp": "મજૂરી",
        "count": 2
      }
    ],
    "top_insertions": [
      {
        "word": "એ",
        "count": 10
      },
      {
        "word": "મજૂરી",
        "count": 9
      },
      {
        "word": "તેમજ",
        "count": 7
      },
      {
        "word": "ખેત",
        "count": 7
      },
      {
        "word": "એક",
        "count": 6
      },
      {
        "word": "છે",
        "count": 6
      },
      {
        "word": "તેમાં",
        "count": 6
      },
      {
        "word": "હતા",
        "count": 6
      },
      {
        "word": "થઈ",
        "count": 5
      },
      {
        "word": "હતું",
        "count": 5
      },
      {
        "word": "જ",
        "count": 5
      },
      {
        "word": "આ",
        "count": 5
      },
      {
        "word": "ઉપર",
        "count": 4
      },
      {
        "word": "કોઈ",
        "count": 4
      },
      {
        "word": "પી",
        "count": 4
      },
      {
        "word": "એન",
        "count": 4
      },
      {
        "word": "ઓગણીસસો",
        "count": 4
      },
      {
        "word": "શેર",
        "count": 3
      },
      {
        "word": "વાર",
        "count": 3
      },
      {
        "word": "બસ",
        "count": 3
      }
    ],
    "top_deletions": [
      {
        "word": "જ",
        "count": 14
      },
      {
        "word": "એક",
        "count": 14
      },
      {
        "word": "સો",
        "count": 14
      },
      {
        "word": "ખેતમજૂરી",
        "count": 13
      },
      {
        "word": "તેમ",
        "count": 13
      },
      {
        "word": "હજાર",
        "count": 12
      },
      {
        "word": "માં",
        "count": 11
      },
      {
        "word": "નવ",
        "count": 9
      },
      {
        "word": "ના",
        "count": 8
      },
      {
        "word": "હતાં",
        "count": 8
      },
      {
        "word": "અને",
        "count": 5
      },
      {
        "word": "વ્યવસાય",
        "count": 5
      },
      {
        "word": "તેમણે",
        "count": 4
      },
      {
        "word": "બાદ",
        "count": 4
      },
      {
        "word": "પર",
        "count": 4
      },
      {
        "word": "ની",
        "count": 4
      },
      {
        "word": "આ",
        "count": 4
      },
      {
        "word": "કે",
        "count": 3
      },
      {
        "word": "થઇ",
        "count": 3
      },
      {
        "word": "પશુપાલન",
        "count": 3
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 3,
      "punctuation_only_count": 0,
      "spacing_tokenization_count": 437,
      "entity_mismatch_count": 0,
      "script_confusion_count": 0,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "844424933554263-550-m",
        "844424931498656-382-f",
        "844424933318896-1051-m"
      ],
      "best_samples": [
        "844424930301136-1139-m",
        "844424930924533-24-f",
        "844424931431659-825-f"
      ],
      "numeric_mismatch_samples": [
        "844424933570922-179-m",
        "844424933579942-179-m",
        "844424933112130-265-m"
      ],
      "entity_mismatch_samples": []
    }
  },
  "hindi": {
    "top_substitutions": [
      {
        "ref": "हैं",
        "hyp": "है",
        "count": 9
      },
      {
        "ref": "यहां",
        "hyp": "यहाँ",
        "count": 8
      },
      {
        "ref": "वहां",
        "hyp": "वहाँ",
        "count": 6
      },
      {
        "ref": "है",
        "hyp": "रहा",
        "count": 4
      },
      {
        "ref": "रूप",
        "hyp": "के",
        "count": 4
      },
      {
        "ref": "में",
        "hyp": "रूप",
        "count": 4
      },
      {
        "ref": "है",
        "hyp": "हैं",
        "count": 4
      },
      {
        "ref": "के",
        "hyp": "की",
        "count": 4
      },
      {
        "ref": "है",
        "hyp": "गया",
        "count": 4
      },
      {
        "ref": "साथ",
        "hyp": "के",
        "count": 4
      },
      {
        "ref": "गया",
        "hyp": "है",
        "count": 4
      },
      {
        "ref": "गांव",
        "hyp": "गाँव",
        "count": 3
      },
      {
        "ref": "लिए",
        "hyp": "के",
        "count": 3
      },
      {
        "ref": "हज़ार",
        "hyp": "सौ",
        "count": 3
      },
      {
        "ref": "सौ",
        "hyp": "में",
        "count": 3
      },
      {
        "ref": "हूं",
        "hyp": "हूँ",
        "count": 3
      },
      {
        "ref": "यह",
        "hyp": "ये",
        "count": 3
      },
      {
        "ref": "हैं",
        "hyp": "सकते",
        "count": 3
      },
      {
        "ref": "ये",
        "hyp": "यह",
        "count": 3
      },
      {
        "ref": "काफी",
        "hyp": "काफ़ी",
        "count": 3
      }
    ],
    "top_insertions": [
      {
        "word": "है",
        "count": 21
      },
      {
        "word": "की",
        "count": 11
      },
      {
        "word": "हैं",
        "count": 8
      },
      {
        "word": "में",
        "count": 8
      },
      {
        "word": "यहाँ",
        "count": 8
      },
      {
        "word": "के",
        "count": 8
      },
      {
        "word": "और",
        "count": 7
      },
      {
        "word": "ही",
        "count": 6
      },
      {
        "word": "वहाँ",
        "count": 6
      },
      {
        "word": "एक",
        "count": 6
      },
      {
        "word": "का",
        "count": 6
      },
      {
        "word": "से",
        "count": 5
      },
      {
        "word": "रहा",
        "count": 5
      },
      {
        "word": "सी",
        "count": 5
      },
      {
        "word": "ये",
        "count": 4
      },
      {
        "word": "पर",
        "count": 4
      },
      {
        "word": "हूँ",
        "count": 4
      },
      {
        "word": "आई",
        "count": 4
      },
      {
        "word": "यह",
        "count": 4
      },
      {
        "word": "काफ़ी",
        "count": 4
      }
    ],
    "top_deletions": [
      {
        "word": "हैं",
        "count": 15
      },
      {
        "word": "के",
        "count": 10
      },
      {
        "word": "है",
        "count": 9
      },
      {
        "word": "यहां",
        "count": 9
      },
      {
        "word": "में",
        "count": 9
      },
      {
        "word": "यह",
        "count": 8
      },
      {
        "word": "वहां",
        "count": 6
      },
      {
        "word": "एक",
        "count": 5
      },
      {
        "word": "कर",
        "count": 5
      },
      {
        "word": "भी",
        "count": 5
      },
      {
        "word": "ज्यादा",
        "count": 4
      },
      {
        "word": "हज़ार",
        "count": 4
      },
      {
        "word": "काफी",
        "count": 4
      },
      {
        "word": "और",
        "count": 3
      },
      {
        "word": "गांव",
        "count": 3
      },
      {
        "word": "कहीं",
        "count": 3
      },
      {
        "word": "ने",
        "count": 3
      },
      {
        "word": "हूं",
        "count": 3
      },
      {
        "word": "अपने",
        "count": 3
      },
      {
        "word": "ये",
        "count": 3
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 0,
      "punctuation_only_count": 1,
      "spacing_tokenization_count": 395,
      "entity_mismatch_count": 0,
      "script_confusion_count": 1,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "844424933459384-572-m",
        "844424933481854-705-m",
        "844424931066545-326-f"
      ],
      "best_samples": [
        "844424932362236-384-f",
        "844424930716702-929-m",
        "844424931281518-277-f"
      ],
      "numeric_mismatch_samples": [],
      "entity_mismatch_samples": []
    }
  },
  "kannada": {
    "top_substitutions": [
      {
        "ref": "ಒಂದು",
        "hyp": "ಸಾವಿರದ",
        "count": 6
      },
      {
        "ref": "ಸಾವಿರದ",
        "hyp": "ಒಂಬೈನೂರ",
        "count": 5
      },
      {
        "ref": "ವಿವಿಧ",
        "hyp": "ವಿವಿ��",
        "count": 3
      },
      {
        "ref": "ಹೆಚ್ಚಳಗೊಂಡ",
        "hyp": "ಎಚ್ಚರಗೊಂಡ",
        "count": 2
      },
      {
        "ref": "ಭಾರಿ",
        "hyp": "ಬಾರಿ",
        "count": 2
      },
      {
        "ref": "ಎರಡೂ",
        "hyp": "ಎರಡು",
        "count": 2
      },
      {
        "ref": "ತುಂಬಾ",
        "hyp": "ತುಂಬ",
        "count": 2
      },
      {
        "ref": "ಹಾಗು",
        "hyp": "ಹಾಗೂ",
        "count": 2
      },
      {
        "ref": "ಅವರು",
        "hyp": "ಅವರ",
        "count": 2
      },
      {
        "ref": "ಇನ್ನೂ",
        "hyp": "ಇನ್ನು",
        "count": 2
      },
      {
        "ref": "ಆದರೆ",
        "hyp": "ಅದರ",
        "count": 2
      },
      {
        "ref": "ಐರಿಶ್",
        "hyp": "ಐರಿಷ್",
        "count": 2
      },
      {
        "ref": "ಸೂಚನೆ",
        "hyp": "ಸೂ��ನೆ",
        "count": 2
      },
      {
        "ref": "ಸೊನ್ನೆ",
        "hyp": "ಸಾವಿರದ",
        "count": 2
      },
      {
        "ref": "ಒಂದು",
        "hyp": "ಒಂಬೈನೂರ",
        "count": 2
      },
      {
        "ref": "ಸಾವಿರದ",
        "hyp": "ಏಳು",
        "count": 2
      },
      {
        "ref": "ಎಚ್ಪಿಸಿಎಲ್",
        "hyp": "ಎಚ್",
        "count": 1
      },
      {
        "ref": "ಶೇರುಗಳ",
        "hyp": "ಡಿ",
        "count": 1
      },
      {
        "ref": "ದರದಲ್ಲಿ",
        "hyp": "ಸಿ",
        "count": 1
      },
      {
        "ref": "ಗಣನೀಯ",
        "hyp": "ಎಲ್",
        "count": 1
      }
    ],
    "top_insertions": [
      {
        "word": "ಸಿ",
        "count": 9
      },
      {
        "word": "ಅವರು",
        "count": 7
      },
      {
        "word": "ಒಂಬೈನೂರ",
        "count": 7
      },
      {
        "word": "ಎಸ್",
        "count": 6
      },
      {
        "word": "ಒಂದು",
        "count": 6
      },
      {
        "word": "ಅವರ",
        "count": 6
      },
      {
        "word": "ಡಿ",
        "count": 5
      },
      {
        "word": "ಎರಡು",
        "count": 5
      },
      {
        "word": "ಆ",
        "count": 5
      },
      {
        "word": "ಎಲ್ಲ",
        "count": 5
      },
      {
        "word": "ಬಿ",
        "count": 5
      },
      {
        "word": "ಐ",
        "count": 4
      },
      {
        "word": "ಎ",
        "count": 4
      },
      {
        "word": "ಈ",
        "count": 4
      },
      {
        "word": "ಥರ",
        "count": 4
      },
      {
        "word": "ವಿವಿ��",
        "count": 4
      },
      {
        "word": "ತುಂಬ",
        "count": 4
      },
      {
        "word": "ಮನೆ",
        "count": 3
      },
      {
        "word": "ಆಯ್ಕೆ",
        "count": 3
      },
      {
        "word": "ಕಂಡು",
        "count": 3
      }
    ],
    "top_deletions": [
      {
        "word": "ನೂರ",
        "count": 11
      },
      {
        "word": "ಒಂದು",
        "count": 10
      },
      {
        "word": "ನಲ್ಲಿ",
        "count": 7
      },
      {
        "word": "ಅವರು",
        "count": 7
      },
      {
        "word": "ಒಂಬತ್ತು",
        "count": 7
      },
      {
        "word": "ನ",
        "count": 5
      },
      {
        "word": "ರ",
        "count": 5
      },
      {
        "word": "ಹಾಗೂ",
        "count": 5
      },
      {
        "word": "ರಲ್ಲಿ",
        "count": 5
      },
      {
        "word": "ವಿವಿಧ",
        "count": 4
      },
      {
        "word": "ತುಂಬಾ",
        "count": 4
      },
      {
        "word": "ಸೂಚನೆ",
        "count": 4
      },
      {
        "word": "ಬಾಲಿವುಡ್",
        "count": 3
      },
      {
        "word": "ಅನ್ನು",
        "count": 3
      },
      {
        "word": "ಎರಡೂ",
        "count": 3
      },
      {
        "word": "ಎಲ್ಲಾ",
        "count": 3
      },
      {
        "word": "ಎಂದು",
        "count": 3
      },
      {
        "word": "ಭಾರಿ",
        "count": 3
      },
      {
        "word": "ನೀವು",
        "count": 3
      },
      {
        "word": "ಹಾಗು",
        "count": 3
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 1,
      "punctuation_only_count": 0,
      "spacing_tokenization_count": 464,
      "entity_mismatch_count": 0,
      "script_confusion_count": 0,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "844424933323571-169-m",
        "844424933351301-678-m",
        "844424933306172-678-m"
      ],
      "best_samples": [
        "844424930664000-324-f",
        "844424930301379-519-f",
        "844424931000839-62-f"
      ],
      "numeric_mismatch_samples": [
        "844424930318847-734-f"
      ],
      "entity_mismatch_samples": []
    }
  },
  "malayalam": {
    "top_substitutions": [
      {
        "ref": "സര്ക്കാര്",
        "hyp": "സർക്കാർ",
        "count": 10
      },
      {
        "ref": "എന്നാല്",
        "hyp": "എന്നാൽ",
        "count": 8
      },
      {
        "ref": "ഇന്ത്യന്",
        "hyp": "ഇന്ത്യൻ",
        "count": 6
      },
      {
        "ref": "വിവിധ",
        "hyp": "വിവി��",
        "count": 5
      },
      {
        "ref": "അതേസമയം",
        "hyp": "അതേ",
        "count": 5
      },
      {
        "ref": "പേരില്",
        "hyp": "പേരിൽ",
        "count": 4
      },
      {
        "ref": "കൂടുതല്",
        "hyp": "കൂടുതൽ",
        "count": 4
      },
      {
        "ref": "തുടര്ന്ന്",
        "hyp": "തുടർന്ന്",
        "count": 4
      },
      {
        "ref": "രണ്ടു",
        "hyp": "രണ്ട്",
        "count": 4
      },
      {
        "ref": "താന്",
        "hyp": "താൻ",
        "count": 4
      },
      {
        "ref": "തെരഞ്ഞെടുപ്പ്",
        "hyp": "തിരഞ്ഞെടുപ്പ്",
        "count": 4
      },
      {
        "ref": "അടിസ്ഥാനത്തില്",
        "hyp": "അടിസ്ഥാനത്തിൽ",
        "count": 3
      },
      {
        "ref": "ഏതു",
        "hyp": "ഏത്",
        "count": 3
      },
      {
        "ref": "നല്കിയ",
        "hyp": "നൽകിയ",
        "count": 3
      },
      {
        "ref": "ഒരാള്",
        "hyp": "ഒരാൾ",
        "count": 3
      },
      {
        "ref": "അവര്",
        "hyp": "അവർ",
        "count": 3
      },
      {
        "ref": "കോടതിയില്",
        "hyp": "കോടതിയിൽ",
        "count": 3
      },
      {
        "ref": "മെഡിക്കല്",
        "hyp": "മെഡിക്കൽ",
        "count": 3
      },
      {
        "ref": "കേരളത്തില്",
        "hyp": "കേരളത്തിൽ",
        "count": 3
      },
      {
        "ref": "ഇപ്പോള്",
        "hyp": "ഇപ്പോൾ",
        "count": 3
      }
    ],
    "top_insertions": [
      {
        "word": "എന്ന്",
        "count": 16
      },
      {
        "word": "പി",
        "count": 13
      },
      {
        "word": "സർക്കാർ",
        "count": 12
      },
      {
        "word": "ഡി",
        "count": 11
      },
      {
        "word": "ഒരു",
        "count": 9
      },
      {
        "word": "എന്നാൽ",
        "count": 9
      },
      {
        "word": "എം",
        "count": 9
      },
      {
        "word": "ബി",
        "count": 8
      },
      {
        "word": "ഇന്ത്യൻ",
        "count": 7
      },
      {
        "word": "രണ്ട്",
        "count": 7
      },
      {
        "word": "തുടർന്ന്",
        "count": 7
      },
      {
        "word": "എ",
        "count": 7
      },
      {
        "word": "എസ്",
        "count": 7
      },
      {
        "word": "ഐ",
        "count": 7
      },
      {
        "word": "എൻ",
        "count": 7
      },
      {
        "word": "എന്ന",
        "count": 7
      },
      {
        "word": "ഈ",
        "count": 7
      },
      {
        "word": "എഫ്",
        "count": 6
      },
      {
        "word": "അതേ",
        "count": 6
      },
      {
        "word": "താൻ",
        "count": 6
      }
    ],
    "top_deletions": [
      {
        "word": "സര്ക്കാര്",
        "count": 12
      },
      {
        "word": "എന്നാല്",
        "count": 8
      },
      {
        "word": "ഇന്ത്യന്",
        "count": 7
      },
      {
        "word": "താന്",
        "count": 7
      },
      {
        "word": "കൂടുതല്",
        "count": 6
      },
      {
        "word": "വിവിധ",
        "count": 5
      },
      {
        "word": "അതേസമയം",
        "count": 5
      },
      {
        "word": "തെരഞ്ഞെടുപ്പ്",
        "count": 5
      },
      {
        "word": "രണ്ടു",
        "count": 5
      },
      {
        "word": "അടിസ്ഥാനത്തില്",
        "count": 5
      },
      {
        "word": "ബി",
        "count": 4
      },
      {
        "word": "കേരളത്തില്",
        "count": 4
      },
      {
        "word": "പാര്ട്ടി",
        "count": 4
      },
      {
        "word": "പേരില്",
        "count": 4
      },
      {
        "word": "അവര്",
        "count": 4
      },
      {
        "word": "പൊലീസ്",
        "count": 4
      },
      {
        "word": "ഒരാള്",
        "count": 4
      },
      {
        "word": "തുടര്ന്ന്",
        "count": 4
      },
      {
        "word": "മെഡിക്കല്",
        "count": 4
      },
      {
        "word": "ഇപ്പോള്",
        "count": 4
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 0,
      "punctuation_only_count": 3,
      "spacing_tokenization_count": 492,
      "entity_mismatch_count": 0,
      "script_confusion_count": 1,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "844424930732545-462-f",
        "844424930436437-462-f",
        "844424931236419-653-f"
      ],
      "best_samples": [
        "844424931351478-802-f",
        "844424933055914-184-f",
        "844424930567466-1132-m"
      ],
      "numeric_mismatch_samples": [],
      "entity_mismatch_samples": []
    }
  },
  "marathi": {
    "top_substitutions": [
      {
        "ref": "एक",
        "hyp": "एकोणीसशे",
        "count": 11
      },
      {
        "ref": "आहेत",
        "hyp": "आहे",
        "count": 6
      },
      {
        "ref": "येथे",
        "hyp": "ये��े",
        "count": 5
      },
      {
        "ref": "एक",
        "hyp": "गाव",
        "count": 5
      },
      {
        "ref": "गाव",
        "hyp": "आहे",
        "count": 5
      },
      {
        "ref": "तालुक्यातील",
        "hyp": "एक",
        "count": 4
      },
      {
        "ref": "सुरु",
        "hyp": "सुरू",
        "count": 4
      },
      {
        "ref": "आहे",
        "hyp": "आला",
        "count": 3
      },
      {
        "ref": "डॉ",
        "hyp": "डॉक्टर",
        "count": 3
      },
      {
        "ref": "नांदेड",
        "hyp": "नां��ेड",
        "count": 3
      },
      {
        "ref": "हजार",
        "hyp": "दोन",
        "count": 3
      },
      {
        "ref": "संमेलन",
        "hyp": "सं��ेलन",
        "count": 3
      },
      {
        "ref": "शंभर",
        "hyp": "एकशे",
        "count": 3
      },
      {
        "ref": "आहे",
        "hyp": "आले",
        "count": 3
      },
      {
        "ref": "विमानाला",
        "hyp": "वि��ानाला",
        "count": 3
      },
      {
        "ref": "हे",
        "hyp": "आहे",
        "count": 3
      },
      {
        "ref": "करीत",
        "hyp": "करत",
        "count": 2
      },
      {
        "ref": "करुन",
        "hyp": "करून",
        "count": 2
      },
      {
        "ref": "इ",
        "hyp": "इसवी",
        "count": 2
      },
      {
        "ref": "हजार",
        "hyp": "एकोणीसशे",
        "count": 2
      }
    ],
    "top_insertions": [
      {
        "word": "आहे",
        "count": 18
      },
      {
        "word": "एकोणीसशे",
        "count": 18
      },
      {
        "word": "ही",
        "count": 10
      },
      {
        "word": "ये��े",
        "count": 7
      },
      {
        "word": "आणि",
        "count": 6
      },
      {
        "word": "या",
        "count": 5
      },
      {
        "word": "जी",
        "count": 5
      },
      {
        "word": "केलं",
        "count": 4
      },
      {
        "word": "जे",
        "count": 4
      },
      {
        "word": "इसवी",
        "count": 4
      },
      {
        "word": "सुरू",
        "count": 4
      },
      {
        "word": "हे",
        "count": 4
      },
      {
        "word": "पाचशे",
        "count": 4
      },
      {
        "word": "सं��ेलन",
        "count": 4
      },
      {
        "word": "एकशे",
        "count": 4
      },
      {
        "word": "ह्या",
        "count": 4
      },
      {
        "word": "आय",
        "count": 4
      },
      {
        "word": "त्या",
        "count": 4
      },
      {
        "word": "माझ्या",
        "count": 3
      },
      {
        "word": "करून",
        "count": 3
      }
    ],
    "top_deletions": [
      {
        "word": "शे",
        "count": 33
      },
      {
        "word": "एक",
        "count": 27
      },
      {
        "word": "हजार",
        "count": 24
      },
      {
        "word": "नऊ",
        "count": 21
      },
      {
        "word": "मध्ये",
        "count": 12
      },
      {
        "word": "या",
        "count": 12
      },
      {
        "word": "आहेत",
        "count": 11
      },
      {
        "word": "येथे",
        "count": 8
      },
      {
        "word": "व",
        "count": 8
      },
      {
        "word": "हे",
        "count": 7
      },
      {
        "word": "केले",
        "count": 6
      },
      {
        "word": "तीन",
        "count": 5
      },
      {
        "word": "ह्या",
        "count": 5
      },
      {
        "word": "आहे",
        "count": 5
      },
      {
        "word": "तालुक्यातील",
        "count": 5
      },
      {
        "word": "इ",
        "count": 4
      },
      {
        "word": "स",
        "count": 4
      },
      {
        "word": "सुरु",
        "count": 4
      },
      {
        "word": "ऐंशी",
        "count": 4
      },
      {
        "word": "दोन",
        "count": 4
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 4,
      "punctuation_only_count": 0,
      "spacing_tokenization_count": 456,
      "entity_mismatch_count": 0,
      "script_confusion_count": 0,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "844424933382096-365-m",
        "844424933427331-365-m",
        "844424933495009-787-m"
      ],
      "best_samples": [
        "844424931079461-40-f",
        "844424933429291-884-m",
        "844424932813251-13-f"
      ],
      "numeric_mismatch_samples": [
        "844424930638604-559-f",
        "844424933537501-787-m",
        "844424930739213-40-f"
      ],
      "entity_mismatch_samples": []
    }
  },
  "odia": {
    "top_substitutions": [
      {
        "ref": "ବଡ",
        "hyp": "ବଡ଼",
        "count": 6
      },
      {
        "ref": "ଏକ",
        "hyp": "ଶହେ",
        "count": 4
      },
      {
        "ref": "ମିଡିଆରେ",
        "hyp": "ମିଡ଼ିଆରେ",
        "count": 4
      },
      {
        "ref": "ନଅ",
        "hyp": "ଦଶ",
        "count": 4
      },
      {
        "ref": "ଏହାସହ",
        "hyp": "ଏହା",
        "count": 4
      },
      {
        "ref": "ଦୁଇ",
        "hyp": "ଦୁଇହଜାର",
        "count": 3
      },
      {
        "ref": "ସୋସିଆଲ",
        "hyp": "ସୋସିଆଲ୍",
        "count": 3
      },
      {
        "ref": "ଏକ",
        "hyp": "ଉଣେଇଶହ",
        "count": 3
      },
      {
        "ref": "ପୋଲିସ",
        "hyp": "ପୋଲିସ୍",
        "count": 3
      },
      {
        "ref": "ପାଇଁ",
        "hyp": "କରିବା",
        "count": 3
      },
      {
        "ref": "ଏହାପରେ",
        "hyp": "ଏହା",
        "count": 3
      },
      {
        "ref": "ଏହାଦ୍ୱାରା",
        "hyp": "ଏହା",
        "count": 2
      },
      {
        "ref": "ଭାଇରାଲ",
        "hyp": "ଭାଇରାଲ୍",
        "count": 2
      },
      {
        "ref": "ପାଇଁ",
        "hyp": "ଚିକିତ୍ସା",
        "count": 2
      },
      {
        "ref": "ଏହି",
        "hyp": "ଏଇ",
        "count": 2
      },
      {
        "ref": "ସମାଲୋଚନା",
        "hyp": "ସମାଲୋ��ନା",
        "count": 2
      },
      {
        "ref": "ଦୁଇ",
        "hyp": "ହଜାର",
        "count": 2
      },
      {
        "ref": "ଯୋଗୁ",
        "hyp": "ଯୋଗୁଁ",
        "count": 2
      },
      {
        "ref": "ନଅ",
        "hyp": "ମସିହାରେ",
        "count": 2
      },
      {
        "ref": "ଦୁଇ",
        "hyp": "ଦୁଇଟି",
        "count": 2
      }
    ],
    "top_insertions": [
      {
        "word": "ଏହା",
        "count": 10
      },
      {
        "word": "ବଡ଼",
        "count": 8
      },
      {
        "word": "ପୋଲିସ୍",
        "count": 8
      },
      {
        "word": "ଦୁଇ",
        "count": 6
      },
      {
        "word": "ଦଶ",
        "count": 5
      },
      {
        "word": "ହୋଇ",
        "count": 5
      },
      {
        "word": "ଓ",
        "count": 5
      },
      {
        "word": "ଧାନ",
        "count": 5
      },
      {
        "word": "ମିଡ଼ିଆରେ",
        "count": 4
      },
      {
        "word": "କରିଦେଇ��ିଲେ",
        "count": 4
      },
      {
        "word": "କରାଯାଇ��ିବା",
        "count": 4
      },
      {
        "word": "ଉଣେଇଶହ",
        "count": 4
      },
      {
        "word": "ପରେ",
        "count": 4
      },
      {
        "word": "ପାଇ��ିଲେ",
        "count": 4
      },
      {
        "word": "ଶହ",
        "count": 4
      },
      {
        "word": "ଧୀରେ",
        "count": 4
      },
      {
        "word": "ଦ୍ୱାରା",
        "count": 3
      },
      {
        "word": "ଦୁଇହଜାର",
        "count": 3
      },
      {
        "word": "ରଥ",
        "count": 3
      },
      {
        "word": "ସୋସିଆଲ୍",
        "count": 3
      }
    ],
    "top_deletions": [
      {
        "word": "ଶହେ",
        "count": 14
      },
      {
        "word": "ଏକ",
        "count": 13
      },
      {
        "word": "ଦୁଇ",
        "count": 13
      },
      {
        "word": "ଟି",
        "count": 12
      },
      {
        "word": "ନଅ",
        "count": 11
      },
      {
        "word": "ହଜାର",
        "count": 10
      },
      {
        "word": "ରେ",
        "count": 10
      },
      {
        "word": "ବଡ",
        "count": 7
      },
      {
        "word": "ତିନି",
        "count": 7
      },
      {
        "word": "କରି",
        "count": 7
      },
      {
        "word": "ଏହି",
        "count": 7
      },
      {
        "word": "ରୁ",
        "count": 6
      },
      {
        "word": "ବେଳେ",
        "count": 6
      },
      {
        "word": "ନ",
        "count": 6
      },
      {
        "word": "ପୋଲିସ",
        "count": 5
      },
      {
        "word": "ମିଡିଆରେ",
        "count": 4
      },
      {
        "word": "କରାଯାଇଥିବା",
        "count": 4
      },
      {
        "word": "ଦେଇଥିଲେ",
        "count": 4
      },
      {
        "word": "ଓ",
        "count": 4
      },
      {
        "word": "କମ",
        "count": 4
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 5,
      "punctuation_only_count": 1,
      "spacing_tokenization_count": 473,
      "entity_mismatch_count": 0,
      "script_confusion_count": 0,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "844424930717655-795-f",
        "844424930498646-388-f",
        "844424930457555-1178-f"
      ],
      "best_samples": [
        "844424932422433-43-f",
        "844424930403820-840-f",
        "844424931353021-824-m"
      ],
      "numeric_mismatch_samples": [
        "844424932356473-97-m",
        "844424931378477-824-m",
        "844424932383275-824-m"
      ],
      "entity_mismatch_samples": []
    }
  },
  "punjabi": {
    "top_substitutions": [
      {
        "ref": "ਵਿਚ",
        "hyp": "ਵਿੱਚ",
        "count": 25
      },
      {
        "ref": "ਇਕ",
        "hyp": "ਇੱਕ",
        "count": 13
      },
      {
        "ref": "ਤੇ",
        "hyp": "ਅਤੇ",
        "count": 7
      },
      {
        "ref": "ਉਨ੍ਹਾਂ",
        "hyp": "ਉਹਨਾਂ",
        "count": 6
      },
      {
        "ref": "ਉਸ",
        "hyp": "ਉਸਨੇ",
        "count": 5
      },
      {
        "ref": "ਵਲੋਂ",
        "hyp": "ਵੱਲੋਂ",
        "count": 4
      },
      {
        "ref": "ਸਕਦਾ",
        "hyp": "ਹੈ",
        "count": 4
      },
      {
        "ref": "ਸਿਰਫ",
        "hyp": "ਸਿਰਫ਼",
        "count": 4
      },
      {
        "ref": "ਇਨ੍ਹਾਂ",
        "hyp": "ਇਹਨਾਂ",
        "count": 4
      },
      {
        "ref": "ਹੈ",
        "hyp": "ਜਾਂਦਾ",
        "count": 4
      },
      {
        "ref": "ਹੈ",
        "hyp": "ਹੁੰਦਾ",
        "count": 4
      },
      {
        "ref": "ਰਚਨਾ",
        "hyp": "ਰ��ਨਾ",
        "count": 3
      },
      {
        "ref": "ਇਸ",
        "hyp": "ਇਸਨੂੰ",
        "count": 3
      },
      {
        "ref": "ਵਾਧੂ",
        "hyp": "ਵਾ��ੂ",
        "count": 3
      },
      {
        "ref": "ਉਸ",
        "hyp": "ਉਸਦਾ",
        "count": 3
      },
      {
        "ref": "ਮੁਸ਼ਕਲ",
        "hyp": "ਮੁਸ਼ਕਿਲ",
        "count": 3
      },
      {
        "ref": "ਸਭਿਆਚਾਰ",
        "hyp": "ਸੱਭਿਆਚਾਰ",
        "count": 3
      },
      {
        "ref": "ਇੱਕ",
        "hyp": "ਦਾ",
        "count": 3
      },
      {
        "ref": "ਨੂੰ",
        "hyp": "ਅਤੇ",
        "count": 3
      },
      {
        "ref": "ਚਿੱਟੇ",
        "hyp": "ਚਿੱ��ੇ",
        "count": 2
      }
    ],
    "top_insertions": [
      {
        "word": "ਵਿੱਚ",
        "count": 34
      },
      {
        "word": "ਇੱਕ",
        "count": 19
      },
      {
        "word": "ਅਤੇ",
        "count": 12
      },
      {
        "word": "ਦਾ",
        "count": 11
      },
      {
        "word": "ਉਹਨਾਂ",
        "count": 9
      },
      {
        "word": "ਨੂੰ",
        "count": 8
      },
      {
        "word": "ਵੀ",
        "count": 7
      },
      {
        "word": "ਹੈ",
        "count": 7
      },
      {
        "word": "ਦੀ",
        "count": 6
      },
      {
        "word": "ਇਸ",
        "count": 6
      },
      {
        "word": "ਉਸਨੇ",
        "count": 6
      },
      {
        "word": "ਵੱਲੋਂ",
        "count": 5
      },
      {
        "word": "ਦੇ",
        "count": 5
      },
      {
        "word": "ਰ��ਨਾ",
        "count": 5
      },
      {
        "word": "ਇਹਨਾਂ",
        "count": 5
      },
      {
        "word": "ਸੀ",
        "count": 5
      },
      {
        "word": "ਇਹ",
        "count": 5
      },
      {
        "word": "ਜਾਂ",
        "count": 5
      },
      {
        "word": "ਪੀ",
        "count": 4
      },
      {
        "word": "ਤੱਕ",
        "count": 4
      }
    ],
    "top_deletions": [
      {
        "word": "ਵਿਚ",
        "count": 32
      },
      {
        "word": "ਇਕ",
        "count": 17
      },
      {
        "word": "ਤੇ",
        "count": 16
      },
      {
        "word": "ਉਸ",
        "count": 14
      },
      {
        "word": "ਦੇ",
        "count": 12
      },
      {
        "word": "ਉਨ੍ਹਾਂ",
        "count": 9
      },
      {
        "word": "ਡਾ",
        "count": 9
      },
      {
        "word": "ਦਾ",
        "count": 9
      },
      {
        "word": "ਨੂੰ",
        "count": 9
      },
      {
        "word": "ਨੇ",
        "count": 7
      },
      {
        "word": "ਇਹ",
        "count": 6
      },
      {
        "word": "ਇਸ",
        "count": 6
      },
      {
        "word": "ਅਮਰੀਕੀ",
        "count": 5
      },
      {
        "word": "ਵਿੱਚ",
        "count": 5
      },
      {
        "word": "ਰਚਨਾ",
        "count": 5
      },
      {
        "word": "ਸਥਿਤ",
        "count": 5
      },
      {
        "word": "ਵਲੋਂ",
        "count": 4
      },
      {
        "word": "ਸਿਰਫ",
        "count": 4
      },
      {
        "word": "ਇਨ੍ਹਾਂ",
        "count": 4
      },
      {
        "word": "ਦੀ",
        "count": 4
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 0,
      "punctuation_only_count": 7,
      "spacing_tokenization_count": 444,
      "entity_mismatch_count": 0,
      "script_confusion_count": 0,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "844424932650386-703-f",
        "844424931542284-775-f",
        "844424933647759-601-m"
      ],
      "best_samples": [
        "844424930814747-1031-f",
        "844424931241652-66-f",
        "844424933639154-32-m"
      ],
      "numeric_mismatch_samples": [],
      "entity_mismatch_samples": []
    }
  },
  "tamil": {
    "top_substitutions": [
      {
        "ref": "என்னும்",
        "hyp": "இன்னும்",
        "count": 3
      },
      {
        "ref": "ஆளுநர்",
        "hyp": "ஆளு��ர்",
        "count": 3
      },
      {
        "ref": "இந்நிலையில்",
        "hyp": "இந்த",
        "count": 2
      },
      {
        "ref": "இந்த",
        "hyp": "நிலையில்",
        "count": 2
      },
      {
        "ref": "நடித்த",
        "hyp": "படத்தில்",
        "count": 2
      },
      {
        "ref": "அங்கு",
        "hyp": "அங்கே",
        "count": 2
      },
      {
        "ref": "செந்தில்குமார்",
        "hyp": "செந்தில்",
        "count": 2
      },
      {
        "ref": "குடியரசு",
        "hyp": "குடியரசுத்",
        "count": 2
      },
      {
        "ref": "இது",
        "hyp": "இதை",
        "count": 2
      },
      {
        "ref": "இனி",
        "hyp": "இனிமேல்",
        "count": 2
      },
      {
        "ref": "இதை",
        "hyp": "இது",
        "count": 2
      },
      {
        "ref": "காஷ்மீர்",
        "hyp": "கா��்மீர்",
        "count": 2
      },
      {
        "ref": "இண்டியம்",
        "hyp": "இந்திய",
        "count": 2
      },
      {
        "ref": "திரைப்படத்துறை",
        "hyp": "திரைப்படத்",
        "count": 2
      },
      {
        "ref": "இதனையடுத்து",
        "hyp": "இதனை",
        "count": 2
      },
      {
        "ref": "பன்வாரிலால்",
        "hyp": "பண்வாரிலால்",
        "count": 2
      },
      {
        "ref": "விபத்தில்",
        "hyp": "வி��த்தில்",
        "count": 2
      },
      {
        "ref": "ஓத்துக்கிட்டு",
        "hyp": "ஒத்துக்கிட்டு",
        "count": 2
      },
      {
        "ref": "அவர்",
        "hyp": "போது",
        "count": 2
      },
      {
        "ref": "மாநிலத்தில்",
        "hyp": "மாநிலத்தின்",
        "count": 2
      }
    ],
    "top_insertions": [
      {
        "word": "தான்",
        "count": 8
      },
      {
        "word": "போது",
        "count": 8
      },
      {
        "word": "எடுத்து",
        "count": 7
      },
      {
        "word": "இந்த",
        "count": 5
      },
      {
        "word": "நிலையில்",
        "count": 5
      },
      {
        "word": "என",
        "count": 5
      },
      {
        "word": "என்ற",
        "count": 5
      },
      {
        "word": "ஒரு",
        "count": 4
      },
      {
        "word": "இந்திய",
        "count": 4
      },
      {
        "word": "எனக்கு",
        "count": 4
      },
      {
        "word": "நீர்",
        "count": 3
      },
      {
        "word": "இன்னும்",
        "count": 3
      },
      {
        "word": "மட்டும்",
        "count": 3
      },
      {
        "word": "இதை",
        "count": 3
      },
      {
        "word": "என்ன",
        "count": 3
      },
      {
        "word": "இது",
        "count": 3
      },
      {
        "word": "என்றால்",
        "count": 3
      },
      {
        "word": "கூறிய",
        "count": 3
      },
      {
        "word": "பதிவு",
        "count": 3
      },
      {
        "word": "விதை",
        "count": 3
      }
    ],
    "top_deletions": [
      {
        "word": "என",
        "count": 6
      },
      {
        "word": "ஆகும்",
        "count": 6
      },
      {
        "word": "இருந்து",
        "count": 6
      },
      {
        "word": "இந்த",
        "count": 5
      },
      {
        "word": "இந்நிலையில்",
        "count": 3
      },
      {
        "word": "என்னும்",
        "count": 3
      },
      {
        "word": "பட",
        "count": 3
      },
      {
        "word": "எரி",
        "count": 3
      },
      {
        "word": "பலி",
        "count": 3
      },
      {
        "word": "அருகே",
        "count": 3
      },
      {
        "word": "இதனையடுத்து",
        "count": 3
      },
      {
        "word": "பெயர்",
        "count": 3
      },
      {
        "word": "விட்டு",
        "count": 3
      },
      {
        "word": "இண்டியம்",
        "count": 3
      },
      {
        "word": "காவல்",
        "count": 3
      },
      {
        "word": "துறை",
        "count": 3
      },
      {
        "word": "பொலிஸார்",
        "count": 3
      },
      {
        "word": "பாராளுமன்ற",
        "count": 3
      },
      {
        "word": "உயர்",
        "count": 3
      },
      {
        "word": "ஆளுநர்",
        "count": 3
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 1,
      "punctuation_only_count": 7,
      "spacing_tokenization_count": 475,
      "entity_mismatch_count": 0,
      "script_confusion_count": 0,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "844424932803222-807-f",
        "844424933333773-739-m",
        "844424933225841-401-m"
      ],
      "best_samples": [
        "844424933239581-401-m",
        "844424931267557-837-f",
        "844424931230620-764-f"
      ],
      "numeric_mismatch_samples": [
        "844424933301818-280-m"
      ],
      "entity_mismatch_samples": []
    }
  },
  "telugu": {
    "top_substitutions": [
      {
        "ref": "మరింత",
        "hyp": "మరిం��",
        "count": 4
      },
      {
        "ref": "అక్కడి",
        "hyp": "అక్కడ",
        "count": 3
      },
      {
        "ref": "ప్రధాని",
        "hyp": "ప్రధానమొది",
        "count": 2
      },
      {
        "ref": "అర్ధం",
        "hyp": "అర్థం",
        "count": 2
      },
      {
        "ref": "చేసుకుని",
        "hyp": "చేసుకొని",
        "count": 2
      },
      {
        "ref": "ఔషధ",
        "hyp": "��షధ",
        "count": 2
      },
      {
        "ref": "సంఖ్యలో",
        "hyp": "సం��్యలో",
        "count": 2
      },
      {
        "ref": "కూడ",
        "hyp": "కూడా",
        "count": 2
      },
      {
        "ref": "సంభవిస్తుంది",
        "hyp": "సం��విస్తుంది",
        "count": 2
      },
      {
        "ref": "ప్రాంతంలో",
        "hyp": "తెలంగాణ",
        "count": 2
      },
      {
        "ref": "కళ",
        "hyp": "కల",
        "count": 2
      },
      {
        "ref": "మరియు",
        "hyp": "మరి",
        "count": 2
      },
      {
        "ref": "సంఖ్య",
        "hyp": "సం��్య",
        "count": 2
      },
      {
        "ref": "పాఠశాలలో",
        "hyp": "పా��శాలలో",
        "count": 2
      },
      {
        "ref": "మళ్లీ",
        "hyp": "మళ్ళీ",
        "count": 2
      },
      {
        "ref": "చేశారు",
        "hyp": "వ్యక్తం",
        "count": 2
      },
      {
        "ref": "కాని",
        "hyp": "కానీ",
        "count": 2
      },
      {
        "ref": "ఇక్కడి",
        "hyp": "ఇక్కడ",
        "count": 2
      },
      {
        "ref": "గ్రామం",
        "hyp": "లోని",
        "count": 2
      },
      {
        "ref": "పాఠశాల",
        "hyp": "పా��శాల",
        "count": 2
      }
    ],
    "top_insertions": [
      {
        "word": "లో",
        "count": 13
      },
      {
        "word": "ఈ",
        "count": 10
      },
      {
        "word": "మరిం��",
        "count": 8
      },
      {
        "word": "ఒక",
        "count": 7
      },
      {
        "word": "గా",
        "count": 6
      },
      {
        "word": "ముందు",
        "count": 5
      },
      {
        "word": "కూడా",
        "count": 5
      },
      {
        "word": "తన",
        "count": 5
      },
      {
        "word": "కానీ",
        "count": 5
      },
      {
        "word": "మరి",
        "count": 5
      },
      {
        "word": "పా��శాల",
        "count": 5
      },
      {
        "word": "తో",
        "count": 4
      },
      {
        "word": "అని",
        "count": 4
      },
      {
        "word": "ఇలా",
        "count": 4
      },
      {
        "word": "అయిన",
        "count": 4
      },
      {
        "word": "ఉన్న",
        "count": 4
      },
      {
        "word": "ఏ",
        "count": 4
      },
      {
        "word": "ఇక్కడ",
        "count": 4
      },
      {
        "word": "రోజు",
        "count": 3
      },
      {
        "word": "చేసి",
        "count": 3
      }
    ],
    "top_deletions": [
      {
        "word": "లో",
        "count": 11
      },
      {
        "word": "మరింత",
        "count": 9
      },
      {
        "word": "లోని",
        "count": 8
      },
      {
        "word": "పాఠశాల",
        "count": 6
      },
      {
        "word": "ఈ",
        "count": 5
      },
      {
        "word": "ఓ",
        "count": 3
      },
      {
        "word": "ప్రధాని",
        "count": 3
      },
      {
        "word": "ఆర్",
        "count": 3
      },
      {
        "word": "తో",
        "count": 3
      },
      {
        "word": "ను",
        "count": 3
      },
      {
        "word": "తెలంగాణా",
        "count": 3
      },
      {
        "word": "కేసీఆర్",
        "count": 3
      },
      {
        "word": "రైల్వే",
        "count": 3
      },
      {
        "word": "ఆంధ్ర",
        "count": 3
      },
      {
        "word": "ప్రదేశ్",
        "count": 3
      },
      {
        "word": "గా",
        "count": 3
      },
      {
        "word": "కాని",
        "count": 3
      },
      {
        "word": "కళాశాల",
        "count": 3
      },
      {
        "word": "అక్కడి",
        "count": 3
      },
      {
        "word": "పదవీ",
        "count": 2
      }
    ],
    "error_buckets": {
      "numeric_mismatch_count": 0,
      "punctuation_only_count": 1,
      "spacing_tokenization_count": 462,
      "entity_mismatch_count": 0,
      "script_confusion_count": 0,
      "empty_hypothesis_count": 0
    },
    "examples": {
      "worst_samples": [
        "844424931244235-407-f",
        "844424933587000-1166-m",
        "844424933579330-1192-m"
      ],
      "best_samples": [
        "844424932572993-832-f",
        "844424933582544-922-m",
        "844424931096849-407-f"
      ],
      "numeric_mismatch_samples": [],
      "entity_mismatch_samples": []
    }
  },
  "__summary__": {
    "model_diagnosis": "recognition-limited",
    "primary_error_source": "recognition",
    "numeric_verbalization_impact": "low",
    "formatting_impact": "low",
    "worst_languages": [
      "kannada",
      "tamil",
      "malayalam"
    ],
    "best_languages": [
      "hindi",
      "punjabi",
      "gujarati"
    ]
  }
}