"""
Validation pipeline: LID consensus + CTC confidence scoring.

Downloads transcribed tars, runs two language-identification (LID) models
(MMS LID-256 and VoxLingua107) and two CTC models (IndicConformer and
IndicWav2Vec), then packs rich segment-level data into parquet shards.
"""
# Version string for this module, kept as a plain string literal.
# NOTE(review): presumably read by packaging/release tooling — confirm before
# changing how it is defined.
__version__ = "0.1.0"
