# Core
torch>=2.4.0
torchaudio>=2.4.0
transformers>=4.52
sentencepiece
protobuf

# Data
webdataset>=0.2.86
pandas
pyarrow
soundfile
librosa
numpy

# Training
pyyaml
wandb

# Evaluation
jiwer

# Optional: FSDP / DeepSpeed
# (left commented out on purpose; uncomment the line below to install it)
# deepspeed>=0.14.0