o
    2wi                     @   s   d dl Z d dlmZ d dlmZmZ d dlmZ eje	ddde j
de jddd	d
e j
de  d
e jdde eddde jddeddddedededefddZdS )    N)prepare)	NSC_PARTSprepare_nsc)PathlikeT)show_default)context_settings
corpus_dir)existsdir_okay)type
output_dirz-pz--dataset-partPART3_SameCloseMicz$Which part of NSC should be prepared)r   defaulthelpz-jz
--num-jobs   zBHow many threads to use (can give good speed-ups with slow disks).dataset_partnum_jobsc                 C   s   t | |||d dS )u@  
    
    This is a data preparation recipe for the National Corpus of Speech in Singaporean English.
    CORPUS_DIR: root directory that contains all NSC shared folder. Eg.
        ├── IMDA - National Speech Corpus
        │   ├── LEXICON
        │   ├── PART1
        │   ├── PART2
        │   └── PART3
        ├── IMDA - National Speech Corpus - Additional
        │   └── IMDA - National Speech Corpus (Additional)
        │      ├── PART4
        │      ├── PART5
        │      └── PART6
    )r   r   r   N)r   )r   r   r   r    r   Y/home/ubuntu/sommelier/.venv/lib/python3.10/site-packages/lhotse/bin/modes/recipes/nsc.pynsc   s   !
r   )clicklhotse.bin.modesr   lhotse.recipes.nscr   r   lhotse.utilsr   commanddictargumentPathoptionChoiceintstrr   r   r   r   r   <module>   s,    (