o
    2wii                     @   s   d dl mZ d dlZd dlmZ d dlmZ d dlmZ ej	e
dddejd	ejdd
ddejde dejddedddgddejddedddgddejdd
ddejdddedd d!ed"ee d#ee d$ed%ed&efd'd(ZdS ))    )ListN)prepareprepare_fisher_english)PathlikeT)show_default)context_settingsz
corpus-dirF)exists	file_okay)typez
output-dirz-adz--audio-dirs
LDC2004S13
LDC2005S13z_Audio dirs, e.g., `LDC2004S13 LDC2005S13`. Multiple corpora can be provided by repeating `-ad`.)r   multipledefaulthelpz-tdz--transcript-dirs
LDC2004T19
LDC2005T19zdTranscript dirs, e.g., `LDC2004T19 LDC2005T19`. Multiple corpora can be provided by repeating `-ad`.z--absolute-pathszPWhether to return absolute or relative (to the corpus dir) paths for recordings.)r   r   z-jz
--num-jobs   z8Number of concurrent processes scanning the audio files.)r   r   r   
corpus_dir
audio_dirstranscript_dirs
output_dirabsolute_pathsnum_jobsc                 C   s   t | |||||d dS )ae  
    The Fisher English Part 1, 2 corpus preparation.

    
    This is conversational telephone speech collected as 2-channel, 8kHz-sampled data.
    The catalog number LDC2004S13 and LDC2005S13 for audio corpora and LDC2004T19 LDC2005T19 for transcripts.

    This data is not available for free - your institution needs to have an LDC subscription.
    r   r   r   r   r   r   Nr   r    r   d/home/ubuntu/sommelier/.venv/lib/python3.10/site-packages/lhotse/bin/modes/recipes/fisher_english.pyfisher_english
   s   0
r   )typingr   clicklhotse.bin.modesr   lhotse.recipesr   lhotse.utilsr   commanddictargumentPathoptionstrintboolr   r   r   r   r   <module>   sb    