o
    Si                     @   s   d dl Z d dlmZ d dlmZ d dlmZ ejeddde j	de j
dd	d
de j	de j
dd	d
de j	de 
 de jdd	dddedededefddZdS )    N)prepareprepare_callhome_egyptian)PathlikeT)show_default)context_settingsz	audio-dirF)exists	file_okay)typeztranscript-dirz
output-dirz--absolute-pathszPWhether to return absolute or relative (to the corpus dir) paths for recordings.)defaulthelp	audio_dirtranscript_dir
output_dirabsolute_pathsc                 C   s   t | |||d dS )a~  
    About the Callhome Egyptian Arabic Corpus

    The CALLHOME Egyptian Arabic corpus of telephone speech consists of 120 unscripted
    telephone conversations between native speakers of Egyptian Colloquial Arabic (ECA),
    the spoken variety of Arabic found in Egypt. The dialect of ECA that this
    dictionary represents is Cairene Arabic.

    This recipe uses the speech and transcripts available through LDC. In addition,
    an Egyptian arabic phonetic lexicon (available via LDC) is used to get word to
    phoneme mappings for the vocabulary. This datasets are:

    Speech : LDC97S45
    Transcripts : LDC97T19
    Lexicon : LDC99L22 (unused here)

    To actually read the audio, you will need the SPH2PIPE binary: you can provide its path,
    so that we will add it in the manifests (otherwise you might need to modify your PATH
    environment variable to find sph2pipe).
    r   r   r   r   Nr   r    r   ^/home/ubuntu/.local/lib/python3.10/site-packages/lhotse/bin/modes/recipes/callhome_egyptian.pycallhome_egyptian   s   #
r   )clicklhotse.bin.modesr   lhotse.recipesr   lhotse.utilsr   commanddictargumentPathoptionboolr   r   r   r   r   <module>   s,    