o
    SiW                     @   s   d dl Z d dlmZ d dlmZ d dlmZ ejeddde j	de j
dd	d
de j	de 
 de jde j
dd	d
de jde j
dd	d
dde jdddde jdd	dddedededededefddZdS )    N)prepareprepare_switchboard)PathlikeT)show_default)context_settingsz	audio-dirF)exists	file_okay)typez
output-dirz--transcript-dirz--sentiment-dirzHOptional path to LDC2020T14 package with sentiment annotations for SWBD.)r
   helpz--omit-silence/--retain-silencez&Should the [silence] segments be kept.)defaultr   z--absolute-pathszPWhether to return absolute or relative (to the corpus dir) paths for recordings.	audio_dir
output_dirtranscript_dirsentiment_diromit_silenceabsolute_pathsc                 C   s   t | |||||d dS )aP  
    The Switchboard corpus preparation.

    
    This is conversational telephone speech collected as 2-channel, 8kHz-sampled
    data.  We are using just the Switchboard-1 Phase 1 training data.
    The catalog number LDC97S62 (Switchboard-1 Release 2) corresponds, we believe,
    to what we have.  We also use the Mississippi State transcriptions, which
    we download separately from
    http://www.isip.piconepress.com/projects/switchboard/releases/switchboard_word_alignments.tar.gz

    This data is not available for free - your institution needs to have an LDC subscription.
    )r   transcripts_dirr   r   r   r   Nr   )r   r   r   r   r   r    r   X/home/ubuntu/.local/lib/python3.10/site-packages/lhotse/bin/modes/recipes/switchboard.pyswitchboard   s   (
r   )clicklhotse.bin.modesr   lhotse.recipesr   lhotse.utilsr   commanddictargumentPathoptionboolr   r   r   r   r   <module>   sH    