o
    i                     @   s   d dl Z G dd dZdS )    Nc                   @   s0   e Zd Zedd Zedd Zedd ZdS )KoreanCleanerc                    s6   ddddddddd	d
d
 d  fdd|D }|S )Nu   영u   일   이u   삼u   사   오u   육u   칠u   팔u   구)
0123456789 c                 3   (    | ]}|   v r | n|V  qd S Nkeys.0charnumber_to_kor S/home/ubuntu/.local/lib/python3.10/site-packages/funasr/tokenizer/korean_cleaner.py	<genexpr>   s    
z3KoreanCleaner._normalize_numbers.<locals>.<genexpr>)joinclstextnew_textr   r   r   _normalize_numbers   s   z KoreanCleaner._normalize_numbersc                    s   i ddddddddd	d
dddddddddddddddddddddd d!d"d#d$d%d&d'd(d)d*dd+	 t d,d-d. |}d/ fd0d1|D }|S )2NAu   에이Bu   비Cu   씨Du   디Er   Fu   에프Gu   지Hu	   에이치Iu   아이Ju   제이Ku   케이Lu   엘Mu   엠Nu   엔Or   Pu   피Qu   큐u   알u   에스u   티u   유u   브이u	   더블유u   엑스u   와이)	RSTUVWXYZz[a-z]+c                 S   s   t |  S r   )struppergroup)xr   r   r   <lambda>8   s    z7KoreanCleaner._normalize_english_text.<locals>.<lambda>r   c                 3   r   r   r   r   upper_alphabet_to_korr   r   r   9   s
    
z8KoreanCleaner._normalize_english_text.<locals>.<genexpr>)resubr   r   r   rA   r   _normalize_english_text   sd   	
z%KoreanCleaner._normalize_english_textc                 C   s    |  }| |}| |}|S r   )stripr!   rE   )r   r   r   r   r   normalize_text@   s   

zKoreanCleaner.normalize_textN)__name__
__module____qualname__classmethodr!   rE   rG   r   r   r   r   r      s    

%r   )rC   r   r   r   r   r   <module>   s   