o
    Kεi                     @   s0   d Z ddlmZ ddlmZ G dd deZdS )z
@author:Bengali.AI
    )print_function   )BaseNormalizerc                       s(   e Zd Z	d fdd	Zdd Z  ZS )IndicNormalizerFc                    s   t t| j||d dS )ab  
            initialize a normalizer
            args:
                language                        :   language identifier from 'devanagari', 'gujarati', 'odiya', 'tamil', 'panjabi', 'malayalam','sylhetinagri'
                allow_english                   :   allow english letters numbers and punctuations [default:False]
                
        )languageallow_englishN)superr   __init__)selfr   r   	__class__ M/home/ubuntu/.local/lib/python3.10/site-packages/bnunicodenormalizer/indic.pyr	      s   zIndicNormalizer.__init__c              
   C   s.  |   r"| jd | jjv r"| jdd  | _|   r"| jd | jjv sz| jd | jjkr7| jd d | _d}nd}W n tyN } zd}W Y d }~nd }~ww |   rq| jd | jjkrq| jd d | _|   rq| jd | jjks\|r{| j| jj |   rt| jD ]\}}|| jvrd | j|< qd S d S )Nr   r   TF)	checkDecompdecomplanginvalid_starts	connector	Exceptionappend	enumeratevalid)r
   add_coneidxdr   r   r   cleanInvalidUnicodes   s0   

z$IndicNormalizer.cleanInvalidUnicodes)F)__name__
__module____qualname__r	   r   __classcell__r   r   r   r   r      s    r   N)__doc__
__future__r   baser   r   r   r   r   r   <module>   s   