o
     ¢iÈ  ã                   @   s,   d dl mZ d dlmZ G dd„ deƒZdS )é   )Ú
Lemmatizer)ÚTokenc                   @   s"   e Zd ZdZdedefdd„ZdS )ÚEnglishLemmatizerz0English lemmatizer. Only overrides is_base_form.ÚtokenÚreturnc                 C   sÒ   |j  ¡ }|j ¡ }|dkr| d¡dkrdS |dkr$| d¡dkr$dS |dkr?| d¡dkr?| d	¡d
kr?| d¡du r?dS |dkrL| d¡dkrLdS | d¡dkrUdS | d¡dkr^dS | d¡dkrgdS dS )a;  
        Check whether we're dealing with an uninflected paradigm, so we can
        avoid lemmatization entirely.

        univ_pos (str / int): The token's universal part-of-speech tag.
        morphology (dict): The token's morphological features following the
            Universal Dependencies scheme.
        ÚnounÚNumberÚSingTÚverbÚVerbFormÚInfÚFinÚTenseÚPresNÚadjÚDegreeÚPosÚNoneF)Úpos_ÚlowerÚmorphÚto_dictÚget)Úselfr   Úuniv_posÚ
morphology© r   úL/home/ubuntu/.local/lib/python3.10/site-packages/spacy/lang/en/lemmatizer.pyÚis_base_form   s(   
	
zEnglishLemmatizer.is_base_formN)Ú__name__Ú
__module__Ú__qualname__Ú__doc__r   Úboolr   r   r   r   r   r      s    r   N)Úpipeliner   Útokensr   r   r   r   r   r   Ú<module>   s    