o
    5ti                     @   s8   d dl mZ ddlmZ ddlmZ G dd deZdS )    )	lru_cache   )BaseTokenizer)TokenizerRegexpc                   @   s.   e Zd Zdd Zdd Zedddd Zd	S )
Tokenizer13ac                 C   s   dS )N13a selfr   r   V/home/ubuntu/.local/lib/python3.10/site-packages/sacrebleu/tokenizers/tokenizer_13a.py	signature   s   zTokenizer13a.signaturec                 C   s   t  | _d S )N)r   _post_tokenizerr	   r   r   r   __init__   s   zTokenizer13a.__init__i   )maxsizec                 C   sn   | dd}| dd}| dd}d|v r.| dd}| d	d}| d
d}| dd}| d| dS )zTokenizes an input line using a relatively minimal tokenization
        that is however equivalent to mteval-v13a, used by WMT.

        :param line: a segment to tokenize
        :return: the tokenized line
        z	<skipped> z-

 &z&quot;"z&amp;z&lt;<z&gt;>)replacer   )r
   liner   r   r   __call__   s   
zTokenizer13a.__call__N)__name__
__module____qualname__r   r   r   r   r   r   r   r   r      s
    r   N)	functoolsr   tokenizer_baser   tokenizer_rer   r   r   r   r   r   <module>   s    