o
    7ti                     @   s$   d dl Z dd Zdd Zdd ZdS )    Nc                 C   sN   |  dd} |  dd} |  dd} |  dd} |  d	d} td
d| } | S )Nz n'tzn'tz ))z( (z" "z "z (['.,])z\1)replaceresub)string r	   N/home/ubuntu/.local/lib/python3.10/site-packages/lm_eval/tasks/paws-x/utils.pygeneral_detokenize   s   r   c                 C   s   | d   | dd   S )Nr      )lower)textr	   r	   r
   lowercase_first_letter   s   r   c                    sR   g   fdd} g krt  }td| dt |  d   | dd |S )Nc                    s   | d dvr;| d dvr;t | d  | d< t | d  | d< | d dr1| d d d | d< t| d | d< | S  |  | S )N	sentence1N 	sentence2).,;)r   stripendswithr   appenddoc
empty_docsr	   r
   _process_doc   s   
z.process_docs_paraphrases.<locals>._process_doczFound z empty documents out of the z total docs in the dataset: c                 S   s   | d dvo| d dvS )Nr   r   r   r	   r   r	   r	   r
   <lambda>)   s    z*process_docs_paraphrases.<locals>.<lambda>)lenprintfiltermap)datasetr   len_empty_docsr	   r   r
   process_docs_paraphrases   s   r'   )r   r   r   r'   r	   r	   r	   r
   <module>   s    
