o
    ˜à·iÊ  ã                   @   sÞ   U d dl mZmZ d dlZd dlZd dlmZ d dlm	Z	 d dl
mZ d dlmZ d dlmZmZ d dlmZmZ d d	lmZ d d
lmZmZmZmZmZ d dlmZ d dlmZ ee ƒZ!ee Z"ee#d< G dd„ deƒZ$dS )é    )ÚFinalÚ	TypeAliasN)ÚRequest)ÚEngineClient)ÚChatTemplateContentFormatOption)ÚRequestLogger)ÚErrorResponseÚ	UsageInfo)ÚOpenAIServingÚServeContext)ÚOpenAIServingModels)ÚClassificationChatRequestÚClassificationCompletionRequestÚClassificationDataÚClassificationRequestÚClassificationResponse)Úinit_logger)ÚClassificationOutputÚClassificationServeContextc                       sœ   e Zd ZdZdddddœdedededB d	edB d
ede	de	ddf‡ fdd„Z
dededB fdd„ZdedeeB fdd„ZdededeeB fdd„Z‡  ZS )ÚServingClassificationÚclassifyNÚautoF)Úchat_templateÚchat_template_content_formatÚtrust_request_chat_templateÚlog_error_stackÚengine_clientÚmodelsÚrequest_loggerr   r   r   r   Úreturnc                   s*   t ƒ j||||d || _|| _|| _d S )N)r   r   r   r   )ÚsuperÚ__init__r   r   r   )Úselfr   r   r   r   r   r   r   ©Ú	__class__© ú_/home/ubuntu/vllm_env/lib/python3.10/site-packages/vllm/entrypoints/pooling/classify/serving.pyr!   #   s   ü
zServingClassification.__init__Úctxc              
   Ã   sò   zU|   |j¡|_t|jtƒr9| j|jj|jj| jd}|r!|W S | j	|j|jj
| j| jddI dH \}|_W dS t|jtƒrQ| j|j|jjddI dH |_W dS |  d¡W S  tttjfyx } zt d¡ |  t|ƒ¡W  Y d}~S d}~ww )z|
        Process classification inputs: tokenize text, resolve adapters,
        and prepare model-specific inputs.
        )Úrequest_chat_templateÚchat_template_kwargsr   N)Údefault_templateÚdefault_template_content_formatÚdefault_template_kwargs)Úprompt_inputÚprompt_embedsz#Invalid classification request typez$Error in preprocessing prompt inputs)Ú_maybe_get_adaptersÚrequestÚlora_requestÚ
isinstancer   Ú_validate_chat_templater   r)   r   Ú_preprocess_chatÚmessagesr   Úengine_promptsr   Ú_preprocess_completionÚinputÚcreate_error_responseÚ
ValueErrorÚ	TypeErrorÚjinja2ÚTemplateErrorÚloggerÚ	exceptionÚstr)r"   r'   Úerror_check_retÚ_Úer%   r%   r&   Ú_preprocess9   s@   €ýû÷ýþ
€þz!ServingClassification._preprocessc                 C   s®   t | jjdi ƒ}g }d}|j}t|ƒD ]1\}}t |j¡}|j}	t	t
 |	¡ƒ}
| |
¡}t|||	t|	ƒd}| |¡ |j}|t|ƒ7 }qt||d}t|j|j|j||dS )zu
        Convert model outputs to a formatted classification response
        with probabilities and labels.
        Úid2labelr   )ÚindexÚlabelÚprobsÚnum_classes)Úprompt_tokensÚtotal_tokens)ÚidÚcreatedÚmodelÚdataÚusage)ÚgetattrÚmodel_configÚ	hf_configÚfinal_res_batchÚ	enumerater   Ú	from_baseÚoutputsrH   ÚintÚnpÚargmaxÚgetr   ÚlenÚappendÚprompt_token_idsr	   r   Ú
request_idÚcreated_timeÚ
model_name)r"   r'   rE   ÚitemsÚnum_prompt_tokensÚfinal_res_batch_checkedÚidxÚ	final_resÚclassify_resrH   Úpredicted_indexrG   Úitemr^   rP   r%   r%   r&   Ú_build_responsec   s:   
ü
þûz%ServingClassification._build_responser0   Úraw_requestc                 Ã   sB   | j  ¡ }| j› d|  |¡› }t||||d}|  |¡I d H S )Nú-)r0   rk   ra   r_   )r   ra   Úrequest_id_prefixÚ_base_request_idr   Úhandle)r"   r0   rk   ra   r_   r'   r%   r%   r&   Úcreate_classify‘   s   €
üz%ServingClassification.create_classify)Ú__name__Ú
__module__Ú__qualname__rm   r   r   r   r@   r   Úboolr!   r   r   rD   r   rj   r   r   rp   Ú__classcell__r%   r%   r#   r&   r       sP    ÷þýûúùø	÷
öþ
ý*þ
ý.þýür   )%Útypingr   r   r<   ÚnumpyrY   Úfastapir   Úvllm.engine.protocolr   Úvllm.entrypoints.chat_utilsr   Úvllm.entrypoints.loggerr   Ú'vllm.entrypoints.openai.engine.protocolr   r	   Ú&vllm.entrypoints.openai.engine.servingr
   r   Ú&vllm.entrypoints.openai.models.servingr   Ú*vllm.entrypoints.pooling.classify.protocolr   r   r   r   r   Úvllm.loggerr   Úvllm.outputsr   rq   r>   r   Ú__annotations__r   r%   r%   r%   r&   Ú<module>   s    