o
    
Û¾iÁ  ã                   @   s,   d dl mZ d dlmZ G dd„ deƒZdS )é    )ÚAny)ÚPretrainedConfigc                H       sf  e Zd ZdZ										
																										d;dedededededededededed ed!ed"ed#ed$eee B dB d%ee	e
f dB d&edB d'edB d(ed)ee eB dB d*ee eB dB d+e	d,ed-e	d.ed/ed0ed1ee	 dB d2ee dB d3ee	 dB d4ee	e
f dB d5ed6ee dB d7ee dB d8edB fF‡ fd9d:„Z‡  ZS )<ÚStep3p5ConfigÚstep3p5é   é 4  é(   é   é0   é   é   çñhãˆµøä>é   Fé (  é   é   r   é ¡ NTÚsoftmaxç      ð?ÚGQAÚhidden_sizeÚintermediate_sizeÚnum_attention_headsÚnum_attention_groupsÚnum_hidden_layersÚmax_seq_lenÚ
vocab_sizeÚrms_norm_epsÚmoe_every_n_layerÚuse_moeÚmoe_intermediate_sizeÚmoe_num_expertsÚ	moe_top_kÚmoe_layer_offsetÚ
rope_thetaÚrope_scalingÚhead_dimÚshare_expert_dimÚnorm_expert_weightÚbos_token_idÚeos_token_idÚmoe_router_activationÚmoe_router_scaling_factorÚatt_impl_typeÚuse_head_wise_attn_gateÚuse_moe_router_biasÚneed_fp32_gateÚlayer_typesÚuse_rope_layersÚyarn_only_typesÚattention_other_settingÚnum_nextn_predict_layersÚswiglu_limitsÚswiglu_limits_sharedÚmax_position_embeddingsc$           '         s0  || _ || _|| _|| _|| _|| _|| _|| _|
| _|| _	|	| _
|| _|| _|| _|| _|| _|| _|| _|d u rB| j	| j | _n|| _|| _|#| _|| _|| _|| _|| _|| _|| _|| _|| _|| _|| _| | _|!| _ |"| _!|d u rxdn|}%|d u r‚ddgn|}&|%| _"|&| _#t$ƒ j%d|%|&dœ|$¤Ž d S )Né   r   é   )r)   r*   © )&r   r   r   r   r   r   r   r   r   r    r   r!   Únum_experts_per_tokr"   r#   r$   r%   r&   r'   r(   r8   r+   r,   r/   r0   r-   r.   r1   r2   r3   r4   r5   r6   r7   r)   r*   ÚsuperÚ__init__)'Úselfr   r   r   r   r   r   r   r   r   r   r    r!   r"   r#   r$   r%   r&   r'   r(   r)   r*   r+   r,   r-   r.   r/   r0   r1   r2   r3   r4   r5   r6   r7   r8   ÚkwargsÚresolved_bos_token_idÚresolved_eos_token_id©Ú	__class__r;   ú[/home/ubuntu/.local/lib/python3.10/site-packages/vllm/transformers_utils/configs/step3p5.pyr>      s\   'þ
ýzStep3p5Config.__init__)#r   r   r   r	   r
   r   r   r   r   Fr   r   r   r   r   NNNTNNr   r   r   FTTNNNNr   NNN)Ú__name__Ú
__module__Ú__qualname__Ú
model_typeÚintÚfloatÚboolÚlistÚdictÚstrr   r>   Ú__classcell__r;   r;   rC   rE   r      sØ    Üþýüûúùø	÷
öõôóòñðïîíìëêéèçæåä
ã
â
á à!ß
"Þ
#Ý$Ür   N)Útypingr   Ú transformers.configuration_utilsr   r   r;   r;   r;   rE   Ú<module>   s   