o
    TÃiz  ã                   @   s8   d dl T d dlmZ G dd„ deƒZG dd„ deƒZdS )é    )Ú*)ÚLayerContainerc                   @   s`   e Zd ZU eed< eed< eed< eed< eed< e	ed< e	ed< dd	d
ddddddddœ
Z
dS )ÚMixtralTransformerContainerÚqkv_wÚ
attn_out_wÚmoe_gateÚ	moe_mlp_1Ú	moe_mlp_2Úattn_norm_gammaÚmlp_norm_gammazattn_norm_gamma.paramszmlp_norm_gamma.paramszqkv_w.q_paramszqkv_w.k_paramszqkv_w.v_paramszattn_out_w.paramszmoe_gate.paramszmoe_mlp_1.gating_expertszmoe_mlp_1.up_expertszmoe_mlp_2.experts)
zinput_layernorm.weightzpost_attention_layernorm.weightzself_attn.q_proj.weightzself_attn.k_proj.weightzself_attn.v_proj.weightzself_attn.o_proj.weightzblock_sparse_moe.gate.weightz$block_sparse_moe.experts.*.w1.weightz$block_sparse_moe.experts.*.w3.weightz$block_sparse_moe.experts.*.w2.weightN)Ú__name__Ú
__module__Ú__qualname__ÚUnfusedQKVParameterÚ__annotations__ÚAttentionOutputParameterÚMoEGatingWeightParameterÚUnfusedMoEGatedMLPParameterÚUnfusedMoEMLP2ParameterÚNormParameterÚPARAM_MAPPING© r   r   úr/home/ubuntu/.local/lib/python3.10/site-packages/deepspeed/inference/v2/model_implementations/mixtral/container.pyr      s&   
 
ör   c                   @   s2   e Zd ZU eed< eed< eed< ddddœZdS )	ÚMixtralNonTransformerContainerÚword_embÚword_unembedÚ
final_normzword_emb.paramszword_unembed.paramszfinal_norm.params)zmodel.embed_tokens.weightzlm_head.weightzmodel.norm.weightN)r   r   r   ÚEmbeddingParameterr   ÚUnembedParameterr   r   r   r   r   r   r   $   s   
 
ýr   N)Ú>deepspeed.inference.v2.model_implementations.common_parametersÚAdeepspeed.inference.v2.model_implementations.layer_container_baser   r   r   r   r   r   r   Ú<module>   s   