o
    }oi                     @   sv   d dl Zd dlZd dlZd dlmZ d dlmZmZ d dl	m
Z
 d dlmZ d dlmZ d dlmZ G dd	 d	ZdS )
    N)llm)finetunepretrain)MockDataModule)PEFT_STR2CLS	qwen2_72b)Trainerc                   @   sP   e Zd Zejdddd Zdd Zdd Zd	d
 Zdd Z	dd Z
dd ZdS )TestQwen2_72Bclass)scopec                 C   s   t S Nr   )self r   `/home/ubuntu/.local/lib/python3.10/site-packages/tests/collections/llm/recipes/test_qwen2_72b.pyrecipe_module   s   zTestQwen2_72B.recipe_modulec                 C   s   |  }t|tjsJ d S r   )model
isinstancerunConfig)r   r   model_configr   r   r   
test_model    s   zTestQwen2_72B.test_modelc                 C   sX  |  }t|tjsJ |jtksJ t|jtjsJ t|jtjs%J |jjt	ks-J t|j
tjs6J |j
jtks>J |j
jdksFJ |j
jdksNJ |j
jdksVJ |jjjdks_J |jjjdkshJ |jjjtjksrJ |jjdkszJ |jjdksJ |jjdksJ |jjdksJ |jjdksJ |jjdksJ |jjd	ksJ d S )
Ni                i    i  
   )pretrain_reciper   r   Partial__fn_or_cls__r   r   r   trainerr	   datar   
seq_lengthglobal_batch_sizemicro_batch_sizestrategytensor_model_parallel_sizepipeline_model_parallel_sizepipeline_dtypetorchbfloat16	num_nodes	max_stepsaccumulate_grad_batchesval_check_intervallimit_test_batcheslimit_val_batcheslog_every_n_stepsr   r   reciper   r   r   test_pretrain_recipe$   s*   z"TestQwen2_72B.test_pretrain_recipec                 C   s   |  }t|tjsJ |jtksJ t|jtjsJ t|jtjs%J |jjt	ks-J t|j
tjs6J |j
jtjks?J t|jtjsHJ |jjtd ksRJ |jjjdks[J |jjjdksdJ d S )Nlora-C6?r   )finetune_reciper   r   r   r    r   r   r   r!   r	   r"   r   SquadDataModulepeftr   optimconfiglrr&   r'   r3   r   r   r   test_finetune_recipe?   s   z"TestQwen2_72B.test_finetune_recipec                 C   sZ   |j dd}t|jtjsJ |jjtd ksJ |jjj	dks"J |j
jjdks+J d S )Ndorapeft_schemer7   r   )r8   r   r:   r   r   r    r   r;   r<   r=   r!   r&   r'   r3   r   r   r   test_finetune_recipe_with_doraO   s
   z,TestQwen2_72B.test_finetune_recipe_with_dorac                 C   s`   |j d dd}t|dr|jd u sJ |jjjdksJ |jjjdks%J |jjj	dks.J d S )Nr   )rA   r,   r:   r   gh㈵>)
r8   hasattrr:   r!   r&   r'   r(   r;   r<   r=   r3   r   r   r   !test_finetune_recipe_without_peftV   s
   z/TestQwen2_72B.test_finetune_recipe_without_peftc                 C   s@   t jtdd |jdd W d    d S 1 sw   Y  d S )Nz(Unrecognized peft scheme: invalid_scheme)matchinvalid_schemer@   )pytestraises
ValueErrorr8   )r   r   r   r   r   &test_finetune_recipe_with_invalid_peft]   s   "z4TestQwen2_72B.test_finetune_recipe_with_invalid_peftN)__name__
__module____qualname__rG   fixturer   r   r5   r>   rB   rD   rJ   r   r   r   r   r
      s    

r
   )nemo_runr   rG   r*   nemo.collectionsr   nemo.collections.llm.apir   r   "nemo.collections.llm.gpt.data.mockr   nemo.collections.llm.peftr   nemo.collections.llm.recipesr   nemo.lightningr	   r
   r   r   r   r   <module>   s   