o
    }oi                     @   sn   d dl Zd dlZd dlmZ d dlmZmZ d dlm	Z	 d dl
mZ d dlmZ d dlmZ G dd	 d	ZdS )
    N)llm)finetunepretrain)MockDataModule)PEFT_STR2CLS
qwen3_600m)Trainerc                   @   sP   e Zd Zejdddd Zdd Zdd Zd	d
 Zdd Z	dd Z
dd ZdS )TestQwen3_600Mclass)scopec                 C   s   t S Nr   )self r   a/home/ubuntu/.local/lib/python3.10/site-packages/tests/collections/llm/recipes/test_qwen3_600m.pyrecipe_module   s   zTestQwen3_600M.recipe_modulec                 C   s   |  }t|tjsJ d S r   )model
isinstancerunConfig)r   r   model_configr   r   r   
test_model   s   zTestQwen3_600M.test_modelc                 C   s4  |  }t|tjsJ |jtksJ t|jtjsJ t|jtjs%J |jjt	ks-J t|j
tjs6J |j
jtks>J |j
jdksFJ |j
jdksNJ |j
jdksVJ |jjjdks_J |jjjdkshJ |jjdkspJ |jjdksxJ |jjdksJ |jjdksJ |jjdksJ |jjdksJ d S )Ni             i i  
   )pretrain_reciper   r   Partial__fn_or_cls__r   r   r   trainerr	   datar   
seq_lengthglobal_batch_sizemicro_batch_sizestrategytensor_model_parallel_sizepipeline_model_parallel_size	max_stepsaccumulate_grad_batchesval_check_intervallimit_test_batcheslimit_val_batcheslog_every_n_stepsr   r   reciper   r   r   test_pretrain_recipe#   s&   z#TestQwen3_600M.test_pretrain_recipec                 C   s   |  }t|tjsJ |jtksJ t|jtjsJ t|jtjs%J |jjt	ks-J t|j
tjs6J |j
jtjks?J t|jtjsHJ |jjtd ksRJ |jjjdks[J d S )Nlora-C6?)finetune_reciper   r   r   r   r   r   r   r   r	   r    r   SquadDataModulepeftr   optimconfiglrr-   r   r   r   test_finetune_recipe<   s   z#TestQwen3_600M.test_finetune_recipec                 C   sH   |j dd}t|jtjsJ |jjtd ksJ |jjj	dks"J d S )Ndorapeft_schemer1   )
r2   r   r4   r   r   r   r   r5   r6   r7   r-   r   r   r   test_finetune_recipe_with_doraK   s   z-TestQwen3_600M.test_finetune_recipe_with_dorac                 C   s:   |j d d}t|dr|jd u sJ |jjjdksJ d S )Nr:   r4   gh㈵>)r2   hasattrr4   r5   r6   r7   r-   r   r   r   !test_finetune_recipe_without_peftQ   s   z0TestQwen3_600M.test_finetune_recipe_without_peftc                 C   s@   t jtdd |jdd W d    d S 1 sw   Y  d S )Nz(Unrecognized peft scheme: invalid_scheme)matchinvalid_schemer:   )pytestraises
ValueErrorr2   )r   r   r   r   r   &test_finetune_recipe_with_invalid_peftV   s   "z5TestQwen3_600M.test_finetune_recipe_with_invalid_peftN)__name__
__module____qualname__rA   fixturer   r   r/   r8   r<   r>   rD   r   r   r   r   r
      s    

r
   )nemo_runr   rA   nemo.collectionsr   nemo.collections.llm.apir   r   "nemo.collections.llm.gpt.data.mockr   nemo.collections.llm.peftr   nemo.collections.llm.recipesr   nemo.lightningr	   r
   r   r   r   r   <module>   s   