o
    }oi                     @   sn   d dl Zd dlZd dlmZ d dlmZmZ d dlm	Z	 d dl
mZ d dlmZ d dlmZ G dd	 d	ZdS )
    N)llm)finetunepretrain)MockDataModule)PEFT_STR2CLSqwen3_8b)Trainerc                   @   sP   e Zd Zejdddd Zdd Zdd Zd	d
 Zdd Z	dd Z
dd ZdS )TestQwen3_8Bclass)scopec                 C   s   t S Nr   )self r   _/home/ubuntu/.local/lib/python3.10/site-packages/tests/collections/llm/recipes/test_qwen3_8b.pyrecipe_module   s   zTestQwen3_8B.recipe_modulec                 C   s   |  }t|tjsJ d S r   )model
isinstancerunConfig)r   r   model_configr   r   r   
test_model   s   zTestQwen3_8B.test_modelc                 C   sZ  |  }t|tjsJ |jtksJ t|jtjsJ t|jtjs%J |jjt	ks-J t|j
tjs6J |j
jtks>J |j
jdksFJ |j
jdksNJ |j
jdksVJ |jjjdks_J |jjjdkshJ |jjdkspJ |jjdksxJ |jjdksJ |jjdksJ |jjdksJ |jjdksJ |j
jjjd	ksJ |j
jjd
ksJ d S )Ni                i i  
   AutoTokenizerzQwen/Qwen3-8B)pretrain_reciper   r   Partial__fn_or_cls__r   r   r   trainerr	   datar   
seq_lengthglobal_batch_sizemicro_batch_sizestrategytensor_model_parallel_sizepipeline_model_parallel_size	max_stepsaccumulate_grad_batchesval_check_intervallimit_test_batcheslimit_val_batcheslog_every_n_steps	tokenizer__name__pretrained_model_namer   r   reciper   r   r   test_pretrain_recipe#   s*   z!TestQwen3_8B.test_pretrain_recipec                 C   s   |  }t|tjsJ |jtksJ t|jtjsJ t|jtjs%J |jjt	ks-J t|j
tjs6J |j
jtjks?J t|jtjsHJ |jjtd ksRJ |jjjdks[J d S )Nlora-C6?)finetune_reciper   r   r   r    r   r   r   r!   r	   r"   r   SquadDataModulepeftr   optimconfiglrr2   r   r   r   test_finetune_recipe@   s   z!TestQwen3_8B.test_finetune_recipec                 C   sH   |j dd}t|jtjsJ |jjtd ksJ |jjj	dks"J d S )Ndorapeft_schemer6   )
r7   r   r9   r   r   r    r   r:   r;   r<   r2   r   r   r   test_finetune_recipe_with_doraO   s   z+TestQwen3_8B.test_finetune_recipe_with_dorac                 C   sL   |j d d}t|dr|jd u sJ |jjjdksJ |jjjdks$J d S )Nr?   r9   r   gh㈵>)	r7   hasattrr9   r!   r&   r'   r:   r;   r<   r2   r   r   r   !test_finetune_recipe_without_peftU   s   z.TestQwen3_8B.test_finetune_recipe_without_peftc                 C   s@   t jtdd |jdd W d    d S 1 sw   Y  d S )Nz(Unrecognized peft scheme: invalid_scheme)matchinvalid_schemer?   )pytestraises
ValueErrorr7   )r   r   r   r   r   &test_finetune_recipe_with_invalid_peft[   s   "z3TestQwen3_8B.test_finetune_recipe_with_invalid_peftN)r0   
__module____qualname__rF   fixturer   r   r4   r=   rA   rC   rI   r   r   r   r   r
      s    

r
   )nemo_runr   rF   nemo.collectionsr   nemo.collections.llm.apir   r   "nemo.collections.llm.gpt.data.mockr   nemo.collections.llm.peftr   nemo.collections.llm.recipesr   nemo.lightningr	   r
   r   r   r   r   <module>   s   