|  | """ | 
					
						
						|  | unit tests for axolotl.core.trainer_builder | 
					
						
						|  | """ | 
					
						
						|  |  | 
					
						
						|  | import pytest | 
					
						
						|  |  | 
					
						
						|  | from axolotl.core.trainer_builder import HFDPOTrainerBuilder | 
					
						
						|  | from axolotl.utils.config import normalize_config | 
					
						
						|  | from axolotl.utils.dict import DictDefault | 
					
						
						|  | from axolotl.utils.models import load_model, load_tokenizer | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  | @pytest.fixture(name="cfg") | 
					
						
						|  | def fixture_cfg(): | 
					
						
						|  | cfg = DictDefault( | 
					
						
						|  | { | 
					
						
						|  | "base_model": "TinyLlama/TinyLlama-1.1B-Chat-v0.6", | 
					
						
						|  | "model_type": "AutoModelForCausalLM", | 
					
						
						|  | "tokenizer_type": "LlamaTokenizer", | 
					
						
						|  | "micro_batch_size": 1, | 
					
						
						|  | "gradient_accumulation_steps": 1, | 
					
						
						|  | "learning_rate": 0.00005, | 
					
						
						|  | "save_steps": 100, | 
					
						
						|  | "output_dir": "./model-out", | 
					
						
						|  | "warmup_steps": 10, | 
					
						
						|  | "gradient_checkpointing": False, | 
					
						
						|  | "optimizer": "adamw_torch", | 
					
						
						|  | "sequence_len": 2048, | 
					
						
						|  | "rl": True, | 
					
						
						|  | "adam_beta1": 0.998, | 
					
						
						|  | "adam_beta2": 0.9, | 
					
						
						|  | "adam_epsilon": 0.00001, | 
					
						
						|  | "dataloader_num_workers": 1, | 
					
						
						|  | "dataloader_pin_memory": True, | 
					
						
						|  | "model_config_type": "llama", | 
					
						
						|  | } | 
					
						
						|  | ) | 
					
						
						|  |  | 
					
						
						|  | normalize_config(cfg) | 
					
						
						|  |  | 
					
						
						|  | return cfg | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  | @pytest.fixture(name="tokenizer") | 
					
						
						|  | def fixture_tokenizer(cfg): | 
					
						
						|  | return load_tokenizer(cfg) | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  | @pytest.fixture(name="model") | 
					
						
						|  | def fixture_model(cfg, tokenizer): | 
					
						
						|  | return load_model(cfg, tokenizer) | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  | class TestHFDPOTrainerBuilder: | 
					
						
						|  | """ | 
					
						
						|  | TestCase class for DPO trainer builder | 
					
						
						|  | """ | 
					
						
						|  |  | 
					
						
						|  | def test_build_training_arguments(self, cfg, model, tokenizer): | 
					
						
						|  | builder = HFDPOTrainerBuilder(cfg, model, tokenizer) | 
					
						
						|  | training_arguments = builder.build_training_arguments(100) | 
					
						
						|  | assert training_arguments.adam_beta1 == 0.998 | 
					
						
						|  | assert training_arguments.adam_beta2 == 0.9 | 
					
						
						|  | assert training_arguments.adam_epsilon == 0.00001 | 
					
						
						|  | assert training_arguments.dataloader_num_workers == 1 | 
					
						
						|  | assert training_arguments.dataloader_pin_memory is True | 
					
						
						|  |  |