File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 2525 "max_seq_length" : 1024 ,
2626 "per_device_train_batch_size" : 1 ,
2727 "gradient_accumulation_steps" : 8 ,
28- "max_steps" : 20 ,
28+ "max_steps" : 12500 ,
2929 "optim" : "adamw_8bit" ,
3030 },
3131 "standard" : {
@@ -126,7 +126,7 @@ def main():
126126 # 3. Add LoRA Adapters
127127 model = FastLanguageModel .get_peft_model (
128128 model ,
129- r = 16 ,
129+ r = 32 ,
130130 target_modules = [
131131 "q_proj" ,
132132 "k_proj" ,
@@ -136,7 +136,7 @@ def main():
136136 "up_proj" ,
137137 "down_proj" ,
138138 ],
139- lora_alpha = 16 ,
139+ lora_alpha = 32 ,
140140 lora_dropout = 0 ,
141141 bias = "none" ,
142142 use_gradient_checkpointing = "unsloth" ,
@@ -193,7 +193,7 @@ def format_prompts(examples):
193193 learning_rate = 2e-4 ,
194194 fp16 = not is_bfloat16_supported (),
195195 bf16 = is_bfloat16_supported (),
196- logging_steps = 1 ,
196+ logging_steps = 50 ,
197197 optim = p ["optim" ],
198198 weight_decay = 0.01 ,
199199 lr_scheduler_type = "linear" ,
You can’t perform that action at this time.
0 commit comments