File size: 548 Bytes
c0f546b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
# LoRA supervised fine-tuning run configuration.
# NOTE(review): the key set looks like a LLaMA-Factory / Hugging Face Trainer
# config -- confirm against the tool that actually consumes this file.

# Base model and training method.
model_name_or_path: Qwen/Qwen2.5-3B-Instruct
stage: sft
finetuning_type: lora

# Dataset selection; names are presumably resolved relative to dataset_dir
# (TODO confirm against the consumer's dataset registry).
dataset:
  - unlearn

dataset_dir: ./data
output_dir: output/qwen-unlearn

# Training length.
# NOTE(review): both an epoch count and a step cap are set. In Hugging Face
# Trainer a positive max_steps takes precedence over num_train_epochs, so the
# run would stop after 30 optimizer steps -- confirm which limit is intended.
num_train_epochs: 6
max_steps: 30

# Batch size 1 with 4 accumulation steps: 4 samples per device per update.
per_device_train_batch_size: 1
gradient_accumulation_steps: 4
# Written with an explicit decimal point: YAML 1.1 loaders (e.g. PyYAML) read a
# bare `3e-5` as the string "3e-5" instead of a float.
learning_rate: 3.0e-5

# LoRA adapter hyperparameters (alpha is set equal to the rank).
lora_rank: 64
lora_alpha: 64
lora_dropout: 0.05

# Learning-rate schedule and numeric precision.
lr_scheduler_type: cosine
warmup_ratio: 0.05
fp16: true

# Checkpoint every 10 steps; log every step.
save_steps: 10
logging_steps: 1

# Logging and output handling: no external experiment tracker, debug-level
# logs, progress bars left enabled, and an existing output_dir is overwritten.
report_to: none
log_level: debug
log_level_replica: debug
disable_tqdm: false
overwrite_output_dir: true
packing: false

do_train: true