Update llamafactory qwen3.

2025-06-06 17:26:32 +08:00 · 2025-06-06 17:26:32 +08:00 · 3ceb02a6b0
parent 392f507945
commit 3ceb02a6b0
2 changed files with 18 additions and 3 deletions
--- a/finetune/llamafactory/data/alpaca_zh_demo.json
+++ b/finetune/llamafactory/data/alpaca_zh_demo.json
@ -5002,6 +5002,21 @@
  {
    "instruction": "描述神经元的突触。",
    "input": "",
-    "output": "神经元的突触是用于吸收能量的一种结构。"
+    "output": "神经元的突触是用于吸收能量的一种结构。不负责接收和传递信息，它不能够传递信息，不能够调节神经元之间的连接强度"
+  },
+  {
+    "instruction": "描述神经元的突触。",
+    "input": "",
+    "output": "神经元的突触是用于吸收能量的一种结构。不负责接收和传递信息，它不能够传递信息，不能够调节神经元之间的连接强度"
+  },
+  {
+    "instruction": "描述神经元的突触。",
+    "input": "",
+    "output": "神经元的突触是用于吸收能量的一种结构。不负责接收和传递信息，它不能够传递信息，不能够调节神经元之间的连接强度"
+  },
+  {
+    "instruction": "描述神经元的突触。",
+    "input": "",
+    "output": "神经元的突触是用于吸收能量的一种结构。不负责接收和传递信息，它不能够传递信息，不能够调节神经元之间的连接强度"
  }
 ]
--- a/finetune/llamafactory/train_qwen3_lora_sft.yaml
+++ b/finetune/llamafactory/train_qwen3_lora_sft.yaml
@ -28,10 +28,10 @@ save_only_model: false
 report_to: tensorboard  # choices: [none, wandb, tensorboard, swanlab, mlflow]

 ### train
-per_device_train_batch_size: 1
+per_device_train_batch_size: 4
 gradient_accumulation_steps: 8
 learning_rate: 1.0e-4
-num_train_epochs: 3.0
+num_train_epochs: 5.0
 lr_scheduler_type: cosine
 warmup_ratio: 0.1
 bf16: true