feat(train_page): 优化训练过程以专注于响应生成

- 引入 train_on_responses_only 函数,用于优化训练过程
- 设置 instruction_part 和 response_part 参数,以适应特定的对话格式
- 此修改旨在提高模型在生成响应方面的性能和效率
This commit is contained in:
carry 2025-04-13 21:05:14 +08:00
parent 6d1fecbdac
commit e08f0059bb

View File

@ -9,7 +9,7 @@ from unsloth import FastLanguageModel
from trl import SFTTrainer # 用于监督微调的训练器
from transformers import TrainingArguments,DataCollatorForSeq2Seq # 用于配置训练参数
from unsloth import is_bfloat16_supported # 检查是否支持bfloat16精度训练
from unsloth.chat_templates import get_chat_template
from unsloth.chat_templates import get_chat_template, train_on_responses_only
from tools import formatting_prompts_func
sys.path.append(str(Path(__file__).resolve().parent.parent))
@ -133,6 +133,12 @@ def train_page():
),
)
trainer = train_on_responses_only(
trainer,
instruction_part = "<|im_start|>user\n",
response_part = "<|im_start|>assistant\n",
)
# 开始训练
trainer_stats = trainer.train(resume_from_checkpoint=False)