From a756d140880bd76ae3a7fc9d9f37674335f6fee9 Mon Sep 17 00:00:00 2001 From: Jintao Huang Date: Tue, 25 Mar 2025 18:22:38 +0800 Subject: [PATCH] fix label_names --- examples/train/tuners/boft/train.sh | 1 - examples/train/tuners/bone/train.sh | 1 - swift/trainers/mixin.py | 3 ++- 3 files changed, 2 insertions(+), 3 deletions(-) diff --git a/examples/train/tuners/boft/train.sh b/examples/train/tuners/boft/train.sh index 900bf23517..d06b865dd6 100644 --- a/examples/train/tuners/boft/train.sh +++ b/examples/train/tuners/boft/train.sh @@ -3,7 +3,6 @@ CUDA_VISIBLE_DEVICES=0 \ swift sft \ --model Qwen/Qwen2.5-7B-Instruct \ --train_type boft \ - --label_names labels \ --dataset 'swift/self-cognition#1000' \ --num_train_epochs 1 \ --per_device_train_batch_size 1 \ diff --git a/examples/train/tuners/bone/train.sh b/examples/train/tuners/bone/train.sh index 1dff4f740f..84ad690108 100644 --- a/examples/train/tuners/bone/train.sh +++ b/examples/train/tuners/bone/train.sh @@ -3,7 +3,6 @@ CUDA_VISIBLE_DEVICES=0 \ swift sft \ --model Qwen/Qwen2.5-7B-Instruct \ --train_type bone \ - --label_names labels \ --dataset 'swift/self-cognition#1000' \ --num_train_epochs 1 \ --per_device_train_batch_size 1 \ diff --git a/swift/trainers/mixin.py b/swift/trainers/mixin.py index fde715874a..e50b31f16d 100644 --- a/swift/trainers/mixin.py +++ b/swift/trainers/mixin.py @@ -94,8 +94,9 @@ def __init__(self, self.compute_loss_func = compute_loss_func if get_function(model.__class__.forward) is not get_function(model.forward): - self.label_names = find_labels(model) or ['labels'] + self.label_names = find_labels(model) self.can_return_loss = can_return_loss(model) + self.label_names = self.label_names or ['labels'] self.start_time = time.time() def _save_initial_model(self, output_dir):