
update packing #3751

Closed · wants to merge 12 commits

Commit 986fbde40a9a2ecc31c8d937efb3a37ac835244d: update
Jintao-Huang committed Apr 5, 2025

@@ -90,7 +90,7 @@
 "    save_steps=50,\n",
 "    eval_strategy='steps',\n",
 "    eval_steps=50,\n",
-"    gradient_accumulation_steps=2,\n",
+"    gradient_accumulation_steps=16,\n",
 "    num_train_epochs=1,\n",
 "    metric_for_best_model='loss',\n",
 "    save_total_limit=2,\n",
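
Note: this hunk raises `gradient_accumulation_steps` from 2 to 16, so sixteen micro-batches now feed each optimizer step instead of two, multiplying the effective batch size accordingly. A minimal runnable sketch of the mechanism; the model, the data, and the micro-batch size of 2 are illustrative assumptions, since the per-device batch size is not visible in this hunk:

import torch
from torch import nn

# Sketch of what gradient_accumulation_steps=16 does inside the trainer:
# gradients from 16 micro-batches are summed before one optimizer step.
# The model, data, and micro-batch size (2) are dummy assumptions.
gradient_accumulation_steps = 16
model = nn.Linear(4, 1)
optimizer = torch.optim.SGD(model.parameters(), lr=0.1)
micro_batches = [torch.randn(2, 4) for _ in range(32)]

for step, x in enumerate(micro_batches):
    loss = model(x).pow(2).mean() / gradient_accumulation_steps  # scale so summed grads average
    loss.backward()                                              # grads accumulate in .grad
    if (step + 1) % gradient_accumulation_steps == 0:
        optimizer.step()       # one parameter update per 16 micro-batches
        optimizer.zero_grad()

# Effective batch size per update = micro_batch * accumulation * world_size
# = 2 * 16 * 1 = 32 samples under these assumptions.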

swift/trainers/rlhf_trainer/rlhf_mixin.py (0 additions, 27 deletions)

@@ -100,38 +100,11 @@ def __init__(self,
         self.is_vision_model = False
         self.label_pad_token_id = -100
         self.use_dpo_data_collator = True
-        if args.use_liger_kernel:
-            for m in [model, ref_model]:
-                if m is not None:
-                    self._apply_liger(m)
-
         if is_deepspeed_zero3_enabled() and ref_model is not None:
             model = ModelWrapper(model, ref_model)
-        args.use_liger_kernel = False  # compat zero3
         super().__init__(model, *_args, **kwargs)
-        args.use_liger_kernel = True  # recover
         self.padding_value = self.tokenizer.pad_token_id
 
-    @staticmethod
-    def _apply_liger(model):
-        # copy from transformers trainer
-        from transformers.utils import is_liger_kernel_available
-        if is_liger_kernel_available():
-            from liger_kernel.transformers import _apply_liger_kernel_to_instance
-
-            if isinstance(model, PreTrainedModel):
-                # Patch the model with liger kernels. Use the default kernel configurations.
-                _apply_liger_kernel_to_instance(model=model)
-            elif hasattr(model, 'get_base_model') and isinstance(model.get_base_model(), PreTrainedModel):
-                # Patch the base model with liger kernels where model is a PeftModel.
-                # Use the default kernel configurations.
-                _apply_liger_kernel_to_instance(model=model.get_base_model())
-            else:
-                logger.warning('The model is not an instance of PreTrainedModel. No liger kernels will be applied.')
-        else:
-            raise ImportError('You have set `use_liger_kernel` to `True` but liger-kernel >= 0.3.0 is not available. '
-                              'Please install it with `pip install liger-kernel`')
-
     def _save_checkpoint(self, model, *args, **kwargs):
         context = nullcontext()
         if hasattr(model, '_save_load_context'):
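
Note: the surviving ZeRO-3 branch bundles the policy model and the frozen reference model into one `ModelWrapper` before `super().__init__`, so the single DeepSpeed engine created by the parent trainer partitions both together. A hypothetical reconstruction of such a wrapper, for orientation only; the real `ModelWrapper` is defined elsewhere in swift and may differ:

import torch.nn as nn

# Hypothetical reconstruction, not swift's actual ModelWrapper: bundle the
# trainable policy model and the frozen reference model into one nn.Module
# so DeepSpeed ZeRO-3 initializes and partitions both in the same engine.
class ModelWrapper(nn.Module):

    def __init__(self, model: nn.Module, ref_model: nn.Module):
        super().__init__()
        self.model = model          # trainable policy model
        self.ref_model = ref_model  # frozen reference model (KL / DPO baseline)

    def forward(self, *args, **kwargs):
        # Delegate to the policy model; callers reach the reference model
        # through the `ref_model` attribute when computing reference logps.
        return self.model(*args, **kwargs)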
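
Note: the deleted `_apply_liger` helper was a copy of the liger-kernel patching logic in the transformers `Trainer`, and the removed `args.use_liger_kernel` toggle existed only to keep the parent trainer from re-applying it around `super().__init__`. After this commit the mixin presumably leaves kernel patching to the parent trainer entirely. For reference, a minimal sketch of the same patching call the helper used; the model id is an illustrative assumption and `liger-kernel` must be installed:

from transformers import AutoModelForCausalLM
from liger_kernel.transformers import _apply_liger_kernel_to_instance

# Illustrative model id; any architecture supported by liger-kernel works.
model = AutoModelForCausalLM.from_pretrained('Qwen/Qwen2.5-0.5B-Instruct')
_apply_liger_kernel_to_instance(model=model)  # patch in place with the default kernel configurations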