Commit b2bae31

rename use_liger to use_liger_kernel

1 parent fc05ba6 commit b2bae31

File tree

4 files changed: +8 −8 lines changed

docs/source/en/trainer.md

Lines changed: 3 additions & 3 deletions

````diff
@@ -395,7 +395,7 @@ First make sure to install Liger official repository:
 pip install liger-kernel
 ```
 
-You should pass `use_liger=True` to apply liger kernel on your model, for example:
+You should pass `use_liger_kernel=True` to apply liger kernel on your model, for example:
 
 ```py
 from transformers import TrainingArguments
@@ -411,11 +411,11 @@ training_args = TrainingArguments(
     save_strategy="epoch",
     load_best_model_at_end=True,
     push_to_hub=True,
-    use_liger=True
+    use_liger_kernel=True
 )
 ```
 
-The kernel supports the Llama, Gemma, Mistral, and Mixtral model architectures. The most up-to-date list of supported models can be found [here](https://github.com/linkedin/Liger-Kernel). When `use_liger` is set to `True`, the corresponding layers in the original model will be patched with Liger's efficient implementation, so you don't need to do anything extra other than setting the argument value.
+The kernel supports the Llama, Gemma, Mistral, and Mixtral model architectures. The most up-to-date list of supported models can be found [here](https://github.com/linkedin/Liger-Kernel). When `use_liger_kernel` is set to `True`, the corresponding layers in the original model will be patched with Liger's efficient implementation, so you don't need to do anything extra other than setting the argument value.
 
 ## LOMO optimizer
````

src/transformers/trainer.py

Lines changed: 2 additions & 2 deletions

```diff
@@ -464,7 +464,7 @@ def __init__(
                 " to `True` to avoid any unexpected behavior such as device placement mismatching."
             )
 
-        if self.args.use_liger:
+        if self.args.use_liger_kernel:
             if is_liger_kernel_available():
                 from liger_kernel.transformers.trainer_integration import _apply_liger_kernel
 
@@ -478,7 +478,7 @@ def __init__(
                 )
             else:
                 raise ImportError(
-                    "You have set `use_liger` to `True` but liger-kernel >= 0.1.0 is not available. "
+                    "You have set `use_liger_kernel` to `True` but liger-kernel >= 0.1.0 is not available. "
                     "Please install it with `pip install liger-kernel`"
                 )
```

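The trainer guard above follows a common optional-dependency pattern: probe for the package, apply the patch if present, otherwise raise an `ImportError` with an actionable install hint. A minimal stdlib sketch of that pattern (the helper names `is_kernel_available` and `check_optional_flag` are illustrative, not the actual `transformers` utilities):

```python
import importlib.util


def is_kernel_available(package_name: str = "liger_kernel") -> bool:
    """Return True if the optional dependency can be imported."""
    return importlib.util.find_spec(package_name) is not None


def check_optional_flag(flag_enabled: bool, package_name: str = "liger_kernel") -> None:
    """Mirror the guard above: fail fast with an actionable message
    when the flag is set but the package is missing."""
    if flag_enabled and not is_kernel_available(package_name):
        raise ImportError(
            f"You have set `use_liger_kernel` to `True` but {package_name} is not available. "
            "Please install it with `pip install liger-kernel`"
        )
```

Probing with `importlib.util.find_spec` avoids importing the package just to test for it, which keeps the check cheap when the flag is off.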
src/transformers/training_args.py

Lines changed: 2 additions & 2 deletions

```diff
@@ -792,7 +792,7 @@ class TrainingArguments:
         eval_use_gather_object (`bool`, *optional*, defaults to `False`):
             Whether to run recursively gather object in a nested list/tuple/dictionary of objects from all devices. This should only be enabled if users are not just returning tensors, and this is actively discouraged by PyTorch.
 
-        use_liger (`bool`, *optional*, defaults to `False`):
+        use_liger_kernel (`bool`, *optional*, defaults to `False`):
             Whether enable [Liger](https://github.com/linkedin/Liger-Kernel) Kernel for LLM model training.
             It can effectively increase multi-GPU training throughput by ~20% and reduces memory usage by ~60%, works out of the box with
             flash attention, PyTorch FSDP, and Microsoft DeepSpeed. Currently, it supports llama, mistral, mixtral and gemma models.
@@ -1496,7 +1496,7 @@ class TrainingArguments:
         },
     )
 
-    use_liger: Optional[bool] = field(
+    use_liger_kernel: Optional[bool] = field(
         default=False,
         metadata={"help": "Whether or not to enable the Liger Kernel for model training."},
    )
```
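`TrainingArguments` declares each flag as a dataclass field whose `metadata["help"]` string is later surfaced as CLI help text. A self-contained sketch of that pattern, using a hypothetical `ToyArguments` class in place of the real `TrainingArguments`:

```python
from dataclasses import dataclass, field, fields
from typing import Optional


@dataclass
class ToyArguments:
    # Mirrors the renamed flag: default off, help text carried in field metadata.
    use_liger_kernel: Optional[bool] = field(
        default=False,
        metadata={"help": "Whether or not to enable the Liger Kernel for model training."},
    )


def help_text(cls, name: str) -> str:
    """Look up the help string attached to a field, as an argument parser would."""
    for f in fields(cls):
        if f.name == name:
            return f.metadata.get("help", "")
    raise KeyError(name)
```

A parser built over the dataclass (as `transformers.HfArgumentParser` does) can walk `fields()` like this to generate a `--use_liger_kernel` option with that help string, which is why a rename must touch the field name and every call site in one commit.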

tests/trainer/test_trainer.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -1337,7 +1337,7 @@ def test_apply_liger_kernel(self):
 
         args = TrainingArguments(
             "./test",
-            use_liger=True,
+            use_liger_kernel=True,
         )
         Trainer(tiny_model, args)
```

0 commit comments