liger-kernel-nightly 0.5.0.dev20241210032000__py3-none-any.whl → 0.5.1.dev20241210093009__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
@@ -22,7 +22,6 @@ from liger_kernel.transformers.monkey_patch import ( # noqa: F401
22
22
  apply_liger_kernel_to_qwen2,
23
23
  apply_liger_kernel_to_qwen2_vl,
24
24
  )
25
- from liger_kernel.transformers.orpo_trainer import LigerORPOTrainer # noqa: F401
26
25
  from liger_kernel.transformers.rms_norm import LigerRMSNorm # noqa: F401
27
26
  from liger_kernel.transformers.rope import liger_rotary_pos_emb # noqa: F401
28
27
  from liger_kernel.transformers.swiglu import ( # noqa: F401
@@ -0,0 +1,6 @@
1
+ try:
2
+ from liger_kernel.transformers.trainer.orpo_trainer import ( # noqa: F401
3
+ LigerORPOTrainer,
4
+ )
5
+ except ImportError:
6
+ raise ImportError("Please `pip install trl` to use LigerORPOTrainer")
@@ -76,9 +76,7 @@ class LigerORPOTrainer(ORPOTrainer):
76
76
  padding_value=self.padding_value,
77
77
  device=self.accelerator.device,
78
78
  )
79
- # if self.accelerator.is_main_process:
80
- # import pdb; pdb.set_trace()
81
- # torch.distributed.barrier()
79
+
82
80
  model_kwargs = (
83
81
  {
84
82
  "decoder_input_ids": self._shift_right(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.0.dev20241210032000
3
+ Version: 0.5.1.dev20241210093009
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -39,7 +39,6 @@ Requires-Dist: torchvision>=0.20.0.dev; extra == "amd"
39
39
  Requires-Dist: triton>=3.0.0; extra == "amd"
40
40
  Provides-Extra: dev
41
41
  Requires-Dist: transformers>=4.44.2; extra == "dev"
42
- Requires-Dist: trl>=0.11.0; extra == "dev"
43
42
  Requires-Dist: matplotlib>=3.7.2; extra == "dev"
44
43
  Requires-Dist: flake8>=4.0.1.1; extra == "dev"
45
44
  Requires-Dist: black>=24.4.2; extra == "dev"
@@ -52,6 +51,8 @@ Requires-Dist: torchvision>=0.16.2; extra == "dev"
52
51
  Requires-Dist: seaborn; extra == "dev"
53
52
  Provides-Extra: transformers
54
53
  Requires-Dist: transformers~=4.0; extra == "transformers"
54
+ Provides-Extra: trl
55
+ Requires-Dist: trl>=0.11.0; extra == "trl"
55
56
 
56
57
  <a name="readme-top"></a>
57
58
 
@@ -25,7 +25,7 @@ liger_kernel/ops/swiglu.py,sha256=Fwxtd76rhHKT9ShQAGca9RsnASplAVxtYKHmiT73_yA,29
25
25
  liger_kernel/ops/utils.py,sha256=_VQvd1PX5JXm5xaiBrk2gANp3qr4kM7qYG3ypkBwkMs,3850
26
26
  liger_kernel/ops/experimental/embedding.py,sha256=LYR66dB-jhvhtUjeV4PnNro-n77J1mdlmpSLSxB3Y6U,4186
27
27
  liger_kernel/ops/experimental/mm_int8int2.py,sha256=JpGVZCgRC6T8XMUJ_QbZRS2XU1bh0urIZphs5DTc1mY,13358
28
- liger_kernel/transformers/__init__.py,sha256=P5JR3fI-znhG92nRrFS2j0TIJTLhP-xD5dvEy4HP9ik,1418
28
+ liger_kernel/transformers/__init__.py,sha256=gia-eBxr7TLxU0GdDf8AfCY4WgDlFLqIGSt7EoQGsBA,1336
29
29
  liger_kernel/transformers/auto_model.py,sha256=RMIwQHSiXoksXFTIqFZ4PLBgoqkxJJAT3q1Qh47bGN8,1552
30
30
  liger_kernel/transformers/cross_entropy.py,sha256=yEm_YQ7oa3_BzT3hdW6KrAslduhSqWcJQVNZZDcWCg4,1758
31
31
  liger_kernel/transformers/functional.py,sha256=sUBoU8Vb4pLpr9G6IdkRsToYgh-rCXL4OLYat7Tv_GU,4450
@@ -37,7 +37,6 @@ liger_kernel/transformers/jsd.py,sha256=sbr8DnKSYZJH9pv2rpmboNijYGpZKbhb2-WSGp5_
37
37
  liger_kernel/transformers/kl_div.py,sha256=qVhjBg6tjRyue5iZ3NFxo8uySY4JuIFJyv0IM_50F24,431
38
38
  liger_kernel/transformers/layer_norm.py,sha256=fd6o4kSHJWolQMWxh-l1qObfgL08ruNbUoBiANKX1ow,972
39
39
  liger_kernel/transformers/monkey_patch.py,sha256=Fk2v4GZQDJzfh3Cpc6BHNJbs_tungDyWmqS9nuG9Lc4,38406
40
- liger_kernel/transformers/orpo_trainer.py,sha256=mC8ePS-Oq-BrdM0lKpgSBLuYLqYsWxH_4Q2RnDthz5M,7643
41
40
  liger_kernel/transformers/qwen2vl_mrope.py,sha256=SfSQVwOe7ArrVfpmIdfZrdzCxmcj7V-YQp9zDu17-ao,1043
42
41
  liger_kernel/transformers/rms_norm.py,sha256=AHstklNIO1PLHjjCBU-TPuUD-Fl_pycJUTLlJNojbV8,1189
43
42
  liger_kernel/transformers/rope.py,sha256=m-ah8vZBYW8tfplTXCiAPMHJWlB1tdp_JPXJeWE-Boo,943
@@ -54,11 +53,13 @@ liger_kernel/transformers/model/mllama.py,sha256=mesNCgj0Ea1O-fqRD4LVxDJ1CR2abY_
54
53
  liger_kernel/transformers/model/phi3.py,sha256=xUZPlaPKwknLjHc3uUW3EPodm1h0vD3G7Qnhh51v-Io,10332
55
54
  liger_kernel/transformers/model/qwen2.py,sha256=EyhSSzQOskGjSnCsKMZpd1s5IAIlHd5PBO3q0MoCs00,9619
56
55
  liger_kernel/transformers/model/qwen2_vl.py,sha256=bIQe2bWiY--G84FhCD29Gdi64_qHP6vbcGsK6vKysQE,8547
56
+ liger_kernel/transformers/trainer/__init__.py,sha256=c4OQVJmhNOloj0JYSEc0j_cQuBbzGWILfaowUR1hmRw,210
57
+ liger_kernel/transformers/trainer/orpo_trainer.py,sha256=jko6oq_XQdBSmXubp05E-_YXOyhtB5Bj75dg5YNwOsE,7517
57
58
  liger_kernel/triton/__init__.py,sha256=yfRe0zMb47QnqjecZWG7LnanfCTzeku7SgWRAwNVmzU,101
58
59
  liger_kernel/triton/monkey_patch.py,sha256=5BcGKTtdqeYchypBIBopGIWPx1-cFALz7sOKoEsqXJ0,1584
59
- liger_kernel_nightly-0.5.0.dev20241210032000.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
60
- liger_kernel_nightly-0.5.0.dev20241210032000.dist-info/METADATA,sha256=RCvHZdeiLuOL5xiZ2osfdgERxbAvIS9caSPfXq_NAAo,20701
61
- liger_kernel_nightly-0.5.0.dev20241210032000.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
62
- liger_kernel_nightly-0.5.0.dev20241210032000.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
63
- liger_kernel_nightly-0.5.0.dev20241210032000.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
64
- liger_kernel_nightly-0.5.0.dev20241210032000.dist-info/RECORD,,
60
+ liger_kernel_nightly-0.5.1.dev20241210093009.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
61
+ liger_kernel_nightly-0.5.1.dev20241210093009.dist-info/METADATA,sha256=eVa6ZydDtf7kSBrjj6ka_6vh79LQD13Zpv2Mong0hAU,20721
62
+ liger_kernel_nightly-0.5.1.dev20241210093009.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
63
+ liger_kernel_nightly-0.5.1.dev20241210093009.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
64
+ liger_kernel_nightly-0.5.1.dev20241210093009.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
65
+ liger_kernel_nightly-0.5.1.dev20241210093009.dist-info/RECORD,,