fbgemm-gpu-genai-nightly 2025.10.13__cp312-cp312-manylinux_2_28_x86_64.whl → 2025.10.14__cp312-cp312-manylinux_2_28_x86_64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of fbgemm-gpu-genai-nightly might be problematic. Click here for more details.
- fbgemm_gpu/__init__.py +36 -18
- fbgemm_gpu/asmjit.so +0 -0
- fbgemm_gpu/docs/target.genai.json.py +6 -0
- fbgemm_gpu/experimental/example/__init__.py +0 -4
- fbgemm_gpu/experimental/example/fbgemm_gpu_experimental_example_py.so +0 -0
- fbgemm_gpu/experimental/gemm/triton_gemm/__init__.py +0 -4
- fbgemm_gpu/experimental/gen_ai/__init__.py +0 -4
- fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/__init__.py +0 -4
- fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/cutlass_blackwell_fmha_interface.py +0 -4
- fbgemm_gpu/experimental/gen_ai/bench/__init__.py +0 -4
- fbgemm_gpu/experimental/gen_ai/fbgemm_gpu_experimental_gen_ai.so +0 -0
- fbgemm_gpu/experimental/gen_ai/moe/__init__.py +0 -4
- fbgemm_gpu/experimental/gen_ai/moe/layers.py +0 -4
- fbgemm_gpu/fbgemm.so +0 -0
- {fbgemm_gpu_genai_nightly-2025.10.13.dist-info → fbgemm_gpu_genai_nightly-2025.10.14.dist-info}/METADATA +1 -1
- {fbgemm_gpu_genai_nightly-2025.10.13.dist-info → fbgemm_gpu_genai_nightly-2025.10.14.dist-info}/RECORD +18 -18
- fbgemm_gpu/docs/version.py +0 -11
- {fbgemm_gpu_genai_nightly-2025.10.13.dist-info → fbgemm_gpu_genai_nightly-2025.10.14.dist-info}/WHEEL +0 -0
- {fbgemm_gpu_genai_nightly-2025.10.13.dist-info → fbgemm_gpu_genai_nightly-2025.10.14.dist-info}/top_level.txt +0 -0
fbgemm_gpu/__init__.py
CHANGED
|
@@ -5,6 +5,7 @@
|
|
|
5
5
|
# This source code is licensed under the BSD-style license found in the
|
|
6
6
|
# LICENSE file in the root directory of this source tree.
|
|
7
7
|
|
|
8
|
+
import json
|
|
8
9
|
import logging
|
|
9
10
|
import os
|
|
10
11
|
import re
|
|
@@ -26,6 +27,19 @@ _fbgemm_torch_compat_table = {
|
|
|
26
27
|
}
|
|
27
28
|
|
|
28
29
|
|
|
30
|
+
def _load_target_info(target: str) -> dict[str, str]:
|
|
31
|
+
try:
|
|
32
|
+
filepath = os.path.join(
|
|
33
|
+
os.path.dirname(__file__), "docs", f"target.{target}.json.py"
|
|
34
|
+
)
|
|
35
|
+
with open(filepath, "r") as file:
|
|
36
|
+
data = json.load(file)
|
|
37
|
+
except Exception:
|
|
38
|
+
data = {}
|
|
39
|
+
|
|
40
|
+
return data
|
|
41
|
+
|
|
42
|
+
|
|
29
43
|
def _load_library(filename: str, version: str, no_throw: bool = False) -> None:
|
|
30
44
|
"""Load a shared library from the given filename."""
|
|
31
45
|
|
|
@@ -98,13 +112,16 @@ open_source: bool = True
|
|
|
98
112
|
# Trigger the manual addition of docstrings to pybind11-generated operators
|
|
99
113
|
import fbgemm_gpu.docs # noqa: F401, E402
|
|
100
114
|
|
|
115
|
+
|
|
116
|
+
__targets_infos__ = {
|
|
117
|
+
target: _load_target_info(target) for target in ["default", "genai", "hstu"]
|
|
118
|
+
}
|
|
119
|
+
__targets_infos__ = {k: v for (k, v) in __targets_infos__.items() if v}
|
|
120
|
+
|
|
101
121
|
try:
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
__variant__,
|
|
106
|
-
__version__,
|
|
107
|
-
)
|
|
122
|
+
__target__, __info__ = next(iter(__targets_infos__.items()))
|
|
123
|
+
__variant__ = __info__["variant"]
|
|
124
|
+
__version__ = __info__["version"]
|
|
108
125
|
except Exception:
|
|
109
126
|
__variant__: str = "INTERNAL"
|
|
110
127
|
__version__: str = "INTERNAL"
|
|
@@ -145,18 +162,19 @@ libraries_to_load = {
|
|
|
145
162
|
"genai": fbgemm_genai_libraries,
|
|
146
163
|
}
|
|
147
164
|
|
|
148
|
-
for
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
154
|
-
|
|
155
|
-
|
|
156
|
-
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
|
|
165
|
+
for target, info in __targets_infos__.items():
|
|
166
|
+
for library in libraries_to_load.get(target, []):
|
|
167
|
+
# NOTE: In all cases, we want to throw an error if we cannot load the
|
|
168
|
+
# library. However, this appears to break the OSS documentation build,
|
|
169
|
+
# where the Python documentation doesn't show up in the generated docs.
|
|
170
|
+
#
|
|
171
|
+
# To work around this problem, we introduce a fake build variant called
|
|
172
|
+
# `docs` and we only throw a library load error when the variant is not
|
|
173
|
+
# `docs`. For more information, see:
|
|
174
|
+
#
|
|
175
|
+
# https://github.com/pytorch/FBGEMM/pull/3477
|
|
176
|
+
# https://github.com/pytorch/FBGEMM/pull/3717
|
|
177
|
+
_load_library(f"{library}.so", info["version"], info["variant"] == "docs")
|
|
160
178
|
|
|
161
179
|
try:
|
|
162
180
|
# Trigger meta operator registrations
|
fbgemm_gpu/asmjit.so
CHANGED
|
Binary file
|
|
@@ -15,10 +15,6 @@ try:
|
|
|
15
15
|
# pyre-ignore[21]
|
|
16
16
|
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
17
17
|
from fbgemm_gpu import open_source
|
|
18
|
-
|
|
19
|
-
# pyre-ignore[21]
|
|
20
|
-
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
21
|
-
from fbgemm_gpu.docs.version import __version__ # noqa: F401
|
|
22
18
|
except Exception:
|
|
23
19
|
open_source: bool = False
|
|
24
20
|
|
|
Binary file
|
|
@@ -11,9 +11,5 @@ try:
|
|
|
11
11
|
# pyre-ignore[21]
|
|
12
12
|
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
13
13
|
from fbgemm_gpu import open_source
|
|
14
|
-
|
|
15
|
-
# pyre-ignore[21]
|
|
16
|
-
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
17
|
-
from fbgemm_gpu.docs.version import __version__ # noqa: F401
|
|
18
14
|
except Exception:
|
|
19
15
|
open_source: bool = False
|
|
@@ -15,10 +15,6 @@ try:
|
|
|
15
15
|
# pyre-ignore[21]
|
|
16
16
|
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
17
17
|
from fbgemm_gpu import open_source
|
|
18
|
-
|
|
19
|
-
# pyre-ignore[21]
|
|
20
|
-
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
21
|
-
from fbgemm_gpu.docs.version import __version__ # noqa: F401
|
|
22
18
|
except Exception:
|
|
23
19
|
open_source: bool = False
|
|
24
20
|
|
|
@@ -10,10 +10,6 @@ try:
|
|
|
10
10
|
# pyre-ignore[21]
|
|
11
11
|
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
12
12
|
from fbgemm_gpu import open_source
|
|
13
|
-
|
|
14
|
-
# pyre-ignore[21]
|
|
15
|
-
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
16
|
-
from fbgemm_gpu.docs.version import __version__ # noqa: F401
|
|
17
13
|
except Exception:
|
|
18
14
|
open_source: bool = False
|
|
19
15
|
|
fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/cutlass_blackwell_fmha_interface.py
CHANGED
|
@@ -12,10 +12,6 @@ try:
|
|
|
12
12
|
# pyre-ignore[21]
|
|
13
13
|
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
14
14
|
from fbgemm_gpu import open_source
|
|
15
|
-
|
|
16
|
-
# pyre-ignore[21]
|
|
17
|
-
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
18
|
-
from fbgemm_gpu.docs.version import __version__ # noqa: F401
|
|
19
15
|
except Exception:
|
|
20
16
|
open_source: bool = False
|
|
21
17
|
|
|
@@ -9,9 +9,5 @@ try:
|
|
|
9
9
|
# pyre-ignore[21]
|
|
10
10
|
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
11
11
|
from fbgemm_gpu import open_source
|
|
12
|
-
|
|
13
|
-
# pyre-ignore[21]
|
|
14
|
-
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
15
|
-
from fbgemm_gpu.docs.version import __version__ # noqa: F401
|
|
16
12
|
except Exception:
|
|
17
13
|
open_source: bool = False
|
|
Binary file
|
|
@@ -14,10 +14,6 @@ try:
|
|
|
14
14
|
# pyre-ignore[21]
|
|
15
15
|
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
16
16
|
from fbgemm_gpu import open_source
|
|
17
|
-
|
|
18
|
-
# pyre-ignore[21]
|
|
19
|
-
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
20
|
-
from fbgemm_gpu.docs.version import __version__ # noqa: F401
|
|
21
17
|
except Exception:
|
|
22
18
|
open_source: bool = False
|
|
23
19
|
|
|
@@ -38,10 +38,6 @@ try:
|
|
|
38
38
|
# pyre-ignore[21]
|
|
39
39
|
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
40
40
|
from fbgemm_gpu import open_source
|
|
41
|
-
|
|
42
|
-
# pyre-ignore[21]
|
|
43
|
-
# @manual=//deeplearning/fbgemm/fbgemm_gpu:test_utils
|
|
44
|
-
from fbgemm_gpu.docs.version import __version__ # noqa: F401
|
|
45
41
|
except Exception:
|
|
46
42
|
open_source: bool = False
|
|
47
43
|
|
fbgemm_gpu/fbgemm.so
CHANGED
|
Binary file
|
|
@@ -1,8 +1,8 @@
|
|
|
1
|
-
fbgemm_gpu/__init__.py,sha256=
|
|
2
|
-
fbgemm_gpu/asmjit.so,sha256=
|
|
1
|
+
fbgemm_gpu/__init__.py,sha256=A3DuseilQ-sEtBpeZsG0LOqN5Cl3e5DHI_YgCZEMhnE,6283
|
|
2
|
+
fbgemm_gpu/asmjit.so,sha256=yDq47YobRro7Tvd4IaPNyQUf1YaA8iLyfcwnUdh0Coo,484232
|
|
3
3
|
fbgemm_gpu/batched_unary_embeddings_ops.py,sha256=GYeJ9pg-Wc9FokXVci_npDsL6UV18-pJXID2xzrJ9O8,2904
|
|
4
4
|
fbgemm_gpu/enums.py,sha256=37ewGSfO1x7sO31ZkRiqV1yKuklfHXT5qZIxzeeGogo,755
|
|
5
|
-
fbgemm_gpu/fbgemm.so,sha256=
|
|
5
|
+
fbgemm_gpu/fbgemm.so,sha256=DEQ1gRPSFaPAUbupt2byc0F7ZpHYo1yagdZ1Se9Gq1A,5807256
|
|
6
6
|
fbgemm_gpu/metrics.py,sha256=TsurFLJf0nJvPDN7urWb4LMQlf5RgdWPTTTDO7S4wtI,5663
|
|
7
7
|
fbgemm_gpu/permute_pooled_embedding_modules.py,sha256=vOXMYclaGnwSt0St_SOAlAe18kz6WjMyTeHnC9jLhcE,5130
|
|
8
8
|
fbgemm_gpu/permute_pooled_embedding_modules_split.py,sha256=f3VJvH_kw9Ltd_DXtaf_PJPHmlmEWrQgzQ7MDkhh5Nw,2746
|
|
@@ -32,32 +32,32 @@ fbgemm_gpu/docs/merge_pooled_embedding_ops.py,sha256=oJLgSgZQmhsyGLbTmZTxNgQrk65
|
|
|
32
32
|
fbgemm_gpu/docs/permute_pooled_embedding_ops.py,sha256=tZUqLVXlk5O6VAKKDA-OEMx2fCu5QPOOeoAPZA9_nLY,4454
|
|
33
33
|
fbgemm_gpu/docs/quantize_ops.py,sha256=xTtOaVK1P02ymreE_i21YiyYDZCqhoZY9eWp_mEIRlo,1297
|
|
34
34
|
fbgemm_gpu/docs/sparse_ops.py,sha256=gSLUFdnu8lle_6gLewFkM20wL3ek2jKLvDGMKR6POaY,27292
|
|
35
|
-
fbgemm_gpu/docs/
|
|
36
|
-
fbgemm_gpu/experimental/example/__init__.py,sha256=
|
|
37
|
-
fbgemm_gpu/experimental/example/fbgemm_gpu_experimental_example_py.so,sha256=
|
|
35
|
+
fbgemm_gpu/docs/target.genai.json.py,sha256=jBVwc34fgeucSL4uqGU56uPmHHnBmsphsLo8ySSCSpg,79
|
|
36
|
+
fbgemm_gpu/experimental/example/__init__.py,sha256=OvJHZgWnycL1gWKyCXFJCTKuys3KAqx4iadjx3R-tBQ,723
|
|
37
|
+
fbgemm_gpu/experimental/example/fbgemm_gpu_experimental_example_py.so,sha256=K70etfWeSleFOhfxXvSmpZMYBn_xmpvSxgdcGenvaKo,232488
|
|
38
38
|
fbgemm_gpu/experimental/example/utils.py,sha256=Je__VkMlBMLOhh7NXOocOdvaa2gz9kl9Dkqeu25tpFA,562
|
|
39
|
-
fbgemm_gpu/experimental/gemm/triton_gemm/__init__.py,sha256=
|
|
39
|
+
fbgemm_gpu/experimental/gemm/triton_gemm/__init__.py,sha256=1CqUfzlYyXTvU-BNaUq4RZpLV-2lKAVCAHeJzSIZFWw,419
|
|
40
40
|
fbgemm_gpu/experimental/gemm/triton_gemm/fp4_quantize.py,sha256=2RjIDSzUXtoFoC2ryp-C-j5H83mbSjPwvsvTrThfrqE,215658
|
|
41
41
|
fbgemm_gpu/experimental/gemm/triton_gemm/fp8_gemm.py,sha256=5m4SdgUsf2rM_Vul8czgRn_5oVnyi-52TmeidXh05hg,152754
|
|
42
42
|
fbgemm_gpu/experimental/gemm/triton_gemm/grouped_gemm.py,sha256=rbjxTMefjQWgJrWK_bYFtBklJigFwv4awPeVexkkiIA,44511
|
|
43
43
|
fbgemm_gpu/experimental/gemm/triton_gemm/matmul_perf_model.py,sha256=SltbY_dsit5e7B8lDIB_VYPrEq0t9kckthj9mQaVNfA,7571
|
|
44
44
|
fbgemm_gpu/experimental/gemm/triton_gemm/utils.py,sha256=rULXIpVaaRS3GKUZ1RHcWUrUyy0xMVREwS1SFShGgcw,4302
|
|
45
|
-
fbgemm_gpu/experimental/gen_ai/__init__.py,sha256=
|
|
46
|
-
fbgemm_gpu/experimental/gen_ai/fbgemm_gpu_experimental_gen_ai.so,sha256=
|
|
45
|
+
fbgemm_gpu/experimental/gen_ai/__init__.py,sha256=r3NlNCXuIh0pfKwKU5v14y6AZkpoIkKWbtzxSprgeKA,1713
|
|
46
|
+
fbgemm_gpu/experimental/gen_ai/fbgemm_gpu_experimental_gen_ai.so,sha256=2OKYdtL12c1XYD4VilDdV26ecLAIvcSILrodAeL0DHs,72651032
|
|
47
47
|
fbgemm_gpu/experimental/gen_ai/quantize.py,sha256=KAljWSdN-1_c5DWfT-3MDxWLMULK49Yu36t6TmQI9Tw,12599
|
|
48
|
-
fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/__init__.py,sha256=
|
|
48
|
+
fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/__init__.py,sha256=ntFgFs0foi6NQx8eqs5I3fCjzKSI0spXfEWiMhlcT00,897
|
|
49
49
|
fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/cutlass_blackwell_fmha_custom_op.py,sha256=FADVTYzS2u8fA-3iChS5CbtWd0mWF8F3lnXcwr_7vDw,7821
|
|
50
|
-
fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/cutlass_blackwell_fmha_interface.py,sha256=
|
|
51
|
-
fbgemm_gpu/experimental/gen_ai/bench/__init__.py,sha256=
|
|
50
|
+
fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/cutlass_blackwell_fmha_interface.py,sha256=7ydkrZ6qqyiah1dlJX6EuEXXw6WwOqCj7D48PWNJcUw,9259
|
|
51
|
+
fbgemm_gpu/experimental/gen_ai/bench/__init__.py,sha256=XpAK_eyqDSKeFC5J9KpnKtbZG07mrDh9d2j1LFKzr-8,404
|
|
52
52
|
fbgemm_gpu/experimental/gen_ai/bench/comm_bench.py,sha256=ApEyJOf_rdIo8V_EgvhZXBGNov8ITC_dnB95v8szulI,8515
|
|
53
53
|
fbgemm_gpu/experimental/gen_ai/bench/gather_scatter_bench.py,sha256=K9Nib6D7xJbw1QwEVuCJrVyI1qs988moo3cieVKYuFY,12057
|
|
54
54
|
fbgemm_gpu/experimental/gen_ai/bench/quantize_bench.py,sha256=BWl6t-4acbuRSEX2aVNDlFrSWZkqMWK2sI3VONaMd3Q,24047
|
|
55
55
|
fbgemm_gpu/experimental/gen_ai/bench/quantize_ops.py,sha256=H6AchejyZs76_snM_ae5vV0cPr_Q0h35OQ8qED0r1N4,104915
|
|
56
56
|
fbgemm_gpu/experimental/gen_ai/moe/README.md,sha256=z9ybHmv4KFJ1drj5OByuFaOY0tRQwwiIW3Q22TB_2-k,904
|
|
57
|
-
fbgemm_gpu/experimental/gen_ai/moe/__init__.py,sha256=
|
|
57
|
+
fbgemm_gpu/experimental/gen_ai/moe/__init__.py,sha256=lwSvff07yEav024B1XyfgW8r8hwNe--aEDywcO7rnbM,1905
|
|
58
58
|
fbgemm_gpu/experimental/gen_ai/moe/activation.py,sha256=NiXhWyCNagI3P9N3N89iSX7xKuShdkq9DxEUAzoV6y0,7892
|
|
59
59
|
fbgemm_gpu/experimental/gen_ai/moe/gather_scatter.py,sha256=8inrE4dkpfO9NFkrmXyXOCM262LMcTA3SQldxPoosT8,21044
|
|
60
|
-
fbgemm_gpu/experimental/gen_ai/moe/layers.py,sha256=
|
|
60
|
+
fbgemm_gpu/experimental/gen_ai/moe/layers.py,sha256=QLwoKjyYUHT5vXAvp_maRSxyruwGXaNURgtW8ataVyg,42693
|
|
61
61
|
fbgemm_gpu/experimental/gen_ai/moe/shuffling.py,sha256=VDGEUdLZyj6mblJkAIReLICxU5BGnvmUjgZDP0VVqt8,11077
|
|
62
62
|
fbgemm_gpu/quantize/__init__.py,sha256=pftciXHE7csekDFkl7Ui1AWglVMMnSrOO04mREnUdb0,921
|
|
63
63
|
fbgemm_gpu/quantize/quantize_ops.py,sha256=25AIOv9n2UoxamMUaI6EK1Ur4gSHxbZIReHBtgOjjCs,2228
|
|
@@ -121,7 +121,7 @@ fbgemm_gpu/utils/loader.py,sha256=1hCEhNvkflniH46fGcrguLeP1z-6uyOu2QFwqKU5CIM,99
|
|
|
121
121
|
fbgemm_gpu/utils/torch_library.py,sha256=ywsAHjbuwesj50LjEu99WkAH17FlaVgePZ9OmFg6YE4,4193
|
|
122
122
|
list_versions/__init__.py,sha256=UmTeqCk-UJWFtlZQWvZao3xvui2w9E3X_JdOXVjRaNw,315
|
|
123
123
|
list_versions/cli_run.py,sha256=CChZoXQ-tiKaWboXAYlPVJ5w8K5zAKiKcncA087I1sc,4508
|
|
124
|
-
fbgemm_gpu_genai_nightly-2025.10.
|
|
125
|
-
fbgemm_gpu_genai_nightly-2025.10.
|
|
126
|
-
fbgemm_gpu_genai_nightly-2025.10.
|
|
127
|
-
fbgemm_gpu_genai_nightly-2025.10.
|
|
124
|
+
fbgemm_gpu_genai_nightly-2025.10.14.dist-info/METADATA,sha256=iQTkrrgOlE6pdT-BY9IF5gFlmxWRVnwu9FJQb46IA-I,2656
|
|
125
|
+
fbgemm_gpu_genai_nightly-2025.10.14.dist-info/WHEEL,sha256=vUT1hK8fT5m5CAs5kDyQ_ABrvCmtd0TCp5-4vN9tR5A,108
|
|
126
|
+
fbgemm_gpu_genai_nightly-2025.10.14.dist-info/top_level.txt,sha256=_2s1Aa08r_eDn0JP4FjOhzK09Q8bVlEI7q8pMep51UY,25
|
|
127
|
+
fbgemm_gpu_genai_nightly-2025.10.14.dist-info/RECORD,,
|
fbgemm_gpu/docs/version.py
DELETED
|
@@ -1,11 +0,0 @@
|
|
|
1
|
-
|
|
2
|
-
#!/usr/bin/env python3
|
|
3
|
-
# Copyright (c) Meta Platforms, Inc. and affiliates.
|
|
4
|
-
# All rights reserved.
|
|
5
|
-
#
|
|
6
|
-
# This source code is licensed under the BSD-style license found in the
|
|
7
|
-
# LICENSE file in the root directory of this source tree.
|
|
8
|
-
|
|
9
|
-
__version__: str = "2025.10.13"
|
|
10
|
-
__target__: str = "genai"
|
|
11
|
-
__variant__: str = "cuda"
|
|
File without changes
|
|
File without changes
|