fbgemm-gpu-genai-nightly 2025.10.26__cp313-cp313-manylinux_2_28_x86_64.whl → 2025.10.28__cp313-cp313-manylinux_2_28_x86_64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of fbgemm-gpu-genai-nightly might be problematic. Click here for more details.
- fbgemm_gpu/asmjit.so +0 -0
- fbgemm_gpu/docs/target.genai.json.py +1 -1
- fbgemm_gpu/experimental/example/fbgemm_gpu_experimental_example_py.so +0 -0
- fbgemm_gpu/experimental/gen_ai/fbgemm_gpu_experimental_gen_ai.so +0 -0
- fbgemm_gpu/fbgemm.so +0 -0
- fbgemm_gpu/tbe/ssd/training.py +13 -6
- {fbgemm_gpu_genai_nightly-2025.10.26.dist-info → fbgemm_gpu_genai_nightly-2025.10.28.dist-info}/METADATA +1 -1
- {fbgemm_gpu_genai_nightly-2025.10.26.dist-info → fbgemm_gpu_genai_nightly-2025.10.28.dist-info}/RECORD +10 -10
- {fbgemm_gpu_genai_nightly-2025.10.26.dist-info → fbgemm_gpu_genai_nightly-2025.10.28.dist-info}/WHEEL +0 -0
- {fbgemm_gpu_genai_nightly-2025.10.26.dist-info → fbgemm_gpu_genai_nightly-2025.10.28.dist-info}/top_level.txt +0 -0
fbgemm_gpu/asmjit.so
CHANGED
|
Binary file
|
|
Binary file
|
|
Binary file
|
fbgemm_gpu/fbgemm.so
CHANGED
|
Binary file
|
fbgemm_gpu/tbe/ssd/training.py
CHANGED
|
@@ -1984,12 +1984,13 @@ class SSDTableBatchedEmbeddingBags(nn.Module):
|
|
|
1984
1984
|
# Store info for evicting the previous iteration's
|
|
1985
1985
|
# scratch pad after the corresponding backward pass is
|
|
1986
1986
|
# done
|
|
1987
|
-
self.
|
|
1988
|
-
(
|
|
1989
|
-
|
|
1990
|
-
|
|
1987
|
+
if self.training:
|
|
1988
|
+
self.ssd_location_update_data.append(
|
|
1989
|
+
(
|
|
1990
|
+
sp_curr_prev_map_gpu,
|
|
1991
|
+
inserted_rows,
|
|
1992
|
+
)
|
|
1991
1993
|
)
|
|
1992
|
-
)
|
|
1993
1994
|
|
|
1994
1995
|
# Ensure the previous iteration's eviction is complete
|
|
1995
1996
|
current_stream.wait_event(self.ssd_event_sp_evict)
|
|
@@ -2173,7 +2174,7 @@ class SSDTableBatchedEmbeddingBags(nn.Module):
|
|
|
2173
2174
|
|
|
2174
2175
|
# Store scratch pad info for post backward eviction only for training
|
|
2175
2176
|
# for eval job, no backward pass, so no need to store this info
|
|
2176
|
-
if self.training
|
|
2177
|
+
if self.training:
|
|
2177
2178
|
self.ssd_scratch_pad_eviction_data.append(
|
|
2178
2179
|
(
|
|
2179
2180
|
inserted_rows,
|
|
@@ -4548,6 +4549,12 @@ class SSDTableBatchedEmbeddingBags(nn.Module):
|
|
|
4548
4549
|
if len(self.ssd_scratch_pad_eviction_data) > 0:
|
|
4549
4550
|
self.ssd_scratch_pad_eviction_data.pop(0)
|
|
4550
4551
|
if len(self.ssd_scratch_pad_eviction_data) > 0:
|
|
4552
|
+
# Wait for any pending backend reads to the next scratch pad
|
|
4553
|
+
# to complete before we write to it. Otherwise, stale backend data
|
|
4554
|
+
# will overwrite our direct_write updates.
|
|
4555
|
+
# The ssd_event_get marks completion of backend fetch operations.
|
|
4556
|
+
current_stream.wait_event(self.ssd_event_get)
|
|
4557
|
+
|
|
4551
4558
|
# if scratch pad exists, write to next batch scratch pad
|
|
4552
4559
|
sp = self.ssd_scratch_pad_eviction_data[0][0]
|
|
4553
4560
|
sp_idx = self.ssd_scratch_pad_eviction_data[0][1].to(
|
|
@@ -1,8 +1,8 @@
|
|
|
1
1
|
fbgemm_gpu/__init__.py,sha256=A3DuseilQ-sEtBpeZsG0LOqN5Cl3e5DHI_YgCZEMhnE,6283
|
|
2
|
-
fbgemm_gpu/asmjit.so,sha256=
|
|
2
|
+
fbgemm_gpu/asmjit.so,sha256=UxnhHlu9LgmoRXa8fZwSX56b5QKffBxfAOs0AZLxRfk,501728
|
|
3
3
|
fbgemm_gpu/batched_unary_embeddings_ops.py,sha256=GYeJ9pg-Wc9FokXVci_npDsL6UV18-pJXID2xzrJ9O8,2904
|
|
4
4
|
fbgemm_gpu/enums.py,sha256=37ewGSfO1x7sO31ZkRiqV1yKuklfHXT5qZIxzeeGogo,755
|
|
5
|
-
fbgemm_gpu/fbgemm.so,sha256=
|
|
5
|
+
fbgemm_gpu/fbgemm.so,sha256=B9y6MDLC6Ou7Bw_pT07Xfw5g5Q4j2yn9Xsp96QVpgEU,5646712
|
|
6
6
|
fbgemm_gpu/metrics.py,sha256=TsurFLJf0nJvPDN7urWb4LMQlf5RgdWPTTTDO7S4wtI,5663
|
|
7
7
|
fbgemm_gpu/permute_pooled_embedding_modules.py,sha256=vOXMYclaGnwSt0St_SOAlAe18kz6WjMyTeHnC9jLhcE,5130
|
|
8
8
|
fbgemm_gpu/permute_pooled_embedding_modules_split.py,sha256=f3VJvH_kw9Ltd_DXtaf_PJPHmlmEWrQgzQ7MDkhh5Nw,2746
|
|
@@ -32,9 +32,9 @@ fbgemm_gpu/docs/merge_pooled_embedding_ops.py,sha256=oJLgSgZQmhsyGLbTmZTxNgQrk65
|
|
|
32
32
|
fbgemm_gpu/docs/permute_pooled_embedding_ops.py,sha256=tZUqLVXlk5O6VAKKDA-OEMx2fCu5QPOOeoAPZA9_nLY,4454
|
|
33
33
|
fbgemm_gpu/docs/quantize_ops.py,sha256=xTtOaVK1P02ymreE_i21YiyYDZCqhoZY9eWp_mEIRlo,1297
|
|
34
34
|
fbgemm_gpu/docs/sparse_ops.py,sha256=gSLUFdnu8lle_6gLewFkM20wL3ek2jKLvDGMKR6POaY,27292
|
|
35
|
-
fbgemm_gpu/docs/target.genai.json.py,sha256=
|
|
35
|
+
fbgemm_gpu/docs/target.genai.json.py,sha256=8qUPmreVJ1_8egLGQELc4MkLwuD8aXPlYC2OfOCPJ3g,79
|
|
36
36
|
fbgemm_gpu/experimental/example/__init__.py,sha256=OvJHZgWnycL1gWKyCXFJCTKuys3KAqx4iadjx3R-tBQ,723
|
|
37
|
-
fbgemm_gpu/experimental/example/fbgemm_gpu_experimental_example_py.so,sha256=
|
|
37
|
+
fbgemm_gpu/experimental/example/fbgemm_gpu_experimental_example_py.so,sha256=jDR2ZPfNbqWytICmnGGIuR7IGDNOCzkXLSDPmAroFos,243904
|
|
38
38
|
fbgemm_gpu/experimental/example/utils.py,sha256=Je__VkMlBMLOhh7NXOocOdvaa2gz9kl9Dkqeu25tpFA,562
|
|
39
39
|
fbgemm_gpu/experimental/gemm/triton_gemm/__init__.py,sha256=1CqUfzlYyXTvU-BNaUq4RZpLV-2lKAVCAHeJzSIZFWw,419
|
|
40
40
|
fbgemm_gpu/experimental/gemm/triton_gemm/fp4_quantize.py,sha256=2RjIDSzUXtoFoC2ryp-C-j5H83mbSjPwvsvTrThfrqE,215658
|
|
@@ -43,7 +43,7 @@ fbgemm_gpu/experimental/gemm/triton_gemm/grouped_gemm.py,sha256=rbjxTMefjQWgJrWK
|
|
|
43
43
|
fbgemm_gpu/experimental/gemm/triton_gemm/matmul_perf_model.py,sha256=SltbY_dsit5e7B8lDIB_VYPrEq0t9kckthj9mQaVNfA,7571
|
|
44
44
|
fbgemm_gpu/experimental/gemm/triton_gemm/utils.py,sha256=rULXIpVaaRS3GKUZ1RHcWUrUyy0xMVREwS1SFShGgcw,4302
|
|
45
45
|
fbgemm_gpu/experimental/gen_ai/__init__.py,sha256=r3NlNCXuIh0pfKwKU5v14y6AZkpoIkKWbtzxSprgeKA,1713
|
|
46
|
-
fbgemm_gpu/experimental/gen_ai/fbgemm_gpu_experimental_gen_ai.so,sha256=
|
|
46
|
+
fbgemm_gpu/experimental/gen_ai/fbgemm_gpu_experimental_gen_ai.so,sha256=klO-9Aat9MhLF1IBnFhDrK1MBrSYeT_3q01srPCe-iI,74888976
|
|
47
47
|
fbgemm_gpu/experimental/gen_ai/quantize.py,sha256=KAljWSdN-1_c5DWfT-3MDxWLMULK49Yu36t6TmQI9Tw,12599
|
|
48
48
|
fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/__init__.py,sha256=ntFgFs0foi6NQx8eqs5I3fCjzKSI0spXfEWiMhlcT00,897
|
|
49
49
|
fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/cutlass_blackwell_fmha_custom_op.py,sha256=FADVTYzS2u8fA-3iChS5CbtWd0mWF8F3lnXcwr_7vDw,7821
|
|
@@ -99,7 +99,7 @@ fbgemm_gpu/tbe/cache/split_embeddings_cache_ops.py,sha256=vZHj7KIe1DoJDy5eft29Xt
|
|
|
99
99
|
fbgemm_gpu/tbe/ssd/__init__.py,sha256=wzfMT10cp_dqK2lrebC449hOdexBnizcf_98lA1NyHs,483
|
|
100
100
|
fbgemm_gpu/tbe/ssd/common.py,sha256=1J8K7sTQswgCYWaVwF-ZdCJj7mNN6O9GI70AaZWzJGE,1044
|
|
101
101
|
fbgemm_gpu/tbe/ssd/inference.py,sha256=B_uX66ajGA9YKGlFa5TmGWs7b-b1RFigzwxmENZ9Oio,22816
|
|
102
|
-
fbgemm_gpu/tbe/ssd/training.py,sha256=
|
|
102
|
+
fbgemm_gpu/tbe/ssd/training.py,sha256=t_8AfKlajVNFAnn3hPST2e82P0dPxzXAsioxMBJ8jrY,199948
|
|
103
103
|
fbgemm_gpu/tbe/ssd/utils/__init__.py,sha256=5DgmR2HA6NtmYh2ddkUgpDsZ6a7hF0DPedA1gMpdh18,250
|
|
104
104
|
fbgemm_gpu/tbe/ssd/utils/partially_materialized_tensor.py,sha256=SFg2-29b-i49LWm-FlaWUkTz2XzXbicYi_AzVj4jKNE,7601
|
|
105
105
|
fbgemm_gpu/tbe/stats/__init__.py,sha256=on29iDtq7cVNh90JR9aeFNG-K9DDoYq0JryzoplL49I,322
|
|
@@ -121,7 +121,7 @@ fbgemm_gpu/utils/loader.py,sha256=1hCEhNvkflniH46fGcrguLeP1z-6uyOu2QFwqKU5CIM,99
|
|
|
121
121
|
fbgemm_gpu/utils/torch_library.py,sha256=ywsAHjbuwesj50LjEu99WkAH17FlaVgePZ9OmFg6YE4,4193
|
|
122
122
|
list_versions/__init__.py,sha256=UmTeqCk-UJWFtlZQWvZao3xvui2w9E3X_JdOXVjRaNw,315
|
|
123
123
|
list_versions/cli_run.py,sha256=CChZoXQ-tiKaWboXAYlPVJ5w8K5zAKiKcncA087I1sc,4508
|
|
124
|
-
fbgemm_gpu_genai_nightly-2025.10.
|
|
125
|
-
fbgemm_gpu_genai_nightly-2025.10.
|
|
126
|
-
fbgemm_gpu_genai_nightly-2025.10.
|
|
127
|
-
fbgemm_gpu_genai_nightly-2025.10.
|
|
124
|
+
fbgemm_gpu_genai_nightly-2025.10.28.dist-info/METADATA,sha256=06TbYlUoKnFZX6E1ZpX2rcQaq4tSOj0kJxNOSQ2yO8M,2656
|
|
125
|
+
fbgemm_gpu_genai_nightly-2025.10.28.dist-info/WHEEL,sha256=Nkv8TSWVt7XcnRf1cdq5HOzycTl6Pjzlmn7gPSv4NiQ,108
|
|
126
|
+
fbgemm_gpu_genai_nightly-2025.10.28.dist-info/top_level.txt,sha256=_2s1Aa08r_eDn0JP4FjOhzK09Q8bVlEI7q8pMep51UY,25
|
|
127
|
+
fbgemm_gpu_genai_nightly-2025.10.28.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|