fbgemm-gpu-genai-nightly 2025.10.26__cp313-cp313-manylinux_2_28_x86_64.whl → 2025.10.28__cp313-cp313-manylinux_2_28_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of fbgemm-gpu-genai-nightly might be problematic. Click here for more details.

fbgemm_gpu/asmjit.so CHANGED
Binary file
fbgemm_gpu/docs/target.genai.json.py CHANGED
@@ -1,6 +1,6 @@
1
1
 
2
2
  {
3
- "version": "2025.10.26",
3
+ "version": "2025.10.28",
4
4
  "target": "genai",
5
5
  "variant": "cuda"
6
6
  }
fbgemm_gpu/fbgemm.so CHANGED
Binary file
fbgemm_gpu/tbe/ssd/training.py CHANGED
@@ -1984,12 +1984,13 @@ class SSDTableBatchedEmbeddingBags(nn.Module):
1984
1984
  # Store info for evicting the previous iteration's
1985
1985
  # scratch pad after the corresponding backward pass is
1986
1986
  # done
1987
- self.ssd_location_update_data.append(
1988
- (
1989
- sp_curr_prev_map_gpu,
1990
- inserted_rows,
1987
+ if self.training:
1988
+ self.ssd_location_update_data.append(
1989
+ (
1990
+ sp_curr_prev_map_gpu,
1991
+ inserted_rows,
1992
+ )
1991
1993
  )
1992
- )
1993
1994
 
1994
1995
  # Ensure the previous iterations eviction is complete
1995
1996
  current_stream.wait_event(self.ssd_event_sp_evict)
@@ -2173,7 +2174,7 @@ class SSDTableBatchedEmbeddingBags(nn.Module):
2173
2174
 
2174
2175
  # Store scratch pad info for post backward eviction only for training
2175
2176
  # for eval job, no backward pass, so no need to store this info
2176
- if self.training and not self._embedding_cache_mode:
2177
+ if self.training:
2177
2178
  self.ssd_scratch_pad_eviction_data.append(
2178
2179
  (
2179
2180
  inserted_rows,
@@ -4548,6 +4549,12 @@ class SSDTableBatchedEmbeddingBags(nn.Module):
4548
4549
  if len(self.ssd_scratch_pad_eviction_data) > 0:
4549
4550
  self.ssd_scratch_pad_eviction_data.pop(0)
4550
4551
  if len(self.ssd_scratch_pad_eviction_data) > 0:
4552
+ # Wait for any pending backend reads to the next scratch pad
4553
+ # to complete before we write to it. Otherwise, stale backend data
4554
+ # will overwrite our direct_write updates.
4555
+ # The ssd_event_get marks completion of backend fetch operations.
4556
+ current_stream.wait_event(self.ssd_event_get)
4557
+
4551
4558
  # if scratch pad exists, write to next batch scratch pad
4552
4559
  sp = self.ssd_scratch_pad_eviction_data[0][0]
4553
4560
  sp_idx = self.ssd_scratch_pad_eviction_data[0][1].to(
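{fbgemm_gpu_genai_nightly-2025.10.26 → fbgemm_gpu_genai_nightly-2025.10.28}.dist-info/METADATA CHANGED
@@ -1,6 +1,6 @@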
1
1
  Metadata-Version: 2.4
2
2
  Name: fbgemm_gpu_genai_nightly
3
- Version: 2025.10.26
3
+ Version: 2025.10.28
4
4
  Home-page: https://github.com/pytorch/fbgemm
5
5
  Author: FBGEMM Team
6
6
  Author-email: packages@pytorch.org
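{fbgemm_gpu_genai_nightly-2025.10.26 → fbgemm_gpu_genai_nightly-2025.10.28}.dist-info/RECORD CHANGED
@@ -1,8 +1,8 @@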
1
1
  fbgemm_gpu/__init__.py,sha256=A3DuseilQ-sEtBpeZsG0LOqN5Cl3e5DHI_YgCZEMhnE,6283
2
- fbgemm_gpu/asmjit.so,sha256=PFeEgzpuz45ai1N1fj0C87yHOw9OZFoW6N9VZHyxxHI,484232
2
+ fbgemm_gpu/asmjit.so,sha256=UxnhHlu9LgmoRXa8fZwSX56b5QKffBxfAOs0AZLxRfk,501728
3
3
  fbgemm_gpu/batched_unary_embeddings_ops.py,sha256=GYeJ9pg-Wc9FokXVci_npDsL6UV18-pJXID2xzrJ9O8,2904
4
4
  fbgemm_gpu/enums.py,sha256=37ewGSfO1x7sO31ZkRiqV1yKuklfHXT5qZIxzeeGogo,755
5
- fbgemm_gpu/fbgemm.so,sha256=DEQ1gRPSFaPAUbupt2byc0F7ZpHYo1yagdZ1Se9Gq1A,5807256
5
+ fbgemm_gpu/fbgemm.so,sha256=B9y6MDLC6Ou7Bw_pT07Xfw5g5Q4j2yn9Xsp96QVpgEU,5646712
6
6
  fbgemm_gpu/metrics.py,sha256=TsurFLJf0nJvPDN7urWb4LMQlf5RgdWPTTTDO7S4wtI,5663
7
7
  fbgemm_gpu/permute_pooled_embedding_modules.py,sha256=vOXMYclaGnwSt0St_SOAlAe18kz6WjMyTeHnC9jLhcE,5130
8
8
  fbgemm_gpu/permute_pooled_embedding_modules_split.py,sha256=f3VJvH_kw9Ltd_DXtaf_PJPHmlmEWrQgzQ7MDkhh5Nw,2746
@@ -32,9 +32,9 @@ fbgemm_gpu/docs/merge_pooled_embedding_ops.py,sha256=oJLgSgZQmhsyGLbTmZTxNgQrk65
32
32
  fbgemm_gpu/docs/permute_pooled_embedding_ops.py,sha256=tZUqLVXlk5O6VAKKDA-OEMx2fCu5QPOOeoAPZA9_nLY,4454
33
33
  fbgemm_gpu/docs/quantize_ops.py,sha256=xTtOaVK1P02ymreE_i21YiyYDZCqhoZY9eWp_mEIRlo,1297
34
34
  fbgemm_gpu/docs/sparse_ops.py,sha256=gSLUFdnu8lle_6gLewFkM20wL3ek2jKLvDGMKR6POaY,27292
35
- fbgemm_gpu/docs/target.genai.json.py,sha256=ajhntGyjTTpz2gTBZ0AIGOreSmrqXYTCsLcujrtNSHk,79
35
+ fbgemm_gpu/docs/target.genai.json.py,sha256=8qUPmreVJ1_8egLGQELc4MkLwuD8aXPlYC2OfOCPJ3g,79
36
36
  fbgemm_gpu/experimental/example/__init__.py,sha256=OvJHZgWnycL1gWKyCXFJCTKuys3KAqx4iadjx3R-tBQ,723
37
- fbgemm_gpu/experimental/example/fbgemm_gpu_experimental_example_py.so,sha256=Sybrpqn3720uHdnjnrC43SfSqjv05ISYUjwQjVfs4cE,232488
37
+ fbgemm_gpu/experimental/example/fbgemm_gpu_experimental_example_py.so,sha256=jDR2ZPfNbqWytICmnGGIuR7IGDNOCzkXLSDPmAroFos,243904
38
38
  fbgemm_gpu/experimental/example/utils.py,sha256=Je__VkMlBMLOhh7NXOocOdvaa2gz9kl9Dkqeu25tpFA,562
39
39
  fbgemm_gpu/experimental/gemm/triton_gemm/__init__.py,sha256=1CqUfzlYyXTvU-BNaUq4RZpLV-2lKAVCAHeJzSIZFWw,419
40
40
  fbgemm_gpu/experimental/gemm/triton_gemm/fp4_quantize.py,sha256=2RjIDSzUXtoFoC2ryp-C-j5H83mbSjPwvsvTrThfrqE,215658
@@ -43,7 +43,7 @@ fbgemm_gpu/experimental/gemm/triton_gemm/grouped_gemm.py,sha256=rbjxTMefjQWgJrWK
43
43
  fbgemm_gpu/experimental/gemm/triton_gemm/matmul_perf_model.py,sha256=SltbY_dsit5e7B8lDIB_VYPrEq0t9kckthj9mQaVNfA,7571
44
44
  fbgemm_gpu/experimental/gemm/triton_gemm/utils.py,sha256=rULXIpVaaRS3GKUZ1RHcWUrUyy0xMVREwS1SFShGgcw,4302
45
45
  fbgemm_gpu/experimental/gen_ai/__init__.py,sha256=r3NlNCXuIh0pfKwKU5v14y6AZkpoIkKWbtzxSprgeKA,1713
46
- fbgemm_gpu/experimental/gen_ai/fbgemm_gpu_experimental_gen_ai.so,sha256=TXSnyk3ygjW9aR2AbPvquwn67_gp7HD0XTOX5VM6910,74306608
46
+ fbgemm_gpu/experimental/gen_ai/fbgemm_gpu_experimental_gen_ai.so,sha256=klO-9Aat9MhLF1IBnFhDrK1MBrSYeT_3q01srPCe-iI,74888976
47
47
  fbgemm_gpu/experimental/gen_ai/quantize.py,sha256=KAljWSdN-1_c5DWfT-3MDxWLMULK49Yu36t6TmQI9Tw,12599
48
48
  fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/__init__.py,sha256=ntFgFs0foi6NQx8eqs5I3fCjzKSI0spXfEWiMhlcT00,897
49
49
  fbgemm_gpu/experimental/gen_ai/attention/cutlass_blackwell_fmha/cutlass_blackwell_fmha_custom_op.py,sha256=FADVTYzS2u8fA-3iChS5CbtWd0mWF8F3lnXcwr_7vDw,7821
@@ -99,7 +99,7 @@ fbgemm_gpu/tbe/cache/split_embeddings_cache_ops.py,sha256=vZHj7KIe1DoJDy5eft29Xt
99
99
  fbgemm_gpu/tbe/ssd/__init__.py,sha256=wzfMT10cp_dqK2lrebC449hOdexBnizcf_98lA1NyHs,483
100
100
  fbgemm_gpu/tbe/ssd/common.py,sha256=1J8K7sTQswgCYWaVwF-ZdCJj7mNN6O9GI70AaZWzJGE,1044
101
101
  fbgemm_gpu/tbe/ssd/inference.py,sha256=B_uX66ajGA9YKGlFa5TmGWs7b-b1RFigzwxmENZ9Oio,22816
102
- fbgemm_gpu/tbe/ssd/training.py,sha256=X-u33ZUpxsVUXdQ8UgVtorywAAse5YLrH-ElAG6RnJs,199517
102
+ fbgemm_gpu/tbe/ssd/training.py,sha256=t_8AfKlajVNFAnn3hPST2e82P0dPxzXAsioxMBJ8jrY,199948
103
103
  fbgemm_gpu/tbe/ssd/utils/__init__.py,sha256=5DgmR2HA6NtmYh2ddkUgpDsZ6a7hF0DPedA1gMpdh18,250
104
104
  fbgemm_gpu/tbe/ssd/utils/partially_materialized_tensor.py,sha256=SFg2-29b-i49LWm-FlaWUkTz2XzXbicYi_AzVj4jKNE,7601
105
105
  fbgemm_gpu/tbe/stats/__init__.py,sha256=on29iDtq7cVNh90JR9aeFNG-K9DDoYq0JryzoplL49I,322
@@ -121,7 +121,7 @@ fbgemm_gpu/utils/loader.py,sha256=1hCEhNvkflniH46fGcrguLeP1z-6uyOu2QFwqKU5CIM,99
121
121
  fbgemm_gpu/utils/torch_library.py,sha256=ywsAHjbuwesj50LjEu99WkAH17FlaVgePZ9OmFg6YE4,4193
122
122
  list_versions/__init__.py,sha256=UmTeqCk-UJWFtlZQWvZao3xvui2w9E3X_JdOXVjRaNw,315
123
123
  list_versions/cli_run.py,sha256=CChZoXQ-tiKaWboXAYlPVJ5w8K5zAKiKcncA087I1sc,4508
124
- fbgemm_gpu_genai_nightly-2025.10.26.dist-info/METADATA,sha256=26cyhltFwGI-kyhkYZONi8FZb30P1Y99MRu-nh9dD8g,2656
125
- fbgemm_gpu_genai_nightly-2025.10.26.dist-info/WHEEL,sha256=Nkv8TSWVt7XcnRf1cdq5HOzycTl6Pjzlmn7gPSv4NiQ,108
126
- fbgemm_gpu_genai_nightly-2025.10.26.dist-info/top_level.txt,sha256=_2s1Aa08r_eDn0JP4FjOhzK09Q8bVlEI7q8pMep51UY,25
127
- fbgemm_gpu_genai_nightly-2025.10.26.dist-info/RECORD,,
124
+ fbgemm_gpu_genai_nightly-2025.10.28.dist-info/METADATA,sha256=06TbYlUoKnFZX6E1ZpX2rcQaq4tSOj0kJxNOSQ2yO8M,2656
125
+ fbgemm_gpu_genai_nightly-2025.10.28.dist-info/WHEEL,sha256=Nkv8TSWVt7XcnRf1cdq5HOzycTl6Pjzlmn7gPSv4NiQ,108
126
+ fbgemm_gpu_genai_nightly-2025.10.28.dist-info/top_level.txt,sha256=_2s1Aa08r_eDn0JP4FjOhzK09Q8bVlEI7q8pMep51UY,25
127
+ fbgemm_gpu_genai_nightly-2025.10.28.dist-info/RECORD,,