triton-windows 3.4.0.post20__cp313-cp313-win_amd64.whl → 3.4.0.post21__cp313-cp313-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of triton-windows might be problematic. Click here for more details.

triton/_C/libtriton.pyd CHANGED
Binary file
triton/backends/nvidia/compiler.py CHANGED
@@ -121,7 +121,7 @@ class CUDAOptions:
121
121
  enable_fp_fusion: bool = True
122
122
  launch_cooperative_grid: bool = False
123
123
  launch_pdl: bool = False
124
- supported_fp8_dtypes: Tuple[str] = ("fp8e5", "fp8e4b15")
124
+ supported_fp8_dtypes: Tuple[str] = ("fp8e4nv", "fp8e5", "fp8e4b15")
125
125
  deprecated_fp8_dot_operand_dtypes: Tuple[str] = ()
126
126
  default_dot_input_precision: str = "tf32"
127
127
  allowed_dot_input_precisions: Tuple[str] = ("tf32", "tf32x3", "ieee")
@@ -177,8 +177,6 @@ class CUDABackend(BaseBackend):
177
177
 
178
178
  if "supported_fp8_dtypes" not in args:
179
179
  supported_fp8_dtypes = set(CUDAOptions.supported_fp8_dtypes)
180
- if capability >= 89:
181
- supported_fp8_dtypes.add("fp8e4nv")
182
180
  args["supported_fp8_dtypes"] = tuple(sorted(supported_fp8_dtypes))
183
181
 
184
182
  if "deprecated_fp8_dot_operand_dtypes" not in args:
@@ -433,7 +431,8 @@ class CUDABackend(BaseBackend):
433
431
  try:
434
432
  # close_fds=True on Windows and False on Linux, see https://github.com/triton-lang/triton/pull/4357
435
433
  # On Windows, both stdout and stderr need to be redirected to flog
436
- subprocess.run(ptxas_cmd, check=True, close_fds=True if os.name == 'nt' else False, stdout=flog, stderr=flog)
434
+ subprocess.run(ptxas_cmd, check=True, close_fds=True if os.name == 'nt' else False, stdout=flog,
435
+ stderr=flog)
437
436
  except subprocess.CalledProcessError as e:
438
437
  with open(flog.name) as log_file:
439
438
  log = log_file.read()
triton/runtime/build.py CHANGED
@@ -116,7 +116,7 @@ def _build(name: str, src: str, srcdir: str, library_dirs: list[str], include_di
116
116
  cc_cmd = _cc_cmd(cc, src, so, include_dirs, library_dirs, libraries)
117
117
 
118
118
  try:
119
- ret = subprocess.check_call(cc_cmd)
119
+ subprocess.check_call(cc_cmd)
120
120
  except Exception as e:
121
121
  print("Failed to compile. cc_cmd:", cc_cmd)
122
122
  raise e
triton/windows_utils.py CHANGED
@@ -54,14 +54,11 @@ def max_version(
54
54
 
55
55
 
56
56
  def check_msvc(msvc_base_path: Path, version: str) -> bool:
57
- return all(
58
- x.exists()
59
- for x in [
60
- msvc_base_path / version / "bin" / "Hostx64" / "x64" / "cl.exe",
61
- msvc_base_path / version / "include" / "vcruntime.h",
62
- msvc_base_path / version / "lib" / "x64" / "vcruntime.lib",
63
- ]
64
- )
57
+ return all(x.exists() for x in [
58
+ msvc_base_path / version / "bin" / "Hostx64" / "x64" / "cl.exe",
59
+ msvc_base_path / version / "include" / "vcruntime.h",
60
+ msvc_base_path / version / "lib" / "x64" / "vcruntime.lib",
61
+ ])
65
62
 
66
63
 
67
64
  def find_msvc_env() -> tuple[Optional[Path], Optional[str]]:
@@ -72,20 +69,16 @@ def find_msvc_env() -> tuple[Optional[Path], Optional[str]]:
72
69
 
73
70
  version = os.getenv("VCToolsVersion")
74
71
  if not check_msvc(msvc_base_path, version):
75
- warnings.warn(
76
- f"Environment variables VCINSTALLDIR = {os.getenv('VCINSTALLDIR')}, "
77
- f"VCToolsVersion = {os.getenv('VCToolsVersion')} are set, "
78
- "but this MSVC installation is incomplete."
79
- )
72
+ warnings.warn(f"Environment variables VCINSTALLDIR = {os.getenv('VCINSTALLDIR')}, "
73
+ f"VCToolsVersion = {os.getenv('VCToolsVersion')} are set, "
74
+ "but this MSVC installation is incomplete.")
80
75
  return None, None
81
76
 
82
77
  return msvc_base_path, version
83
78
 
84
79
 
85
80
  def find_msvc_vswhere() -> tuple[Optional[Path], Optional[str]]:
86
- vswhere_path = find_in_program_files(
87
- r"Microsoft Visual Studio\Installer\vswhere.exe"
88
- )
81
+ vswhere_path = find_in_program_files(r"Microsoft Visual Studio\Installer\vswhere.exe")
89
82
  if vswhere_path is None:
90
83
  return None, None
91
84
 
@@ -111,9 +104,7 @@ def find_msvc_vswhere() -> tuple[Optional[Path], Optional[str]]:
111
104
  if not msvc_base_path.exists():
112
105
  return None, None
113
106
 
114
- version = max_version(
115
- os.listdir(msvc_base_path), check=partial(check_msvc, msvc_base_path)
116
- )
107
+ version = max_version(os.listdir(msvc_base_path), check=partial(check_msvc, msvc_base_path))
117
108
  if version is None:
118
109
  return None, None
119
110
 
@@ -132,9 +123,7 @@ def find_msvc_envpath() -> tuple[Optional[Path], Optional[str]]:
132
123
  if not msvc_base_path.exists():
133
124
  continue
134
125
 
135
- version = max_version(
136
- os.listdir(msvc_base_path), check=partial(check_msvc, msvc_base_path)
137
- )
126
+ version = max_version(os.listdir(msvc_base_path), check=partial(check_msvc, msvc_base_path))
138
127
  if version is None:
139
128
  continue
140
129
 
@@ -153,9 +142,7 @@ def find_msvc_hardcoded() -> tuple[Optional[Path], Optional[str]]:
153
142
  paths = sorted(paths)[::-1]
154
143
  for msvc_base_path in paths:
155
144
  msvc_base_path = Path(msvc_base_path)
156
- version = max_version(
157
- os.listdir(msvc_base_path), check=partial(check_msvc, msvc_base_path)
158
- )
145
+ version = max_version(os.listdir(msvc_base_path), check=partial(check_msvc, msvc_base_path))
159
146
  if version is None:
160
147
  continue
161
148
  return msvc_base_path, version
@@ -188,13 +175,10 @@ def find_msvc(env_only: bool) -> tuple[Optional[str], list[str], list[str]]:
188
175
 
189
176
 
190
177
  def check_winsdk(winsdk_base_path: Path, version: str) -> bool:
191
- return all(
192
- x.exists()
193
- for x in [
194
- winsdk_base_path / "Include" / version / "ucrt" / "stdlib.h",
195
- winsdk_base_path / "Lib" / version / "ucrt" / "x64" / "ucrt.lib",
196
- ]
197
- )
178
+ return all(x.exists() for x in [
179
+ winsdk_base_path / "Include" / version / "ucrt" / "stdlib.h",
180
+ winsdk_base_path / "Lib" / version / "ucrt" / "x64" / "ucrt.lib",
181
+ ])
198
182
 
199
183
 
200
184
  def find_winsdk_env() -> tuple[Optional[Path], Optional[str]]:
@@ -205,18 +189,16 @@ def find_winsdk_env() -> tuple[Optional[Path], Optional[str]]:
205
189
 
206
190
  version = os.getenv("WindowsSDKVersion")
207
191
  if version is None:
208
- warnings.warn(
209
- f"Environment variable WindowsSdkDir = {os.getenv('WindowsSdkDir')}, "
210
- "but WindowsSDKVersion is not set."
211
- )
192
+ version = os.getenv("WindowsSDKVer")
193
+ if version is None:
194
+ warnings.warn(f"Environment variable WindowsSdkDir = {winsdk_base_path}, "
195
+ "but WindowsSDKVersion (or WindowsSDKVer) is not set.")
212
196
  return None, None
213
197
  version = version.rstrip("\\")
214
198
  if not check_winsdk(winsdk_base_path, version):
215
- warnings.warn(
216
- f"Environment variables WindowsSdkDir = {os.getenv('WindowsSdkDir')}, "
217
- f"WindowsSDKVersion = {os.getenv('WindowsSDKVersion')} are set, "
218
- "but this Windows SDK installation is incomplete."
219
- )
199
+ warnings.warn(f"Environment variables WindowsSdkDir = {winsdk_base_path}, "
200
+ f"WindowsSDKVersion (or WindowsSDKVer) = {version} are set, "
201
+ "but this Windows SDK installation is incomplete.")
220
202
  return None, None
221
203
 
222
204
  return winsdk_base_path, version
@@ -225,9 +207,7 @@ def find_winsdk_env() -> tuple[Optional[Path], Optional[str]]:
225
207
  def find_winsdk_registry() -> tuple[Optional[Path], Optional[str]]:
226
208
  try:
227
209
  reg = winreg.ConnectRegistry(None, winreg.HKEY_LOCAL_MACHINE)
228
- key = winreg.OpenKeyEx(
229
- reg, r"SOFTWARE\WOW6432Node\Microsoft\Microsoft SDKs\Windows\v10.0"
230
- )
210
+ key = winreg.OpenKeyEx(reg, r"SOFTWARE\WOW6432Node\Microsoft\Microsoft SDKs\Windows\v10.0")
231
211
  folder = winreg.QueryValueEx(key, "InstallationFolder")[0]
232
212
  winreg.CloseKey(key)
233
213
  except OSError:
@@ -294,9 +274,7 @@ def find_winsdk(env_only: bool) -> tuple[list[str], list[str]]:
294
274
 
295
275
 
296
276
  @functools.lru_cache
297
- def find_msvc_winsdk(
298
- env_only: bool = False,
299
- ) -> tuple[Optional[str], list[str], list[str]]:
277
+ def find_msvc_winsdk(env_only: bool = False, ) -> tuple[Optional[str], list[str], list[str]]:
300
278
  msvc_bin_path, msvc_inc_dirs, msvc_lib_dirs = find_msvc(env_only)
301
279
  winsdk_inc_dirs, winsdk_lib_dirs = find_winsdk(env_only)
302
280
  return (
@@ -312,9 +290,9 @@ def find_python() -> list[str]:
312
290
  if sysconfig.get_config_var("Py_GIL_DISABLED"):
313
291
  version += "t"
314
292
  for python_base_path in [
315
- sys.exec_prefix,
316
- sys.base_exec_prefix,
317
- os.path.dirname(sys.executable),
293
+ sys.exec_prefix,
294
+ sys.base_exec_prefix,
295
+ os.path.dirname(sys.executable),
318
296
  ]:
319
297
  python_lib_dir = Path(python_base_path) / "libs"
320
298
  if (python_lib_dir / f"python{version}.lib").exists():
@@ -326,14 +304,11 @@ def find_python() -> list[str]:
326
304
 
327
305
  def check_and_find_cuda(base_path: Path) -> tuple[Optional[str], list[str], list[str]]:
328
306
  # pip
329
- if all(
330
- x.exists()
331
- for x in [
307
+ if all(x.exists() for x in [
332
308
  base_path / "cuda_nvcc" / "bin" / "ptxas.exe",
333
309
  base_path / "cuda_runtime" / "include" / "cuda.h",
334
310
  base_path / "cuda_runtime" / "lib" / "x64" / "cuda.lib",
335
- ]
336
- ):
311
+ ]):
337
312
  return (
338
313
  str(base_path / "cuda_nvcc" / "bin"),
339
314
  [str(base_path / "cuda_runtime" / "include")],
@@ -341,14 +316,11 @@ def check_and_find_cuda(base_path: Path) -> tuple[Optional[str], list[str], list
341
316
  )
342
317
 
343
318
  # conda
344
- if all(
345
- x.exists()
346
- for x in [
319
+ if all(x.exists() for x in [
347
320
  base_path / "bin" / "ptxas.exe",
348
321
  base_path / "include" / "cuda.h",
349
322
  base_path / "lib" / "cuda.lib",
350
- ]
351
- ):
323
+ ]):
352
324
  return (
353
325
  str(base_path / "bin"),
354
326
  [str(base_path / "include")],
@@ -356,14 +328,11 @@ def check_and_find_cuda(base_path: Path) -> tuple[Optional[str], list[str], list
356
328
  )
357
329
 
358
330
  # bundled or system-wide
359
- if all(
360
- x.exists()
361
- for x in [
331
+ if all(x.exists() for x in [
362
332
  base_path / "bin" / "ptxas.exe",
363
333
  base_path / "include" / "cuda.h",
364
334
  base_path / "lib" / "x64" / "cuda.lib",
365
- ]
366
- ):
335
+ ]):
367
336
  return (
368
337
  str(base_path / "bin"),
369
338
  [str(base_path / "include")],
@@ -380,9 +349,7 @@ def find_cuda_env() -> tuple[Optional[str], list[str], list[str]]:
380
349
  continue
381
350
 
382
351
  cuda_base_path = Path(cuda_base_path)
383
- cuda_bin_path, cuda_inc_dirs, cuda_lib_dirs = check_and_find_cuda(
384
- cuda_base_path
385
- )
352
+ cuda_bin_path, cuda_inc_dirs, cuda_lib_dirs = check_and_find_cuda(cuda_base_path)
386
353
  if cuda_bin_path:
387
354
  return cuda_bin_path, cuda_inc_dirs, cuda_lib_dirs
388
355
 
@@ -390,9 +357,7 @@ def find_cuda_env() -> tuple[Optional[str], list[str], list[str]]:
390
357
 
391
358
 
392
359
  def find_cuda_bundled() -> tuple[Optional[str], list[str], list[str]]:
393
- cuda_base_path = (
394
- Path(sysconfig.get_paths()["platlib"]) / "triton" / "backends" / "nvidia"
395
- )
360
+ cuda_base_path = (Path(sysconfig.get_paths()["platlib"]) / "triton" / "backends" / "nvidia")
396
361
  return check_and_find_cuda(cuda_base_path)
397
362
 
398
363
 
@@ -416,9 +381,7 @@ def find_cuda_hardcoded() -> tuple[Optional[str], list[str], list[str]]:
416
381
  paths = sorted(paths)[::-1]
417
382
  for cuda_base_path in paths:
418
383
  cuda_base_path = Path(cuda_base_path)
419
- cuda_bin_path, cuda_inc_dirs, cuda_lib_dirs = check_and_find_cuda(
420
- cuda_base_path
421
- )
384
+ cuda_bin_path, cuda_inc_dirs, cuda_lib_dirs = check_and_find_cuda(cuda_base_path)
422
385
  if cuda_bin_path:
423
386
  return cuda_bin_path, cuda_inc_dirs, cuda_lib_dirs
424
387
 
@@ -428,11 +391,11 @@ def find_cuda_hardcoded() -> tuple[Optional[str], list[str], list[str]]:
428
391
  @functools.lru_cache
429
392
  def find_cuda() -> tuple[Optional[str], list[str], list[str]]:
430
393
  for f in [
431
- find_cuda_env,
432
- find_cuda_bundled,
433
- find_cuda_pip,
434
- find_cuda_conda,
435
- find_cuda_hardcoded,
394
+ find_cuda_env,
395
+ find_cuda_bundled,
396
+ find_cuda_pip,
397
+ find_cuda_conda,
398
+ find_cuda_hardcoded,
436
399
  ]:
437
400
  cuda_bin_path, cuda_inc_dirs, cuda_lib_dirs = f()
438
401
  if cuda_bin_path:
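triton_windows-3.4.0.post20.dist-info/METADATA → triton_windows-3.4.0.post21.dist-info/METADATA CHANGED
@@ -1,6 +1,6 @@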
1
1
  Metadata-Version: 2.4
2
2
  Name: triton-windows
3
- Version: 3.4.0.post20
3
+ Version: 3.4.0.post21
4
4
  Summary: A language and compiler for custom Deep Learning operations
5
5
  Home-page: https://github.com/woct0rdho/triton-windows
6
6
  Author: Philippe Tillet, Dian Wu
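triton_windows-3.4.0.post20.dist-info/RECORD → triton_windows-3.4.0.post21.dist-info/RECORD CHANGED
@@ -5,8 +5,8 @@ triton/_utils.py,sha256=XTYb3qDDaVmbhmXbm6ChMTYTW9jeE538jZwJE_eliQg,3539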
5
5
  triton/errors.py,sha256=8WfnuRKLG578mgY6cBA3ECruVMf9ULEKFNgRcJ6IhWM,89
6
6
  triton/knobs.py,sha256=VOdRM_J0TejBYP2H7QZZzLwcRJq-Eppm9hBxDt1pCgA,14916
7
7
  triton/testing.py,sha256=vbEQRNrOnnzRQvVVSaiZrUo8AC0XPV40GJxfvkKYLh0,20276
8
- triton/windows_utils.py,sha256=7uwsR-yQZQzzvHajkukryRTJlOotyRA5mlNlJOFVGsE,13130
9
- triton/_C/libtriton.pyd,sha256=feY3eFQa0O4dU5046FmNzjDDJeYUoZfWp82hHDU1PCo,89961984
8
+ triton/windows_utils.py,sha256=JMi6mjOApzh2-cw3Wl_nl6ji7JkwexYI7xgo2Et3ihU,12903
9
+ triton/_C/libtriton.pyd,sha256=_TR8zPM-fGXdMumvlF2VH2hQHqeJ79qanE6SqlVgjN4,89965056
10
10
  triton/backends/__init__.py,sha256=X7290kf96Fk9QnfLScsX4UDG3zPyH_-31E4A7pVOijM,1612
11
11
  triton/backends/compiler.py,sha256=MY2_cQG26p68z8VwRv2Nlj_h2DfEhwBbN-30caMgep0,2840
12
12
  triton/backends/driver.py,sha256=AN60upJlPgia0JwvZ8vIVgLITNPuI0fdz8zMIIHPpF4,1450
@@ -18,7 +18,7 @@ triton/backends/amd/lib/asanrtl.bc,sha256=1xv2RlU3WvbdsghHlmhwiHewGM2B5dKts5bERM
18
18
  triton/backends/amd/lib/ockl.bc,sha256=wQKCzkKukIHbu0lyjKUYlhndc7S27xto6L54J0Bn-C0,246124
19
19
  triton/backends/amd/lib/ocml.bc,sha256=UPNTXW0gCXUNB-c6orSYwb-mz9_mjUc7zny_vfFza44,205964
20
20
  triton/backends/nvidia/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
21
- triton/backends/nvidia/compiler.py,sha256=9ebNiX61uhApSojj5zf51HCh750FjXk2nzYlVQDJudk,19495
21
+ triton/backends/nvidia/compiler.py,sha256=7Yf79DdocAgYaWLR-MSTAv_QAJjVAZkhbr1-ovsnfnQ,19452
22
22
  triton/backends/nvidia/driver.c,sha256=rH8RDtMMv_UHr7qiLnrSdNg3xojOQe_fF1zW67LFjaE,17882
23
23
  triton/backends/nvidia/driver.py,sha256=22YT4HhTPI1aJ-mjw31Lvw1mcffj17pGJry3m9W6jio,26391
24
24
  triton/backends/nvidia/bin/ptxas.exe,sha256=f28E0l5aerLAfBXk7yagfOwIEE6_6_NkMx-vqPPEQ9Y,24753152
@@ -66,7 +66,7 @@ triton/language/extra/hip/libdevice.py,sha256=Rf-AmBzcO6ORVzSxSuLXOy0lpoZTsnRAuT
66
66
  triton/runtime/__init__.py,sha256=mKL5cqIBDUw2WO80NRCh4s1G8KYaqgM59TTAbTkPPjQ,621
67
67
  triton/runtime/_allocation.py,sha256=zaW4B7I7c-2rkVuN7IZaUB6IQSI1t4FvnTPZH-r7DTk,798
68
68
  triton/runtime/autotuner.py,sha256=cfWBuLpL6-eBv-J2tFIbL0gE3ZGHOFSJ0e3n0GfrzLw,20244
69
- triton/runtime/build.py,sha256=r44tiyJFWp5Xoxb2WUyw0nqxOA2rtyWN7O8krW9gZKE,6209
69
+ triton/runtime/build.py,sha256=hiFHKRV-fwDoT5lMbWpzA3hLp6LrE6ccw7zTo2AvHo0,6203
70
70
  triton/runtime/cache.py,sha256=uMV-CwCaS9cthIzKoLlTHXjhw_RoaIUaVP7zmgsdsIo,9689
71
71
  triton/runtime/driver.py,sha256=seGhU4efCFPVN0KVzd4gmZ1x5s0I_sFyM5NC8brXWF8,1798
72
72
  triton/runtime/errors.py,sha256=CwfJXciwel_-K3BfQfKUpLPDWrSyTnGsfJkqJojrdfQ,1052
@@ -178,9 +178,9 @@ triton/tools/mxfp.py,sha256=YQdpBrGkOVNOtnLeRjMCeVFHWkSwUubGeWsItIjO8TU,11737
178
178
  triton/tools/tensor_descriptor.py,sha256=mt4iVVRcNg0gjoytb6iCP4l5vt-H2V3MGeAQfJcStJo,1289
179
179
  triton/tools/extra/cuda/compile.c,sha256=TdIENsqk6wrvv1C4Mk-sq9keXe3SJuMQcf0UpxmjNZk,2153
180
180
  triton/tools/extra/cuda/compile.h,sha256=n9QKIFZTL4RSsiXtAxBP9XGSnxjyaevQQ9bBpwDsvAg,332
181
- triton_windows-3.4.0.post20.dist-info/licenses/LICENSE,sha256=kmQPuXIi_Qppj_KM4MN4LBcmI_jWxgm1V2NqgPKPuUY,1132
182
- triton_windows-3.4.0.post20.dist-info/METADATA,sha256=XVQISF1LWaRTh_mbQoa1OXk_1uhmigdfEfWJ2whPIPc,1794
183
- triton_windows-3.4.0.post20.dist-info/WHEEL,sha256=qV0EIPljj1XC_vuSatRWjn02nZIz3N1t8jsZz7HBr2U,101
184
- triton_windows-3.4.0.post20.dist-info/entry_points.txt,sha256=cztF9ZYXxoMhibI_OttiKCl1EBP2LQaV8naJ-BcuES4,76
185
- triton_windows-3.4.0.post20.dist-info/top_level.txt,sha256=WBiIZyv6n9Y7MIh-HPHSv2w1RDk7EFL__7ZgQRrmHYs,7
186
- triton_windows-3.4.0.post20.dist-info/RECORD,,
181
+ triton_windows-3.4.0.post21.dist-info/licenses/LICENSE,sha256=kmQPuXIi_Qppj_KM4MN4LBcmI_jWxgm1V2NqgPKPuUY,1132
182
+ triton_windows-3.4.0.post21.dist-info/METADATA,sha256=IHOZbw7LyV2c8dx0dvpgjzw8LmdA99209iNKB1UC01o,1794
183
+ triton_windows-3.4.0.post21.dist-info/WHEEL,sha256=qV0EIPljj1XC_vuSatRWjn02nZIz3N1t8jsZz7HBr2U,101
184
+ triton_windows-3.4.0.post21.dist-info/entry_points.txt,sha256=cztF9ZYXxoMhibI_OttiKCl1EBP2LQaV8naJ-BcuES4,76
185
+ triton_windows-3.4.0.post21.dist-info/top_level.txt,sha256=WBiIZyv6n9Y7MIh-HPHSv2w1RDk7EFL__7ZgQRrmHYs,7
186
+ triton_windows-3.4.0.post21.dist-info/RECORD,,