PyPI - blksprs - Versions diffs - 2.0rc1__tar.gz → 2.0rc2__tar.gz - Mend

blksprs 2.0rc1__tar.gz → 2.0rc2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27)

{blksprs-2.0rc1 → blksprs-2.0rc2}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: blksprs
-Version: 2.0rc1
+Version: 2.0rc2
 Summary: A lightweight library for operations on blocksparse matrices in PyTorch.
 Author-email: Felix Schön <schoen@kr.tuwien.ac.at>
 Project-URL: Homepage, https://github.com/FelixSchoen/blksprs

{blksprs-2.0rc1 → blksprs-2.0rc2}/blksprs/ops/matmul.py RENAMED Viewed

@@ -205,6 +205,9 @@ def matmul_kernel(x,
             # Perform matrix multiplication
             buf += tl.dot(blk_x, blk_y)
+    # Cast buffer
+    buf = buf.to(o.dtype.element_ty)
     # Store output
     blk_o_idx = ((pid_blk * o_b_s) +
                  ((pid_row * val_tbs + tl.arange(0, TRITON_BLOCK_SIZE)) * o_r_s)[:, None] +

{blksprs-2.0rc1 → blksprs-2.0rc2}/blksprs/utils/validation.py RENAMED Viewed

@@ -27,8 +27,8 @@ def validate_dtype_float(*tensors: Tensor) -> None:
         return
     for tensor in tensors:
-        if tensor.dtype != torch.float32:
-            raise ValueError("Tensor must have float32 dtype")
+        if tensor.dtype != torch.float16 and tensor.dtype != torch.float32:
+            raise ValueError("Tensor must have either float16 or float32 dtype")
 def validate_dtype_int(*tensors: Tensor) -> None:
@@ -38,7 +38,7 @@ def validate_dtype_int(*tensors: Tensor) -> None:
     for tensor in tensors:
         if (tensor.dtype !=
                 torch.int32 and tensor.dtype != torch.int64):
-            raise ValueError("Tensor must have int32 or int64 dtype")
+            raise ValueError("Tensor must have either int32 or int64 dtype")
 def validate_device(*tensors: Tensor) -> None:
@@ -51,7 +51,7 @@ def validate_device(*tensors: Tensor) -> None:
         if i == 0:
             device = tensor.device
-            if not device.type == 'cuda':
+            if not device.type == "cuda":
                 raise ValueError("Tensors must be on GPU")
         if tensor.device != device:

{blksprs-2.0rc1 → blksprs-2.0rc2}/blksprs.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: blksprs
-Version: 2.0rc1
+Version: 2.0rc2
 Summary: A lightweight library for operations on blocksparse matrices in PyTorch.
 Author-email: Felix Schön <schoen@kr.tuwien.ac.at>
 Project-URL: Homepage, https://github.com/FelixSchoen/blksprs

{blksprs-2.0rc1 → blksprs-2.0rc2}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name = "blksprs"
-version = "2.0-rc.1"
+version = "2.0-rc.2"
 authors = [{ name = "Felix Schön", email = "schoen@kr.tuwien.ac.at" }]
 description = "A lightweight library for operations on blocksparse matrices in PyTorch."
 readme = "README.md"