tilelang-rocm 0.1.4.post10__cp310-cp310-manylinux1_x86_64.whl → 0.1.4.post11__cp310-cp310-manylinux1_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
tilelang/VERSION CHANGED
@@ -1 +1 @@
1
- 0.1.4.post10
1
+ 0.1.4.post11
Binary file
Binary file
tilelang/lib/libtvm.so CHANGED
Binary file
Binary file
@@ -16,3 +16,33 @@ struct __align__(16) fp8_e4_16_t {
16
16
  fp8_e4_8_t x;
17
17
  fp8_e4_8_t y;
18
18
  };
19
+
20
+ __device__ fp8_e4_4_t make_fp8_e4_4_t(fp8_e4_t x, fp8_e4_t y, fp8_e4_t z,
21
+ fp8_e4_t w) {
22
+ // reinterpret the 4 fp8_e4_t values to signed char value and shift
23
+ signed char x_char = *reinterpret_cast<signed char *>(&x);
24
+ signed char y_char = *reinterpret_cast<signed char *>(&y);
25
+ signed char z_char = *reinterpret_cast<signed char *>(&z);
26
+ signed char w_char = *reinterpret_cast<signed char *>(&w);
27
+ int res = (w_char << 24) | (z_char << 16) | (y_char << 8) | x_char;
28
+ return *reinterpret_cast<fp8_e4_4_t *>(&res);
29
+ }
30
+
31
+ __device__ fp8_e4_8_t make_fp8_e4_8_t(fp8_e4_t x, fp8_e4_t y, fp8_e4_t z,
32
+ fp8_e4_t w, fp8_e4_t v, fp8_e4_t u,
33
+ fp8_e4_t t, fp8_e4_t s) {
34
+ signed char x_char = *reinterpret_cast<signed char *>(&x);
35
+ signed char y_char = *reinterpret_cast<signed char *>(&y);
36
+ signed char z_char = *reinterpret_cast<signed char *>(&z);
37
+ signed char w_char = *reinterpret_cast<signed char *>(&w);
38
+ signed char v_char = *reinterpret_cast<signed char *>(&v);
39
+ signed char u_char = *reinterpret_cast<signed char *>(&u);
40
+ signed char t_char = *reinterpret_cast<signed char *>(&t);
41
+ signed char s_char = *reinterpret_cast<signed char *>(&s);
42
+ int a = (w_char << 24) | (z_char << 16) | (y_char << 8) | x_char;
43
+ int b = (s_char << 24) | (t_char << 16) | (u_char << 8) | v_char;
44
+ fp8_e4_8_t res;
45
+ res.x = *reinterpret_cast<fp8_e4_4_t *>(&a);
46
+ res.y = *reinterpret_cast<fp8_e4_4_t *>(&b);
47
+ return res;
48
+ }
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: tilelang-rocm
3
- Version: 0.1.4.post10
3
+ Version: 0.1.4.post11
4
4
  Summary: A tile level programming language to generate high performance code.
5
5
  Home-page: https://github.com/tile-ai/tilelang
6
6
  Author: Microsoft Research
@@ -1,7 +1,7 @@
1
1
  tilelang/CMakeLists.txt,sha256=xJhnusYZI4UhD_fzseGH3Tn2BeovUzz3aWUwPq-WU0Y,7010
2
2
  tilelang/LICENSE,sha256=v9fVeAgRKQXc5ySwTns767gj0-dHN9XYPpGURkAVAXs,1127
3
3
  tilelang/README.md,sha256=1RC_2IUBY-p0BR-d2xkNXC8zrva8-U3AVkmCozkssbY,11924
4
- tilelang/VERSION,sha256=Il_uPi-DubG_kcKlTV5qP75Dq4zOcrugFwCAygQ4SQU,13
4
+ tilelang/VERSION,sha256=ArXa5-BJWz0tYmntP_b1UkmqBWmkVJ5sMUiAaXMSrkA,13
5
5
  tilelang/__init__.py,sha256=yH0BknCRnFQN-E7d6p1HPNbeY4o3COqG7XzR_EJpbTo,3215
6
6
  tilelang/_ffi_api.py,sha256=D-HfDxx8EZq6qItftg-ejOhpC_smIZLN-pWPVCNX_UM,243
7
7
  tilelang/config.cmake,sha256=370i6N3wwi7-LPGZDBtiiu54UWp39ndD-9lCurLhHwI,14330
@@ -6383,10 +6383,10 @@ tilelang/layout/__init__.py,sha256=F1wr9yBG9GW84h8KWXz-hRJFfqyZuY0EKSrG08KyrWQ,2
6383
6383
  tilelang/layout/fragment.py,sha256=zTv9P96lsYi9BWc5pxR4PA2Z5RSDGP7D5uJCiNw7_oc,8445
6384
6384
  tilelang/layout/layout.py,sha256=20CWxz_S8k_WNvWiR4gdIrEsQ36e5bsnOEqmu4zGk_c,4311
6385
6385
  tilelang/layout/swizzle.py,sha256=PMqu_s1sNCh9uo8eDs5qmLKXnDqZwv34GT3H9D4YDO0,438
6386
- tilelang/lib/libtilelang.so,sha256=gWKpADoERYHrDu-eOXjYtG8ak-dvv_2cs8WDiFYnc8o,5040880
6387
- tilelang/lib/libtilelang_module.so,sha256=eStBjzb0e9y3lZVc21EefE1_nryt0Cs0wlYyz32QifI,5040880
6388
- tilelang/lib/libtvm.so,sha256=7qy1XeUSGm4YXJC22LUmLZMfaGEPdTCXVxq3pkqS_ZY,83982112
6389
- tilelang/lib/libtvm_runtime.so,sha256=BgUg1x-f2q3urmCbmBrbUtVFmS3SUyI6dBSAVP_yi8k,4794680
6386
+ tilelang/lib/libtilelang.so,sha256=XNX_4wZkR2yki7Jc2Q6hxRhhfcf32LoCnuOBX4TLnTU,5040720
6387
+ tilelang/lib/libtilelang_module.so,sha256=5urBFc9szW49ORCkvCDgfWavEAQKs9a6wQbuEQ2Bl1s,5040720
6388
+ tilelang/lib/libtvm.so,sha256=PK8xrRlNpJ8Pox1pxcVGSpdrfB5T89NaujkfDyvus0o,83982112
6389
+ tilelang/lib/libtvm_runtime.so,sha256=JMGIbjqmERUW2RN7KKUxx4DsPnf1RjZIKWXb7Trnrw0,4794680
6390
6390
  tilelang/math/__init__.py,sha256=JC4fqrU_LV_wDErti-wHNr4j6_mqP1PsK0qqkhaSzRU,209
6391
6391
  tilelang/primitives/__init__.py,sha256=10gQN3QWUFM1nkGXY46QFcWUXxwsKMsVn23JdyFHil4,167
6392
6392
  tilelang/primitives/gemm/__init__.py,sha256=j62ObmbL5Q6m3lSouNBQDk1hZZRnSp4UNNCCaSlKYXU,1658
@@ -6420,7 +6420,7 @@ tilelang/src/tl_templates/hip/common.h,sha256=KzMntW2OlABMwYjlxNqKiBDZQXQNrYApeV
6420
6420
  tilelang/src/tl_templates/hip/copy.h,sha256=fGHkbe4ReXoEtIWrgQ-mlCycaIL65SvNGWK1OJZdUQo,3324
6421
6421
  tilelang/src/tl_templates/hip/debug.h,sha256=9xGr4ka5x_nvY55XwbgTJFFwEnd09ta9jAZwjHyQau0,8231
6422
6422
  tilelang/src/tl_templates/hip/gemm.h,sha256=lYeOjV8OG2oZbcS7ByzOudE7i0FQJ71mrUcImkfhTrg,11610
6423
- tilelang/src/tl_templates/hip/hip_fp8.h,sha256=JYGiuuroLQH7CXT7IdKcpNUECmGOTe8DjIjcS9eLc0U,377
6423
+ tilelang/src/tl_templates/hip/hip_fp8.h,sha256=eFYV5OyHI2X5xMNOjv1NLqR2shlKkhiGQWiVEiY6LPs,1903
6424
6424
  tilelang/src/tl_templates/hip/ldsm.h,sha256=gRx_bSdsCsgcVumwUJwOnv4HuHruU2kC9TE9x_jo8k0,106
6425
6425
  tilelang/src/tl_templates/hip/reduce.h,sha256=-VKpG-TNbzPHIqsSReYpqZoM-oXFzIx6fMeBieV26Kc,1372
6426
6426
  tilelang/src/tl_templates/hip/threadblock_swizzle.h,sha256=HPuOUl2Ts76ckY5kVkLlfaK2WyHY0pEXskbXnnefFcA,2055
@@ -6437,8 +6437,8 @@ tilelang/utils/deprecated.py,sha256=CiZ9y_76_dZ24SFDdasDiLmibwi6xO2Gdj6WzTWU0Qg,
6437
6437
  tilelang/utils/language.py,sha256=KUzUZ8Z2x1np0Hu_MrjWOIcRrVAZHX90li1Xw9fYZXY,3291
6438
6438
  tilelang/utils/target.py,sha256=P-74pdCLWcp2MZMQUoPIFwKF1NZ1QT-L0VroIL8m2to,2486
6439
6439
  tilelang/utils/tensor.py,sha256=SZ4ewoJ-Mq3zg8zIHS7-XLUmYDdlNwh841yUkjnQtNU,12573
6440
- tilelang_rocm-0.1.4.post10.dist-info/licenses/LICENSE,sha256=v9fVeAgRKQXc5ySwTns767gj0-dHN9XYPpGURkAVAXs,1127
6441
- tilelang_rocm-0.1.4.post10.dist-info/METADATA,sha256=aBSwulXbZ0_bU2cIYKNCuRsUM2qlAsJ6O14B7fPJUoQ,13076
6442
- tilelang_rocm-0.1.4.post10.dist-info/WHEEL,sha256=0-G7woG4LgutcYzUGJCOYFgoh749-FtfhSMeIPLVGS0,104
6443
- tilelang_rocm-0.1.4.post10.dist-info/top_level.txt,sha256=qvMq-AYkDVggI-9VIAzCe5CXHl66IEWj7J29-JbuFsI,21
6444
- tilelang_rocm-0.1.4.post10.dist-info/RECORD,,
6440
+ tilelang_rocm-0.1.4.post11.dist-info/licenses/LICENSE,sha256=v9fVeAgRKQXc5ySwTns767gj0-dHN9XYPpGURkAVAXs,1127
6441
+ tilelang_rocm-0.1.4.post11.dist-info/METADATA,sha256=mj9fK8dUTSpEU776wVQ23WWkbeuwuFtMp1UNaCvilZ8,13076
6442
+ tilelang_rocm-0.1.4.post11.dist-info/WHEEL,sha256=0-G7woG4LgutcYzUGJCOYFgoh749-FtfhSMeIPLVGS0,104
6443
+ tilelang_rocm-0.1.4.post11.dist-info/top_level.txt,sha256=qvMq-AYkDVggI-9VIAzCe5CXHl66IEWj7J29-JbuFsI,21
6444
+ tilelang_rocm-0.1.4.post11.dist-info/RECORD,,