ejkernel 0.0.76__tar.gz → 0.0.78__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (2527):
  1. {ejkernel-0.0.76 → ejkernel-0.0.78}/PKG-INFO +1 -1
  2. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/__init__.py +1 -1
  3. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/gated_delta_rule/_pallas_impl_fwd.py +41 -2
  4. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/gated_delta_rule/_xla_impl_fwd.py +57 -19
  5. {ejkernel-0.0.76 → ejkernel-0.0.78}/pyproject.toml +1 -1
  6. {ejkernel-0.0.76 → ejkernel-0.0.78}/README.md +0 -0
  7. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/CMakeLists.txt +0 -0
  8. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_attention.h +0 -0
  9. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_attention_ffi.cu +0 -0
  10. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_attention_kernel.h +0 -0
  11. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_attention_launch_template.h +0 -0
  12. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim128_vhdim128_bf16_sm100.cu +0 -0
  13. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim128_vhdim128_bf16_sm110.cu +0 -0
  14. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim128_vhdim128_bf16_sm120.cu +0 -0
  15. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim128_vhdim128_bf16_sm80.cu +0 -0
  16. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim128_vhdim128_bf16_sm90.cu +0 -0
  17. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim128_vhdim128_fp16_sm100.cu +0 -0
  18. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim128_vhdim128_fp16_sm110.cu +0 -0
  19. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim128_vhdim128_fp16_sm120.cu +0 -0
  20. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim128_vhdim128_fp16_sm80.cu +0 -0
  21. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim128_vhdim128_fp16_sm90.cu +0 -0
  22. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim192_vhdim192_bf16_sm100.cu +0 -0
  23. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim192_vhdim192_bf16_sm110.cu +0 -0
  24. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim192_vhdim192_bf16_sm120.cu +0 -0
  25. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim192_vhdim192_bf16_sm80.cu +0 -0
  26. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim192_vhdim192_bf16_sm90.cu +0 -0
  27. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim192_vhdim192_fp16_sm100.cu +0 -0
  28. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim192_vhdim192_fp16_sm110.cu +0 -0
  29. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim192_vhdim192_fp16_sm120.cu +0 -0
  30. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim192_vhdim192_fp16_sm80.cu +0 -0
  31. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim192_vhdim192_fp16_sm90.cu +0 -0
  32. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim256_vhdim256_bf16_sm100.cu +0 -0
  33. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim256_vhdim256_bf16_sm110.cu +0 -0
  34. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim256_vhdim256_bf16_sm120.cu +0 -0
  35. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim256_vhdim256_bf16_sm80.cu +0 -0
  36. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim256_vhdim256_bf16_sm90.cu +0 -0
  37. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim256_vhdim256_fp16_sm100.cu +0 -0
  38. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim256_vhdim256_fp16_sm110.cu +0 -0
  39. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim256_vhdim256_fp16_sm120.cu +0 -0
  40. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim256_vhdim256_fp16_sm80.cu +0 -0
  41. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim256_vhdim256_fp16_sm90.cu +0 -0
  42. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim32_vhdim32_bf16_sm100.cu +0 -0
  43. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim32_vhdim32_bf16_sm110.cu +0 -0
  44. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim32_vhdim32_bf16_sm120.cu +0 -0
  45. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim32_vhdim32_bf16_sm80.cu +0 -0
  46. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim32_vhdim32_bf16_sm90.cu +0 -0
  47. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim32_vhdim32_fp16_sm100.cu +0 -0
  48. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim32_vhdim32_fp16_sm110.cu +0 -0
  49. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim32_vhdim32_fp16_sm120.cu +0 -0
  50. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim32_vhdim32_fp16_sm80.cu +0 -0
  51. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim32_vhdim32_fp16_sm90.cu +0 -0
  52. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim64_vhdim64_bf16_sm100.cu +0 -0
  53. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim64_vhdim64_bf16_sm110.cu +0 -0
  54. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim64_vhdim64_bf16_sm120.cu +0 -0
  55. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim64_vhdim64_bf16_sm80.cu +0 -0
  56. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim64_vhdim64_bf16_sm90.cu +0 -0
  57. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim64_vhdim64_fp16_sm100.cu +0 -0
  58. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim64_vhdim64_fp16_sm110.cu +0 -0
  59. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim64_vhdim64_fp16_sm120.cu +0 -0
  60. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim64_vhdim64_fp16_sm80.cu +0 -0
  61. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim64_vhdim64_fp16_sm90.cu +0 -0
  62. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim96_vhdim96_bf16_sm100.cu +0 -0
  63. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim96_vhdim96_bf16_sm110.cu +0 -0
  64. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim96_vhdim96_bf16_sm120.cu +0 -0
  65. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim96_vhdim96_bf16_sm80.cu +0 -0
  66. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim96_vhdim96_bf16_sm90.cu +0 -0
  67. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim96_vhdim96_fp16_sm100.cu +0 -0
  68. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim96_vhdim96_fp16_sm110.cu +0 -0
  69. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim96_vhdim96_fp16_sm120.cu +0 -0
  70. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim96_vhdim96_fp16_sm80.cu +0 -0
  71. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/blocksparse_fwd_hdim96_vhdim96_fp16_sm90.cu +0 -0
  72. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/blocksparse_attention/src/code_gen.py +0 -0
  73. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/code_gen.py +0 -0
  74. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/CMakeLists.txt +0 -0
  75. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/block.h +0 -0
  76. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/code_gen.py +0 -0
  77. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/copy_sm90_bulk_reduce.hpp +0 -0
  78. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/cuda_check.h +0 -0
  79. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/epilogue_bwd.hpp +0 -0
  80. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/epilogue_fwd.hpp +0 -0
  81. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash.h +0 -0
  82. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_api.cpp +0 -0
  83. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_api_stable.cpp +0 -0
  84. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_bwd_kernel_sm80.h +0 -0
  85. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_bwd_kernel_sm90.h +0 -0
  86. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_bwd_launch_template.h +0 -0
  87. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_bwd_postprocess_kernel.h +0 -0
  88. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_bwd_preprocess_kernel.h +0 -0
  89. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_fwd_combine.cu +0 -0
  90. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_fwd_combine_kernel.h +0 -0
  91. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_fwd_combine_launch_template.h +0 -0
  92. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_fwd_kernel_sm80.h +0 -0
  93. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_fwd_kernel_sm90.h +0 -0
  94. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_fwd_launch_template.h +0 -0
  95. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/flash_prepare_scheduler.cu +0 -0
  96. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/heuristics.h +0 -0
  97. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_sm100.cu +0 -0
  98. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_sm110.cu +0 -0
  99. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_sm120.cu +0 -0
  100. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_sm80.cu +0 -0
  101. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_sm90.cu +0 -0
  102. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_softcap_sm100.cu +0 -0
  103. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_softcap_sm110.cu +0 -0
  104. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_softcap_sm120.cu +0 -0
  105. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_softcap_sm80.cu +0 -0
  106. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_softcap_sm90.cu +0 -0
  107. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_bf16_softcapall_sm90.cu +0 -0
  108. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_sm100.cu +0 -0
  109. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_sm110.cu +0 -0
  110. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_sm120.cu +0 -0
  111. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_sm80.cu +0 -0
  112. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_sm90.cu +0 -0
  113. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_softcap_sm100.cu +0 -0
  114. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_softcap_sm110.cu +0 -0
  115. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_softcap_sm120.cu +0 -0
  116. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_softcap_sm80.cu +0 -0
  117. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_softcap_sm90.cu +0 -0
  118. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim128_fp16_softcapall_sm90.cu +0 -0
  119. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_sm100.cu +0 -0
  120. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_sm110.cu +0 -0
  121. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_sm120.cu +0 -0
  122. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_sm80.cu +0 -0
  123. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_sm90.cu +0 -0
  124. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_softcap_sm100.cu +0 -0
  125. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_softcap_sm110.cu +0 -0
  126. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_softcap_sm120.cu +0 -0
  127. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_softcap_sm80.cu +0 -0
  128. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_softcap_sm90.cu +0 -0
  129. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_bf16_softcapall_sm90.cu +0 -0
  130. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_sm100.cu +0 -0
  131. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_sm110.cu +0 -0
  132. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_sm120.cu +0 -0
  133. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_sm80.cu +0 -0
  134. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_sm90.cu +0 -0
  135. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_softcap_sm100.cu +0 -0
  136. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_softcap_sm110.cu +0 -0
  137. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_softcap_sm120.cu +0 -0
  138. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_softcap_sm80.cu +0 -0
  139. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_softcap_sm90.cu +0 -0
  140. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim192_fp16_softcapall_sm90.cu +0 -0
  141. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_sm100.cu +0 -0
  142. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_sm110.cu +0 -0
  143. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_sm120.cu +0 -0
  144. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_sm80.cu +0 -0
  145. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_sm90.cu +0 -0
  146. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_softcap_sm100.cu +0 -0
  147. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_softcap_sm110.cu +0 -0
  148. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_softcap_sm120.cu +0 -0
  149. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_softcap_sm80.cu +0 -0
  150. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_softcap_sm90.cu +0 -0
  151. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_bf16_softcapall_sm90.cu +0 -0
  152. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_sm100.cu +0 -0
  153. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_sm110.cu +0 -0
  154. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_sm120.cu +0 -0
  155. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_sm80.cu +0 -0
  156. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_sm90.cu +0 -0
  157. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_softcap_sm100.cu +0 -0
  158. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_softcap_sm110.cu +0 -0
  159. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_softcap_sm120.cu +0 -0
  160. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_softcap_sm80.cu +0 -0
  161. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_softcap_sm90.cu +0 -0
  162. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim256_fp16_softcapall_sm90.cu +0 -0
  163. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_sm100.cu +0 -0
  164. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_sm110.cu +0 -0
  165. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_sm120.cu +0 -0
  166. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_sm80.cu +0 -0
  167. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_sm90.cu +0 -0
  168. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_softcap_sm100.cu +0 -0
  169. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_softcap_sm110.cu +0 -0
  170. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_softcap_sm120.cu +0 -0
  171. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_softcap_sm80.cu +0 -0
  172. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_softcap_sm90.cu +0 -0
  173. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_bf16_softcapall_sm90.cu +0 -0
  174. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_sm100.cu +0 -0
  175. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_sm110.cu +0 -0
  176. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_sm120.cu +0 -0
  177. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_sm80.cu +0 -0
  178. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_sm90.cu +0 -0
  179. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_softcap_sm100.cu +0 -0
  180. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_softcap_sm110.cu +0 -0
  181. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_softcap_sm120.cu +0 -0
  182. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_softcap_sm80.cu +0 -0
  183. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_softcap_sm90.cu +0 -0
  184. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim64_fp16_softcapall_sm90.cu +0 -0
  185. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_sm100.cu +0 -0
  186. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_sm110.cu +0 -0
  187. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_sm120.cu +0 -0
  188. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_sm80.cu +0 -0
  189. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_sm90.cu +0 -0
  190. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_softcap_sm100.cu +0 -0
  191. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_softcap_sm110.cu +0 -0
  192. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_softcap_sm120.cu +0 -0
  193. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_softcap_sm80.cu +0 -0
  194. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_softcap_sm90.cu +0 -0
  195. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_bf16_softcapall_sm90.cu +0 -0
  196. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_sm100.cu +0 -0
  197. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_sm110.cu +0 -0
  198. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_sm120.cu +0 -0
  199. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_sm80.cu +0 -0
  200. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_sm90.cu +0 -0
  201. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_softcap_sm100.cu +0 -0
  202. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_softcap_sm110.cu +0 -0
  203. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_softcap_sm120.cu +0 -0
  204. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_softcap_sm80.cu +0 -0
  205. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_softcap_sm90.cu +0 -0
  206. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_bwd_hdim96_fp16_softcapall_sm90.cu +0 -0
  207. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_packgqa_sm100.cu +0 -0
  208. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_packgqa_sm110.cu +0 -0
  209. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_packgqa_sm120.cu +0 -0
  210. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_packgqa_sm80.cu +0 -0
  211. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_packgqa_sm90.cu +0 -0
  212. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_packgqa_sm100.cu +0 -0
  213. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_packgqa_sm110.cu +0 -0
  214. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_packgqa_sm120.cu +0 -0
  215. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_packgqa_sm80.cu +0 -0
  216. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_packgqa_sm90.cu +0 -0
  217. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_sm100.cu +0 -0
  218. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_sm110.cu +0 -0
  219. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_sm120.cu +0 -0
  220. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_sm80.cu +0 -0
  221. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_sm90.cu +0 -0
  222. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcap_packgqa_sm100.cu +0 -0
  223. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcap_packgqa_sm110.cu +0 -0
  224. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcap_packgqa_sm120.cu +0 -0
  225. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcap_packgqa_sm80.cu +0 -0
  226. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcap_packgqa_sm90.cu +0 -0
  227. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcap_sm100.cu +0 -0
  228. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcap_sm110.cu +0 -0
  229. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcap_sm120.cu +0 -0
  230. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcap_sm80.cu +0 -0
  231. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcap_sm90.cu +0 -0
  232. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_softcapall_sm80.cu +0 -0
  233. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_packgqa_sm100.cu +0 -0
  234. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_packgqa_sm110.cu +0 -0
  235. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_packgqa_sm120.cu +0 -0
  236. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_packgqa_sm80.cu +0 -0
  237. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_packgqa_sm90.cu +0 -0
  238. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_sm100.cu +0 -0
  239. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_sm110.cu +0 -0
  240. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_sm120.cu +0 -0
  241. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_sm80.cu +0 -0
  242. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_sm90.cu +0 -0
  243. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcap_packgqa_sm100.cu +0 -0
  244. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcap_packgqa_sm110.cu +0 -0
  245. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcap_packgqa_sm120.cu +0 -0
  246. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcap_packgqa_sm80.cu +0 -0
  247. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcap_packgqa_sm90.cu +0 -0
  248. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcap_sm100.cu +0 -0
  249. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcap_sm110.cu +0 -0
  250. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcap_sm120.cu +0 -0
  251. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcap_sm80.cu +0 -0
  252. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcap_sm90.cu +0 -0
  253. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_paged_split_softcapall_sm80.cu +0 -0
  254. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_sm100.cu +0 -0
  255. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_sm110.cu +0 -0
  256. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_sm120.cu +0 -0
  257. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_sm80.cu +0 -0
  258. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_sm90.cu +0 -0
  259. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcap_packgqa_sm100.cu +0 -0
  260. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcap_packgqa_sm110.cu +0 -0
  261. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcap_packgqa_sm120.cu +0 -0
  262. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcap_packgqa_sm80.cu +0 -0
  263. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcap_packgqa_sm90.cu +0 -0
  264. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcap_sm100.cu +0 -0
  265. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcap_sm110.cu +0 -0
  266. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcap_sm120.cu +0 -0
  267. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcap_sm80.cu +0 -0
  268. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcap_sm90.cu +0 -0
  269. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_softcapall_sm80.cu +0 -0
  270. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_packgqa_sm100.cu +0 -0
  271. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_packgqa_sm110.cu +0 -0
  272. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_packgqa_sm120.cu +0 -0
  273. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_packgqa_sm80.cu +0 -0
  274. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_packgqa_sm90.cu +0 -0
  275. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_sm100.cu +0 -0
  276. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_sm110.cu +0 -0
  277. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_sm120.cu +0 -0
  278. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_sm80.cu +0 -0
  279. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_sm90.cu +0 -0
  280. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcap_packgqa_sm100.cu +0 -0
  281. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcap_packgqa_sm110.cu +0 -0
  282. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcap_packgqa_sm120.cu +0 -0
  283. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcap_packgqa_sm80.cu +0 -0
  284. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcap_packgqa_sm90.cu +0 -0
  285. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcap_sm100.cu +0 -0
  286. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcap_sm110.cu +0 -0
  287. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcap_sm120.cu +0 -0
  288. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcap_sm80.cu +0 -0
  289. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcap_sm90.cu +0 -0
  290. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_bf16_split_softcapall_sm80.cu +0 -0
  291. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_packgqa_sm100.cu +0 -0
  292. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_packgqa_sm110.cu +0 -0
  293. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_packgqa_sm120.cu +0 -0
  294. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_packgqa_sm90.cu +0 -0
  295. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_packgqa_sm100.cu +0 -0
  296. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_packgqa_sm110.cu +0 -0
  297. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_packgqa_sm120.cu +0 -0
  298. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_packgqa_sm90.cu +0 -0
  299. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_sm100.cu +0 -0
  300. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_sm110.cu +0 -0
  301. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_sm120.cu +0 -0
  302. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_sm90.cu +0 -0
  303. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_softcap_packgqa_sm100.cu +0 -0
  304. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_softcap_packgqa_sm110.cu +0 -0
  305. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_softcap_packgqa_sm120.cu +0 -0
  306. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_softcap_packgqa_sm90.cu +0 -0
  307. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_softcap_sm100.cu +0 -0
  308. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_softcap_sm110.cu +0 -0
  309. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_softcap_sm120.cu +0 -0
  310. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_softcap_sm90.cu +0 -0
  311. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_packgqa_sm100.cu +0 -0
  312. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_packgqa_sm110.cu +0 -0
  313. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_packgqa_sm120.cu +0 -0
  314. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_packgqa_sm90.cu +0 -0
  315. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_sm100.cu +0 -0
  316. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_sm110.cu +0 -0
  317. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_sm120.cu +0 -0
  318. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_sm90.cu +0 -0
  319. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_softcap_packgqa_sm100.cu +0 -0
  320. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_softcap_packgqa_sm110.cu +0 -0
  321. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_softcap_packgqa_sm120.cu +0 -0
  322. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_softcap_packgqa_sm90.cu +0 -0
  323. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_softcap_sm100.cu +0 -0
  324. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_softcap_sm110.cu +0 -0
  325. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_softcap_sm120.cu +0 -0
  326. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_paged_split_softcap_sm90.cu +0 -0
  327. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_sm100.cu +0 -0
  328. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_sm110.cu +0 -0
  329. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_sm120.cu +0 -0
  330. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_sm90.cu +0 -0
  331. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_softcap_packgqa_sm100.cu +0 -0
  332. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_softcap_packgqa_sm110.cu +0 -0
  333. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_softcap_packgqa_sm120.cu +0 -0
  334. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_softcap_packgqa_sm90.cu +0 -0
  335. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_softcap_sm100.cu +0 -0
  336. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_softcap_sm110.cu +0 -0
  337. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_softcap_sm120.cu +0 -0
  338. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_softcap_sm90.cu +0 -0
  339. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_packgqa_sm100.cu +0 -0
  340. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_packgqa_sm110.cu +0 -0
  341. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_packgqa_sm120.cu +0 -0
  342. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_packgqa_sm90.cu +0 -0
  343. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_sm100.cu +0 -0
  344. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_sm110.cu +0 -0
  345. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_sm120.cu +0 -0
  346. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_sm90.cu +0 -0
  347. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_softcap_packgqa_sm100.cu +0 -0
  348. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_softcap_packgqa_sm110.cu +0 -0
  349. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_softcap_packgqa_sm120.cu +0 -0
  350. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_softcap_packgqa_sm90.cu +0 -0
  351. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_softcap_sm100.cu +0 -0
  352. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_softcap_sm110.cu +0 -0
  353. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_softcap_sm120.cu +0 -0
  354. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_e4m3_split_softcap_sm90.cu +0 -0
  355. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_packgqa_sm100.cu +0 -0
  356. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_packgqa_sm110.cu +0 -0
  357. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_packgqa_sm120.cu +0 -0
  358. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_packgqa_sm80.cu +0 -0
  359. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_packgqa_sm90.cu +0 -0
  360. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_packgqa_sm100.cu +0 -0
  361. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_packgqa_sm110.cu +0 -0
  362. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_packgqa_sm120.cu +0 -0
  363. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_packgqa_sm80.cu +0 -0
  364. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_packgqa_sm90.cu +0 -0
  365. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_sm100.cu +0 -0
  366. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_sm110.cu +0 -0
  367. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_sm120.cu +0 -0
  368. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_sm80.cu +0 -0
  369. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_sm90.cu +0 -0
  370. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcap_packgqa_sm100.cu +0 -0
  371. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcap_packgqa_sm110.cu +0 -0
  372. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcap_packgqa_sm120.cu +0 -0
  373. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcap_packgqa_sm80.cu +0 -0
  374. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcap_packgqa_sm90.cu +0 -0
  375. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcap_sm100.cu +0 -0
  376. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcap_sm110.cu +0 -0
  377. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcap_sm120.cu +0 -0
  378. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcap_sm80.cu +0 -0
  379. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcap_sm90.cu +0 -0
  380. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_softcapall_sm80.cu +0 -0
  381. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_packgqa_sm100.cu +0 -0
  382. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_packgqa_sm110.cu +0 -0
  383. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_packgqa_sm120.cu +0 -0
  384. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_packgqa_sm80.cu +0 -0
  385. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_packgqa_sm90.cu +0 -0
  386. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_sm100.cu +0 -0
  387. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_sm110.cu +0 -0
  388. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_sm120.cu +0 -0
  389. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_sm80.cu +0 -0
  390. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_sm90.cu +0 -0
  391. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcap_packgqa_sm100.cu +0 -0
  392. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcap_packgqa_sm110.cu +0 -0
  393. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcap_packgqa_sm120.cu +0 -0
  394. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcap_packgqa_sm80.cu +0 -0
  395. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcap_packgqa_sm90.cu +0 -0
  396. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcap_sm100.cu +0 -0
  397. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcap_sm110.cu +0 -0
  398. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcap_sm120.cu +0 -0
  399. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcap_sm80.cu +0 -0
  400. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcap_sm90.cu +0 -0
  401. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_paged_split_softcapall_sm80.cu +0 -0
  402. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_sm100.cu +0 -0
  403. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_sm110.cu +0 -0
  404. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_sm120.cu +0 -0
  405. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_sm80.cu +0 -0
  406. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_sm90.cu +0 -0
  407. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcap_packgqa_sm100.cu +0 -0
  408. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcap_packgqa_sm110.cu +0 -0
  409. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcap_packgqa_sm120.cu +0 -0
  410. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcap_packgqa_sm80.cu +0 -0
  411. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcap_packgqa_sm90.cu +0 -0
  412. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcap_sm100.cu +0 -0
  413. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcap_sm110.cu +0 -0
  414. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcap_sm120.cu +0 -0
  415. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcap_sm80.cu +0 -0
  416. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcap_sm90.cu +0 -0
  417. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_softcapall_sm80.cu +0 -0
  418. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_packgqa_sm100.cu +0 -0
  419. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_packgqa_sm110.cu +0 -0
  420. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_packgqa_sm120.cu +0 -0
  421. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_packgqa_sm80.cu +0 -0
  422. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_packgqa_sm90.cu +0 -0
  423. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_sm100.cu +0 -0
  424. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_sm110.cu +0 -0
  425. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_sm120.cu +0 -0
  426. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_sm80.cu +0 -0
  427. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_sm90.cu +0 -0
  428. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcap_packgqa_sm100.cu +0 -0
  429. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcap_packgqa_sm110.cu +0 -0
  430. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcap_packgqa_sm120.cu +0 -0
  431. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcap_packgqa_sm80.cu +0 -0
  432. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcap_packgqa_sm90.cu +0 -0
  433. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcap_sm100.cu +0 -0
  434. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcap_sm110.cu +0 -0
  435. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcap_sm120.cu +0 -0
  436. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcap_sm80.cu +0 -0
  437. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcap_sm90.cu +0 -0
  438. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim128_fp16_split_softcapall_sm80.cu +0 -0
  439. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_bf16_packgqa_sm90.cu +0 -0
  440. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_bf16_paged_sm90.cu +0 -0
  441. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_bf16_paged_softcap_sm90.cu +0 -0
  442. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_bf16_paged_split_sm90.cu +0 -0
  443. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_bf16_paged_split_softcap_sm90.cu +0 -0
  444. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_bf16_sm90.cu +0 -0
  445. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_bf16_softcap_packgqa_sm90.cu +0 -0
  446. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_bf16_softcap_sm90.cu +0 -0
  447. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_bf16_split_sm90.cu +0 -0
  448. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_bf16_split_softcap_sm90.cu +0 -0
  449. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_e4m3_packgqa_sm90.cu +0 -0
  450. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_e4m3_paged_sm90.cu +0 -0
  451. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_e4m3_paged_softcap_sm90.cu +0 -0
  452. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_e4m3_paged_split_sm90.cu +0 -0
  453. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_e4m3_paged_split_softcap_sm90.cu +0 -0
  454. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_e4m3_sm90.cu +0 -0
  455. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_e4m3_softcap_packgqa_sm90.cu +0 -0
  456. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_e4m3_softcap_sm90.cu +0 -0
  457. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_e4m3_split_sm90.cu +0 -0
  458. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_e4m3_split_softcap_sm90.cu +0 -0
  459. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_fp16_packgqa_sm90.cu +0 -0
  460. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_fp16_paged_sm90.cu +0 -0
  461. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_fp16_paged_softcap_sm90.cu +0 -0
  462. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_fp16_paged_split_sm90.cu +0 -0
  463. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_fp16_paged_split_softcap_sm90.cu +0 -0
  464. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_fp16_sm90.cu +0 -0
  465. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_fp16_softcap_packgqa_sm90.cu +0 -0
  466. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_fp16_softcap_sm90.cu +0 -0
  467. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_fp16_split_sm90.cu +0 -0
  468. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_128_fp16_split_softcap_sm90.cu +0 -0
  469. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_packgqa_sm100.cu +0 -0
  470. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_packgqa_sm110.cu +0 -0
  471. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_packgqa_sm120.cu +0 -0
  472. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_packgqa_sm80.cu +0 -0
  473. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_packgqa_sm90.cu +0 -0
  474. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_packgqa_sm100.cu +0 -0
  475. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_packgqa_sm110.cu +0 -0
  476. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_packgqa_sm120.cu +0 -0
  477. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_packgqa_sm80.cu +0 -0
  478. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_packgqa_sm90.cu +0 -0
  479. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_sm100.cu +0 -0
  480. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_sm110.cu +0 -0
  481. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_sm120.cu +0 -0
  482. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_sm80.cu +0 -0
  483. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_sm90.cu +0 -0
  484. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcap_packgqa_sm100.cu +0 -0
  485. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcap_packgqa_sm110.cu +0 -0
  486. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcap_packgqa_sm120.cu +0 -0
  487. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcap_packgqa_sm80.cu +0 -0
  488. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcap_packgqa_sm90.cu +0 -0
  489. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcap_sm100.cu +0 -0
  490. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcap_sm110.cu +0 -0
  491. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcap_sm120.cu +0 -0
  492. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcap_sm80.cu +0 -0
  493. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcap_sm90.cu +0 -0
  494. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_softcapall_sm80.cu +0 -0
  495. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_packgqa_sm100.cu +0 -0
  496. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_packgqa_sm110.cu +0 -0
  497. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_packgqa_sm120.cu +0 -0
  498. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_packgqa_sm80.cu +0 -0
  499. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_packgqa_sm90.cu +0 -0
  500. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_sm100.cu +0 -0
  501. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_sm110.cu +0 -0
  502. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_sm120.cu +0 -0
  503. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_sm80.cu +0 -0
  504. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_sm90.cu +0 -0
  505. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcap_packgqa_sm100.cu +0 -0
  506. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcap_packgqa_sm110.cu +0 -0
  507. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcap_packgqa_sm120.cu +0 -0
  508. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcap_packgqa_sm80.cu +0 -0
  509. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcap_packgqa_sm90.cu +0 -0
  510. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcap_sm100.cu +0 -0
  511. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcap_sm110.cu +0 -0
  512. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcap_sm120.cu +0 -0
  513. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcap_sm80.cu +0 -0
  514. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcap_sm90.cu +0 -0
  515. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_paged_split_softcapall_sm80.cu +0 -0
  516. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_sm100.cu +0 -0
  517. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_sm110.cu +0 -0
  518. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_sm120.cu +0 -0
  519. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_sm80.cu +0 -0
  520. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_sm90.cu +0 -0
  521. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcap_packgqa_sm100.cu +0 -0
  522. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcap_packgqa_sm110.cu +0 -0
  523. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcap_packgqa_sm120.cu +0 -0
  524. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcap_packgqa_sm80.cu +0 -0
  525. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcap_packgqa_sm90.cu +0 -0
  526. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcap_sm100.cu +0 -0
  527. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcap_sm110.cu +0 -0
  528. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcap_sm120.cu +0 -0
  529. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcap_sm80.cu +0 -0
  530. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcap_sm90.cu +0 -0
  531. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_softcapall_sm80.cu +0 -0
  532. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_packgqa_sm100.cu +0 -0
  533. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_packgqa_sm110.cu +0 -0
  534. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_packgqa_sm120.cu +0 -0
  535. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_packgqa_sm80.cu +0 -0
  536. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_packgqa_sm90.cu +0 -0
  537. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_sm100.cu +0 -0
  538. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_sm110.cu +0 -0
  539. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_sm120.cu +0 -0
  540. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_sm80.cu +0 -0
  541. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_sm90.cu +0 -0
  542. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcap_packgqa_sm100.cu +0 -0
  543. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcap_packgqa_sm110.cu +0 -0
  544. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcap_packgqa_sm120.cu +0 -0
  545. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcap_packgqa_sm80.cu +0 -0
  546. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcap_packgqa_sm90.cu +0 -0
  547. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcap_sm100.cu +0 -0
  548. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcap_sm110.cu +0 -0
  549. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcap_sm120.cu +0 -0
  550. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcap_sm80.cu +0 -0
  551. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcap_sm90.cu +0 -0
  552. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_bf16_split_softcapall_sm80.cu +0 -0
  553. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_packgqa_sm100.cu +0 -0
  554. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_packgqa_sm110.cu +0 -0
  555. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_packgqa_sm120.cu +0 -0
  556. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_packgqa_sm90.cu +0 -0
  557. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_packgqa_sm100.cu +0 -0
  558. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_packgqa_sm110.cu +0 -0
  559. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_packgqa_sm120.cu +0 -0
  560. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_packgqa_sm90.cu +0 -0
  561. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_sm100.cu +0 -0
  562. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_sm110.cu +0 -0
  563. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_sm120.cu +0 -0
  564. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_sm90.cu +0 -0
  565. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_softcap_packgqa_sm100.cu +0 -0
  566. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_softcap_packgqa_sm110.cu +0 -0
  567. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_softcap_packgqa_sm120.cu +0 -0
  568. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_softcap_packgqa_sm90.cu +0 -0
  569. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_softcap_sm100.cu +0 -0
  570. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_softcap_sm110.cu +0 -0
  571. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_softcap_sm120.cu +0 -0
  572. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_softcap_sm90.cu +0 -0
  573. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_packgqa_sm100.cu +0 -0
  574. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_packgqa_sm110.cu +0 -0
  575. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_packgqa_sm120.cu +0 -0
  576. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_packgqa_sm90.cu +0 -0
  577. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_sm100.cu +0 -0
  578. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_sm110.cu +0 -0
  579. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_sm120.cu +0 -0
  580. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_sm90.cu +0 -0
  581. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_softcap_packgqa_sm100.cu +0 -0
  582. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_softcap_packgqa_sm110.cu +0 -0
  583. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_softcap_packgqa_sm120.cu +0 -0
  584. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_softcap_packgqa_sm90.cu +0 -0
  585. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_softcap_sm100.cu +0 -0
  586. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_softcap_sm110.cu +0 -0
  587. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_softcap_sm120.cu +0 -0
  588. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_paged_split_softcap_sm90.cu +0 -0
  589. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_sm100.cu +0 -0
  590. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_sm110.cu +0 -0
  591. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_sm120.cu +0 -0
  592. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_sm90.cu +0 -0
  593. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_softcap_packgqa_sm100.cu +0 -0
  594. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_softcap_packgqa_sm110.cu +0 -0
  595. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_softcap_packgqa_sm120.cu +0 -0
  596. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_softcap_packgqa_sm90.cu +0 -0
  597. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_softcap_sm100.cu +0 -0
  598. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_softcap_sm110.cu +0 -0
  599. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_softcap_sm120.cu +0 -0
  600. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_softcap_sm90.cu +0 -0
  601. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_packgqa_sm100.cu +0 -0
  602. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_packgqa_sm110.cu +0 -0
  603. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_packgqa_sm120.cu +0 -0
  604. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_packgqa_sm90.cu +0 -0
  605. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_sm100.cu +0 -0
  606. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_sm110.cu +0 -0
  607. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_sm120.cu +0 -0
  608. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_sm90.cu +0 -0
  609. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_softcap_packgqa_sm100.cu +0 -0
  610. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_softcap_packgqa_sm110.cu +0 -0
  611. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_softcap_packgqa_sm120.cu +0 -0
  612. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_softcap_packgqa_sm90.cu +0 -0
  613. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_softcap_sm100.cu +0 -0
  614. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_softcap_sm110.cu +0 -0
  615. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_softcap_sm120.cu +0 -0
  616. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_e4m3_split_softcap_sm90.cu +0 -0
  617. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_packgqa_sm100.cu +0 -0
  618. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_packgqa_sm110.cu +0 -0
  619. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_packgqa_sm120.cu +0 -0
  620. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_packgqa_sm80.cu +0 -0
  621. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_packgqa_sm90.cu +0 -0
  622. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_packgqa_sm100.cu +0 -0
  623. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_packgqa_sm110.cu +0 -0
  624. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_packgqa_sm120.cu +0 -0
  625. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_packgqa_sm80.cu +0 -0
  626. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_packgqa_sm90.cu +0 -0
  627. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_sm100.cu +0 -0
  628. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_sm110.cu +0 -0
  629. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_sm120.cu +0 -0
  630. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_sm80.cu +0 -0
  631. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_sm90.cu +0 -0
  632. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcap_packgqa_sm100.cu +0 -0
  633. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcap_packgqa_sm110.cu +0 -0
  634. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcap_packgqa_sm120.cu +0 -0
  635. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcap_packgqa_sm80.cu +0 -0
  636. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcap_packgqa_sm90.cu +0 -0
  637. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcap_sm100.cu +0 -0
  638. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcap_sm110.cu +0 -0
  639. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcap_sm120.cu +0 -0
  640. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcap_sm80.cu +0 -0
  641. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcap_sm90.cu +0 -0
  642. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_softcapall_sm80.cu +0 -0
  643. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_packgqa_sm100.cu +0 -0
  644. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_packgqa_sm110.cu +0 -0
  645. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_packgqa_sm120.cu +0 -0
  646. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_packgqa_sm80.cu +0 -0
  647. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_packgqa_sm90.cu +0 -0
  648. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_sm100.cu +0 -0
  649. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_sm110.cu +0 -0
  650. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_sm120.cu +0 -0
  651. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_sm80.cu +0 -0
  652. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_sm90.cu +0 -0
  653. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcap_packgqa_sm100.cu +0 -0
  654. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcap_packgqa_sm110.cu +0 -0
  655. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcap_packgqa_sm120.cu +0 -0
  656. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcap_packgqa_sm80.cu +0 -0
  657. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcap_packgqa_sm90.cu +0 -0
  658. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcap_sm100.cu +0 -0
  659. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcap_sm110.cu +0 -0
  660. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcap_sm120.cu +0 -0
  661. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcap_sm80.cu +0 -0
  662. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcap_sm90.cu +0 -0
  663. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_paged_split_softcapall_sm80.cu +0 -0
  664. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_sm100.cu +0 -0
  665. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_sm110.cu +0 -0
  666. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_sm120.cu +0 -0
  667. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_sm80.cu +0 -0
  668. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_sm90.cu +0 -0
  669. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcap_packgqa_sm100.cu +0 -0
  670. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcap_packgqa_sm110.cu +0 -0
  671. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcap_packgqa_sm120.cu +0 -0
  672. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcap_packgqa_sm80.cu +0 -0
  673. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcap_packgqa_sm90.cu +0 -0
  674. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcap_sm100.cu +0 -0
  675. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcap_sm110.cu +0 -0
  676. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcap_sm120.cu +0 -0
  677. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcap_sm80.cu +0 -0
  678. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcap_sm90.cu +0 -0
  679. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_softcapall_sm80.cu +0 -0
  680. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_packgqa_sm100.cu +0 -0
  681. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_packgqa_sm110.cu +0 -0
  682. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_packgqa_sm120.cu +0 -0
  683. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_packgqa_sm80.cu +0 -0
  684. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_packgqa_sm90.cu +0 -0
  685. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_sm100.cu +0 -0
  686. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_sm110.cu +0 -0
  687. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_sm120.cu +0 -0
  688. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_sm80.cu +0 -0
  689. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_sm90.cu +0 -0
  690. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcap_packgqa_sm100.cu +0 -0
  691. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcap_packgqa_sm110.cu +0 -0
  692. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcap_packgqa_sm120.cu +0 -0
  693. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcap_packgqa_sm80.cu +0 -0
  694. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcap_packgqa_sm90.cu +0 -0
  695. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcap_sm100.cu +0 -0
  696. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcap_sm110.cu +0 -0
  697. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcap_sm120.cu +0 -0
  698. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcap_sm80.cu +0 -0
  699. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcap_sm90.cu +0 -0
  700. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim192_fp16_split_softcapall_sm80.cu +0 -0
  701. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_packgqa_sm100.cu +0 -0
  702. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_packgqa_sm110.cu +0 -0
  703. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_packgqa_sm120.cu +0 -0
  704. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_packgqa_sm80.cu +0 -0
  705. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_packgqa_sm90.cu +0 -0
  706. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_packgqa_sm100.cu +0 -0
  707. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_packgqa_sm110.cu +0 -0
  708. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_packgqa_sm120.cu +0 -0
  709. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_packgqa_sm80.cu +0 -0
  710. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_packgqa_sm90.cu +0 -0
  711. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_sm100.cu +0 -0
  712. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_sm110.cu +0 -0
  713. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_sm120.cu +0 -0
  714. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_sm80.cu +0 -0
  715. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_sm90.cu +0 -0
  716. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcap_packgqa_sm100.cu +0 -0
  717. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcap_packgqa_sm110.cu +0 -0
  718. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcap_packgqa_sm120.cu +0 -0
  719. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcap_packgqa_sm80.cu +0 -0
  720. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcap_packgqa_sm90.cu +0 -0
  721. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcap_sm100.cu +0 -0
  722. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcap_sm110.cu +0 -0
  723. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcap_sm120.cu +0 -0
  724. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcap_sm80.cu +0 -0
  725. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcap_sm90.cu +0 -0
  726. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_softcapall_sm80.cu +0 -0
  727. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_packgqa_sm100.cu +0 -0
  728. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_packgqa_sm110.cu +0 -0
  729. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_packgqa_sm120.cu +0 -0
  730. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_packgqa_sm80.cu +0 -0
  731. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_packgqa_sm90.cu +0 -0
  732. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_sm100.cu +0 -0
  733. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_sm110.cu +0 -0
  734. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_sm120.cu +0 -0
  735. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_sm80.cu +0 -0
  736. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_sm90.cu +0 -0
  737. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcap_packgqa_sm100.cu +0 -0
  738. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcap_packgqa_sm110.cu +0 -0
  739. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcap_packgqa_sm120.cu +0 -0
  740. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcap_packgqa_sm80.cu +0 -0
  741. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcap_packgqa_sm90.cu +0 -0
  742. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcap_sm100.cu +0 -0
  743. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcap_sm110.cu +0 -0
  744. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcap_sm120.cu +0 -0
  745. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcap_sm80.cu +0 -0
  746. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcap_sm90.cu +0 -0
  747. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_paged_split_softcapall_sm80.cu +0 -0
  748. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_sm100.cu +0 -0
  749. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_sm110.cu +0 -0
  750. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_sm120.cu +0 -0
  751. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_sm80.cu +0 -0
  752. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_sm90.cu +0 -0
  753. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcap_packgqa_sm100.cu +0 -0
  754. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcap_packgqa_sm110.cu +0 -0
  755. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcap_packgqa_sm120.cu +0 -0
  756. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcap_packgqa_sm80.cu +0 -0
  757. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcap_packgqa_sm90.cu +0 -0
  758. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcap_sm100.cu +0 -0
  759. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcap_sm110.cu +0 -0
  760. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcap_sm120.cu +0 -0
  761. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcap_sm80.cu +0 -0
  762. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcap_sm90.cu +0 -0
  763. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_softcapall_sm80.cu +0 -0
  764. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_packgqa_sm100.cu +0 -0
  765. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_packgqa_sm110.cu +0 -0
  766. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_packgqa_sm120.cu +0 -0
  767. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_packgqa_sm80.cu +0 -0
  768. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_packgqa_sm90.cu +0 -0
  769. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_sm100.cu +0 -0
  770. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_sm110.cu +0 -0
  771. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_sm120.cu +0 -0
  772. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_sm80.cu +0 -0
  773. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_sm90.cu +0 -0
  774. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcap_packgqa_sm100.cu +0 -0
  775. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcap_packgqa_sm110.cu +0 -0
  776. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcap_packgqa_sm120.cu +0 -0
  777. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcap_packgqa_sm80.cu +0 -0
  778. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcap_packgqa_sm90.cu +0 -0
  779. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcap_sm100.cu +0 -0
  780. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcap_sm110.cu +0 -0
  781. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcap_sm120.cu +0 -0
  782. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcap_sm80.cu +0 -0
  783. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcap_sm90.cu +0 -0
  784. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_bf16_split_softcapall_sm80.cu +0 -0
  785. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_packgqa_sm100.cu +0 -0
  786. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_packgqa_sm110.cu +0 -0
  787. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_packgqa_sm120.cu +0 -0
  788. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_packgqa_sm90.cu +0 -0
  789. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_packgqa_sm100.cu +0 -0
  790. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_packgqa_sm110.cu +0 -0
  791. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_packgqa_sm120.cu +0 -0
  792. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_packgqa_sm90.cu +0 -0
  793. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_sm100.cu +0 -0
  794. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_sm110.cu +0 -0
  795. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_sm120.cu +0 -0
  796. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_sm90.cu +0 -0
  797. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_softcap_packgqa_sm100.cu +0 -0
  798. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_softcap_packgqa_sm110.cu +0 -0
  799. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_softcap_packgqa_sm120.cu +0 -0
  800. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_softcap_packgqa_sm90.cu +0 -0
  801. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_softcap_sm100.cu +0 -0
  802. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_softcap_sm110.cu +0 -0
  803. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_softcap_sm120.cu +0 -0
  804. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_softcap_sm90.cu +0 -0
  805. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_packgqa_sm100.cu +0 -0
  806. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_packgqa_sm110.cu +0 -0
  807. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_packgqa_sm120.cu +0 -0
  808. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_packgqa_sm90.cu +0 -0
  809. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_sm100.cu +0 -0
  810. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_sm110.cu +0 -0
  811. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_sm120.cu +0 -0
  812. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_sm90.cu +0 -0
  813. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_softcap_packgqa_sm100.cu +0 -0
  814. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_softcap_packgqa_sm110.cu +0 -0
  815. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_softcap_packgqa_sm120.cu +0 -0
  816. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_softcap_packgqa_sm90.cu +0 -0
  817. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_softcap_sm100.cu +0 -0
  818. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_softcap_sm110.cu +0 -0
  819. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_softcap_sm120.cu +0 -0
  820. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_paged_split_softcap_sm90.cu +0 -0
  821. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_sm100.cu +0 -0
  822. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_sm110.cu +0 -0
  823. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_sm120.cu +0 -0
  824. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_sm90.cu +0 -0
  825. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_softcap_packgqa_sm100.cu +0 -0
  826. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_softcap_packgqa_sm110.cu +0 -0
  827. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_softcap_packgqa_sm120.cu +0 -0
  828. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_softcap_packgqa_sm90.cu +0 -0
  829. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_softcap_sm100.cu +0 -0
  830. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_softcap_sm110.cu +0 -0
  831. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_softcap_sm120.cu +0 -0
  832. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_softcap_sm90.cu +0 -0
  833. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_packgqa_sm100.cu +0 -0
  834. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_packgqa_sm110.cu +0 -0
  835. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_packgqa_sm120.cu +0 -0
  836. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_packgqa_sm90.cu +0 -0
  837. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_sm100.cu +0 -0
  838. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_sm110.cu +0 -0
  839. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_sm120.cu +0 -0
  840. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_sm90.cu +0 -0
  841. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_softcap_packgqa_sm100.cu +0 -0
  842. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_softcap_packgqa_sm110.cu +0 -0
  843. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_softcap_packgqa_sm120.cu +0 -0
  844. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_softcap_packgqa_sm90.cu +0 -0
  845. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_softcap_sm100.cu +0 -0
  846. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_softcap_sm110.cu +0 -0
  847. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_softcap_sm120.cu +0 -0
  848. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_e4m3_split_softcap_sm90.cu +0 -0
  849. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_packgqa_sm100.cu +0 -0
  850. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_packgqa_sm110.cu +0 -0
  851. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_packgqa_sm120.cu +0 -0
  852. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_packgqa_sm80.cu +0 -0
  853. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_packgqa_sm90.cu +0 -0
  854. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_packgqa_sm100.cu +0 -0
  855. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_packgqa_sm110.cu +0 -0
  856. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_packgqa_sm120.cu +0 -0
  857. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_packgqa_sm80.cu +0 -0
  858. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_packgqa_sm90.cu +0 -0
  859. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_sm100.cu +0 -0
  860. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_sm110.cu +0 -0
  861. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_sm120.cu +0 -0
  862. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_sm80.cu +0 -0
  863. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_sm90.cu +0 -0
  864. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcap_packgqa_sm100.cu +0 -0
  865. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcap_packgqa_sm110.cu +0 -0
  866. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcap_packgqa_sm120.cu +0 -0
  867. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcap_packgqa_sm80.cu +0 -0
  868. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcap_packgqa_sm90.cu +0 -0
  869. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcap_sm100.cu +0 -0
  870. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcap_sm110.cu +0 -0
  871. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcap_sm120.cu +0 -0
  872. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcap_sm80.cu +0 -0
  873. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcap_sm90.cu +0 -0
  874. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_softcapall_sm80.cu +0 -0
  875. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_packgqa_sm100.cu +0 -0
  876. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_packgqa_sm110.cu +0 -0
  877. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_packgqa_sm120.cu +0 -0
  878. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_packgqa_sm80.cu +0 -0
  879. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_packgqa_sm90.cu +0 -0
  880. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_sm100.cu +0 -0
  881. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_sm110.cu +0 -0
  882. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_sm120.cu +0 -0
  883. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_sm80.cu +0 -0
  884. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_sm90.cu +0 -0
  885. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcap_packgqa_sm100.cu +0 -0
  886. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcap_packgqa_sm110.cu +0 -0
  887. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcap_packgqa_sm120.cu +0 -0
  888. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcap_packgqa_sm80.cu +0 -0
  889. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcap_packgqa_sm90.cu +0 -0
  890. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcap_sm100.cu +0 -0
  891. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcap_sm110.cu +0 -0
  892. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcap_sm120.cu +0 -0
  893. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcap_sm80.cu +0 -0
  894. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcap_sm90.cu +0 -0
  895. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_paged_split_softcapall_sm80.cu +0 -0
  896. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_sm100.cu +0 -0
  897. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_sm110.cu +0 -0
  898. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_sm120.cu +0 -0
  899. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_sm80.cu +0 -0
  900. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_sm90.cu +0 -0
  901. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcap_packgqa_sm100.cu +0 -0
  902. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcap_packgqa_sm110.cu +0 -0
  903. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcap_packgqa_sm120.cu +0 -0
  904. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcap_packgqa_sm80.cu +0 -0
  905. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcap_packgqa_sm90.cu +0 -0
  906. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcap_sm100.cu +0 -0
  907. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcap_sm110.cu +0 -0
  908. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcap_sm120.cu +0 -0
  909. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcap_sm80.cu +0 -0
  910. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcap_sm90.cu +0 -0
  911. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_softcapall_sm80.cu +0 -0
  912. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_packgqa_sm100.cu +0 -0
  913. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_packgqa_sm110.cu +0 -0
  914. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_packgqa_sm120.cu +0 -0
  915. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_packgqa_sm80.cu +0 -0
  916. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_packgqa_sm90.cu +0 -0
  917. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_sm100.cu +0 -0
  918. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_sm110.cu +0 -0
  919. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_sm120.cu +0 -0
  920. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_sm80.cu +0 -0
  921. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_sm90.cu +0 -0
  922. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcap_packgqa_sm100.cu +0 -0
  923. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcap_packgqa_sm110.cu +0 -0
  924. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcap_packgqa_sm120.cu +0 -0
  925. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcap_packgqa_sm80.cu +0 -0
  926. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcap_packgqa_sm90.cu +0 -0
  927. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcap_sm100.cu +0 -0
  928. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcap_sm110.cu +0 -0
  929. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcap_sm120.cu +0 -0
  930. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcap_sm80.cu +0 -0
  931. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcap_sm90.cu +0 -0
  932. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim256_fp16_split_softcapall_sm80.cu +0 -0
  933. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_bf16_packgqa_sm90.cu +0 -0
  934. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_bf16_paged_sm90.cu +0 -0
  935. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_bf16_paged_softcap_sm90.cu +0 -0
  936. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_bf16_paged_split_sm90.cu +0 -0
  937. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_bf16_paged_split_softcap_sm90.cu +0 -0
  938. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_bf16_sm90.cu +0 -0
  939. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_bf16_softcap_packgqa_sm90.cu +0 -0
  940. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_bf16_softcap_sm90.cu +0 -0
  941. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_bf16_split_sm90.cu +0 -0
  942. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_bf16_split_softcap_sm90.cu +0 -0
  943. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_fp16_packgqa_sm90.cu +0 -0
  944. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_fp16_paged_sm90.cu +0 -0
  945. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_fp16_paged_softcap_sm90.cu +0 -0
  946. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_fp16_paged_split_sm90.cu +0 -0
  947. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_fp16_paged_split_softcap_sm90.cu +0 -0
  948. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_fp16_sm90.cu +0 -0
  949. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_fp16_softcap_packgqa_sm90.cu +0 -0
  950. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_fp16_softcap_sm90.cu +0 -0
  951. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_fp16_split_sm90.cu +0 -0
  952. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_256_fp16_split_softcap_sm90.cu +0 -0
  953. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_bf16_packgqa_sm90.cu +0 -0
  954. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_bf16_paged_sm90.cu +0 -0
  955. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_bf16_paged_softcap_sm90.cu +0 -0
  956. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_bf16_paged_split_sm90.cu +0 -0
  957. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_bf16_paged_split_softcap_sm90.cu +0 -0
  958. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_bf16_sm90.cu +0 -0
  959. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_bf16_softcap_packgqa_sm90.cu +0 -0
  960. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_bf16_softcap_sm90.cu +0 -0
  961. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_bf16_split_sm90.cu +0 -0
  962. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_bf16_split_softcap_sm90.cu +0 -0
  963. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_fp16_packgqa_sm90.cu +0 -0
  964. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_fp16_paged_sm90.cu +0 -0
  965. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_fp16_paged_softcap_sm90.cu +0 -0
  966. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_fp16_paged_split_sm90.cu +0 -0
  967. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_fp16_paged_split_softcap_sm90.cu +0 -0
  968. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_fp16_sm90.cu +0 -0
  969. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_fp16_softcap_packgqa_sm90.cu +0 -0
  970. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_fp16_softcap_sm90.cu +0 -0
  971. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_fp16_split_sm90.cu +0 -0
  972. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_512_fp16_split_softcap_sm90.cu +0 -0
  973. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_packgqa_sm100.cu +0 -0
  974. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_packgqa_sm110.cu +0 -0
  975. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_packgqa_sm120.cu +0 -0
  976. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_packgqa_sm80.cu +0 -0
  977. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_packgqa_sm90.cu +0 -0
  978. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_packgqa_sm100.cu +0 -0
  979. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_packgqa_sm110.cu +0 -0
  980. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_packgqa_sm120.cu +0 -0
  981. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_packgqa_sm80.cu +0 -0
  982. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_packgqa_sm90.cu +0 -0
  983. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_sm100.cu +0 -0
  984. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_sm110.cu +0 -0
  985. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_sm120.cu +0 -0
  986. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_sm80.cu +0 -0
  987. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_sm90.cu +0 -0
  988. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcap_packgqa_sm100.cu +0 -0
  989. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcap_packgqa_sm110.cu +0 -0
  990. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcap_packgqa_sm120.cu +0 -0
  991. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcap_packgqa_sm80.cu +0 -0
  992. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcap_packgqa_sm90.cu +0 -0
  993. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcap_sm100.cu +0 -0
  994. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcap_sm110.cu +0 -0
  995. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcap_sm120.cu +0 -0
  996. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcap_sm80.cu +0 -0
  997. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcap_sm90.cu +0 -0
  998. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_softcapall_sm80.cu +0 -0
  999. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_packgqa_sm100.cu +0 -0
  1000. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_packgqa_sm110.cu +0 -0
  1001. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_packgqa_sm120.cu +0 -0
  1002. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_packgqa_sm80.cu +0 -0
  1003. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_packgqa_sm90.cu +0 -0
  1004. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_sm100.cu +0 -0
  1005. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_sm110.cu +0 -0
  1006. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_sm120.cu +0 -0
  1007. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_sm80.cu +0 -0
  1008. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_sm90.cu +0 -0
  1009. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcap_packgqa_sm100.cu +0 -0
  1010. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcap_packgqa_sm110.cu +0 -0
  1011. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcap_packgqa_sm120.cu +0 -0
  1012. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcap_packgqa_sm80.cu +0 -0
  1013. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcap_packgqa_sm90.cu +0 -0
  1014. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcap_sm100.cu +0 -0
  1015. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcap_sm110.cu +0 -0
  1016. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcap_sm120.cu +0 -0
  1017. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcap_sm80.cu +0 -0
  1018. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcap_sm90.cu +0 -0
  1019. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_paged_split_softcapall_sm80.cu +0 -0
  1020. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_sm100.cu +0 -0
  1021. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_sm110.cu +0 -0
  1022. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_sm120.cu +0 -0
  1023. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_sm80.cu +0 -0
  1024. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_sm90.cu +0 -0
  1025. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcap_packgqa_sm100.cu +0 -0
  1026. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcap_packgqa_sm110.cu +0 -0
  1027. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcap_packgqa_sm120.cu +0 -0
  1028. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcap_packgqa_sm80.cu +0 -0
  1029. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcap_packgqa_sm90.cu +0 -0
  1030. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcap_sm100.cu +0 -0
  1031. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcap_sm110.cu +0 -0
  1032. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcap_sm120.cu +0 -0
  1033. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcap_sm80.cu +0 -0
  1034. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcap_sm90.cu +0 -0
  1035. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_softcapall_sm80.cu +0 -0
  1036. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_packgqa_sm100.cu +0 -0
  1037. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_packgqa_sm110.cu +0 -0
  1038. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_packgqa_sm120.cu +0 -0
  1039. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_packgqa_sm80.cu +0 -0
  1040. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_packgqa_sm90.cu +0 -0
  1041. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_sm100.cu +0 -0
  1042. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_sm110.cu +0 -0
  1043. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_sm120.cu +0 -0
  1044. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_sm80.cu +0 -0
  1045. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_sm90.cu +0 -0
  1046. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcap_packgqa_sm100.cu +0 -0
  1047. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcap_packgqa_sm110.cu +0 -0
  1048. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcap_packgqa_sm120.cu +0 -0
  1049. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcap_packgqa_sm80.cu +0 -0
  1050. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcap_packgqa_sm90.cu +0 -0
  1051. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcap_sm100.cu +0 -0
  1052. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcap_sm110.cu +0 -0
  1053. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcap_sm120.cu +0 -0
  1054. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcap_sm80.cu +0 -0
  1055. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcap_sm90.cu +0 -0
  1056. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_bf16_split_softcapall_sm80.cu +0 -0
  1057. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_packgqa_sm100.cu +0 -0
  1058. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_packgqa_sm110.cu +0 -0
  1059. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_packgqa_sm120.cu +0 -0
  1060. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_packgqa_sm90.cu +0 -0
  1061. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_packgqa_sm100.cu +0 -0
  1062. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_packgqa_sm110.cu +0 -0
  1063. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_packgqa_sm120.cu +0 -0
  1064. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_packgqa_sm90.cu +0 -0
  1065. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_sm100.cu +0 -0
  1066. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_sm110.cu +0 -0
  1067. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_sm120.cu +0 -0
  1068. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_sm90.cu +0 -0
  1069. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_softcap_packgqa_sm100.cu +0 -0
  1070. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_softcap_packgqa_sm110.cu +0 -0
  1071. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_softcap_packgqa_sm120.cu +0 -0
  1072. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_softcap_packgqa_sm90.cu +0 -0
  1073. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_softcap_sm100.cu +0 -0
  1074. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_softcap_sm110.cu +0 -0
  1075. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_softcap_sm120.cu +0 -0
  1076. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_softcap_sm90.cu +0 -0
  1077. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_packgqa_sm100.cu +0 -0
  1078. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_packgqa_sm110.cu +0 -0
  1079. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_packgqa_sm120.cu +0 -0
  1080. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_packgqa_sm90.cu +0 -0
  1081. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_sm100.cu +0 -0
  1082. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_sm110.cu +0 -0
  1083. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_sm120.cu +0 -0
  1084. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_sm90.cu +0 -0
  1085. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_softcap_packgqa_sm100.cu +0 -0
  1086. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_softcap_packgqa_sm110.cu +0 -0
  1087. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_softcap_packgqa_sm120.cu +0 -0
  1088. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_softcap_packgqa_sm90.cu +0 -0
  1089. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_softcap_sm100.cu +0 -0
  1090. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_softcap_sm110.cu +0 -0
  1091. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_softcap_sm120.cu +0 -0
  1092. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_paged_split_softcap_sm90.cu +0 -0
  1093. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_sm100.cu +0 -0
  1094. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_sm110.cu +0 -0
  1095. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_sm120.cu +0 -0
  1096. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_sm90.cu +0 -0
  1097. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_softcap_packgqa_sm100.cu +0 -0
  1098. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_softcap_packgqa_sm110.cu +0 -0
  1099. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_softcap_packgqa_sm120.cu +0 -0
  1100. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_softcap_packgqa_sm90.cu +0 -0
  1101. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_softcap_sm100.cu +0 -0
  1102. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_softcap_sm110.cu +0 -0
  1103. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_softcap_sm120.cu +0 -0
  1104. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_softcap_sm90.cu +0 -0
  1105. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_packgqa_sm100.cu +0 -0
  1106. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_packgqa_sm110.cu +0 -0
  1107. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_packgqa_sm120.cu +0 -0
  1108. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_packgqa_sm90.cu +0 -0
  1109. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_sm100.cu +0 -0
  1110. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_sm110.cu +0 -0
  1111. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_sm120.cu +0 -0
  1112. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_sm90.cu +0 -0
  1113. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_softcap_packgqa_sm100.cu +0 -0
  1114. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_softcap_packgqa_sm110.cu +0 -0
  1115. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_softcap_packgqa_sm120.cu +0 -0
  1116. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_softcap_packgqa_sm90.cu +0 -0
  1117. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_softcap_sm100.cu +0 -0
  1118. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_softcap_sm110.cu +0 -0
  1119. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_softcap_sm120.cu +0 -0
  1120. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_e4m3_split_softcap_sm90.cu +0 -0
  1121. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_packgqa_sm100.cu +0 -0
  1122. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_packgqa_sm110.cu +0 -0
  1123. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_packgqa_sm120.cu +0 -0
  1124. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_packgqa_sm80.cu +0 -0
  1125. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_packgqa_sm90.cu +0 -0
  1126. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_packgqa_sm100.cu +0 -0
  1127. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_packgqa_sm110.cu +0 -0
  1128. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_packgqa_sm120.cu +0 -0
  1129. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_packgqa_sm80.cu +0 -0
  1130. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_packgqa_sm90.cu +0 -0
  1131. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_sm100.cu +0 -0
  1132. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_sm110.cu +0 -0
  1133. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_sm120.cu +0 -0
  1134. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_sm80.cu +0 -0
  1135. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_sm90.cu +0 -0
  1136. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcap_packgqa_sm100.cu +0 -0
  1137. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcap_packgqa_sm110.cu +0 -0
  1138. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcap_packgqa_sm120.cu +0 -0
  1139. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcap_packgqa_sm80.cu +0 -0
  1140. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcap_packgqa_sm90.cu +0 -0
  1141. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcap_sm100.cu +0 -0
  1142. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcap_sm110.cu +0 -0
  1143. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcap_sm120.cu +0 -0
  1144. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcap_sm80.cu +0 -0
  1145. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcap_sm90.cu +0 -0
  1146. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_softcapall_sm80.cu +0 -0
  1147. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_packgqa_sm100.cu +0 -0
  1148. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_packgqa_sm110.cu +0 -0
  1149. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_packgqa_sm120.cu +0 -0
  1150. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_packgqa_sm80.cu +0 -0
  1151. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_packgqa_sm90.cu +0 -0
  1152. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_sm100.cu +0 -0
  1153. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_sm110.cu +0 -0
  1154. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_sm120.cu +0 -0
  1155. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_sm80.cu +0 -0
  1156. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_sm90.cu +0 -0
  1157. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcap_packgqa_sm100.cu +0 -0
  1158. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcap_packgqa_sm110.cu +0 -0
  1159. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcap_packgqa_sm120.cu +0 -0
  1160. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcap_packgqa_sm80.cu +0 -0
  1161. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcap_packgqa_sm90.cu +0 -0
  1162. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcap_sm100.cu +0 -0
  1163. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcap_sm110.cu +0 -0
  1164. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcap_sm120.cu +0 -0
  1165. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcap_sm80.cu +0 -0
  1166. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcap_sm90.cu +0 -0
  1167. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_paged_split_softcapall_sm80.cu +0 -0
  1168. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_sm100.cu +0 -0
  1169. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_sm110.cu +0 -0
  1170. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_sm120.cu +0 -0
  1171. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_sm80.cu +0 -0
  1172. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_sm90.cu +0 -0
  1173. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcap_packgqa_sm100.cu +0 -0
  1174. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcap_packgqa_sm110.cu +0 -0
  1175. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcap_packgqa_sm120.cu +0 -0
  1176. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcap_packgqa_sm80.cu +0 -0
  1177. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcap_packgqa_sm90.cu +0 -0
  1178. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcap_sm100.cu +0 -0
  1179. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcap_sm110.cu +0 -0
  1180. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcap_sm120.cu +0 -0
  1181. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcap_sm80.cu +0 -0
  1182. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcap_sm90.cu +0 -0
  1183. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_softcapall_sm80.cu +0 -0
  1184. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_packgqa_sm100.cu +0 -0
  1185. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_packgqa_sm110.cu +0 -0
  1186. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_packgqa_sm120.cu +0 -0
  1187. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_packgqa_sm80.cu +0 -0
  1188. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_packgqa_sm90.cu +0 -0
  1189. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_sm100.cu +0 -0
  1190. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_sm110.cu +0 -0
  1191. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_sm120.cu +0 -0
  1192. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_sm80.cu +0 -0
  1193. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_sm90.cu +0 -0
  1194. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcap_packgqa_sm100.cu +0 -0
  1195. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcap_packgqa_sm110.cu +0 -0
  1196. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcap_packgqa_sm120.cu +0 -0
  1197. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcap_packgqa_sm80.cu +0 -0
  1198. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcap_packgqa_sm90.cu +0 -0
  1199. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcap_sm100.cu +0 -0
  1200. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcap_sm110.cu +0 -0
  1201. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcap_sm120.cu +0 -0
  1202. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcap_sm80.cu +0 -0
  1203. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcap_sm90.cu +0 -0
  1204. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim64_fp16_split_softcapall_sm80.cu +0 -0
  1205. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_packgqa_sm100.cu +0 -0
  1206. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_packgqa_sm110.cu +0 -0
  1207. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_packgqa_sm120.cu +0 -0
  1208. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_packgqa_sm80.cu +0 -0
  1209. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_packgqa_sm90.cu +0 -0
  1210. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_packgqa_sm100.cu +0 -0
  1211. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_packgqa_sm110.cu +0 -0
  1212. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_packgqa_sm120.cu +0 -0
  1213. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_packgqa_sm80.cu +0 -0
  1214. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_packgqa_sm90.cu +0 -0
  1215. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_sm100.cu +0 -0
  1216. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_sm110.cu +0 -0
  1217. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_sm120.cu +0 -0
  1218. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_sm80.cu +0 -0
  1219. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_sm90.cu +0 -0
  1220. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcap_packgqa_sm100.cu +0 -0
  1221. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcap_packgqa_sm110.cu +0 -0
  1222. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcap_packgqa_sm120.cu +0 -0
  1223. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcap_packgqa_sm80.cu +0 -0
  1224. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcap_packgqa_sm90.cu +0 -0
  1225. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcap_sm100.cu +0 -0
  1226. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcap_sm110.cu +0 -0
  1227. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcap_sm120.cu +0 -0
  1228. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcap_sm80.cu +0 -0
  1229. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcap_sm90.cu +0 -0
  1230. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_softcapall_sm80.cu +0 -0
  1231. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_packgqa_sm100.cu +0 -0
  1232. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_packgqa_sm110.cu +0 -0
  1233. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_packgqa_sm120.cu +0 -0
  1234. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_packgqa_sm80.cu +0 -0
  1235. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_packgqa_sm90.cu +0 -0
  1236. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_sm100.cu +0 -0
  1237. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_sm110.cu +0 -0
  1238. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_sm120.cu +0 -0
  1239. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_sm80.cu +0 -0
  1240. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_sm90.cu +0 -0
  1241. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcap_packgqa_sm100.cu +0 -0
  1242. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcap_packgqa_sm110.cu +0 -0
  1243. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcap_packgqa_sm120.cu +0 -0
  1244. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcap_packgqa_sm80.cu +0 -0
  1245. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcap_packgqa_sm90.cu +0 -0
  1246. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcap_sm100.cu +0 -0
  1247. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcap_sm110.cu +0 -0
  1248. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcap_sm120.cu +0 -0
  1249. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcap_sm80.cu +0 -0
  1250. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcap_sm90.cu +0 -0
  1251. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_paged_split_softcapall_sm80.cu +0 -0
  1252. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_sm100.cu +0 -0
  1253. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_sm110.cu +0 -0
  1254. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_sm120.cu +0 -0
  1255. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_sm80.cu +0 -0
  1256. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_sm90.cu +0 -0
  1257. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcap_packgqa_sm100.cu +0 -0
  1258. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcap_packgqa_sm110.cu +0 -0
  1259. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcap_packgqa_sm120.cu +0 -0
  1260. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcap_packgqa_sm80.cu +0 -0
  1261. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcap_packgqa_sm90.cu +0 -0
  1262. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcap_sm100.cu +0 -0
  1263. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcap_sm110.cu +0 -0
  1264. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcap_sm120.cu +0 -0
  1265. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcap_sm80.cu +0 -0
  1266. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcap_sm90.cu +0 -0
  1267. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_softcapall_sm80.cu +0 -0
  1268. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_packgqa_sm100.cu +0 -0
  1269. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_packgqa_sm110.cu +0 -0
  1270. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_packgqa_sm120.cu +0 -0
  1271. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_packgqa_sm80.cu +0 -0
  1272. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_packgqa_sm90.cu +0 -0
  1273. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_sm100.cu +0 -0
  1274. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_sm110.cu +0 -0
  1275. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_sm120.cu +0 -0
  1276. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_sm80.cu +0 -0
  1277. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_sm90.cu +0 -0
  1278. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcap_packgqa_sm100.cu +0 -0
  1279. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcap_packgqa_sm110.cu +0 -0
  1280. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcap_packgqa_sm120.cu +0 -0
  1281. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcap_packgqa_sm80.cu +0 -0
  1282. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcap_packgqa_sm90.cu +0 -0
  1283. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcap_sm100.cu +0 -0
  1284. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcap_sm110.cu +0 -0
  1285. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcap_sm120.cu +0 -0
  1286. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcap_sm80.cu +0 -0
  1287. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcap_sm90.cu +0 -0
  1288. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_bf16_split_softcapall_sm80.cu +0 -0
  1289. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_packgqa_sm100.cu +0 -0
  1290. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_packgqa_sm110.cu +0 -0
  1291. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_packgqa_sm120.cu +0 -0
  1292. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_packgqa_sm90.cu +0 -0
  1293. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_packgqa_sm100.cu +0 -0
  1294. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_packgqa_sm110.cu +0 -0
  1295. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_packgqa_sm120.cu +0 -0
  1296. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_packgqa_sm90.cu +0 -0
  1297. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_sm100.cu +0 -0
  1298. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_sm110.cu +0 -0
  1299. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_sm120.cu +0 -0
  1300. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_sm90.cu +0 -0
  1301. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_softcap_packgqa_sm100.cu +0 -0
  1302. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_softcap_packgqa_sm110.cu +0 -0
  1303. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_softcap_packgqa_sm120.cu +0 -0
  1304. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_softcap_packgqa_sm90.cu +0 -0
  1305. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_softcap_sm100.cu +0 -0
  1306. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_softcap_sm110.cu +0 -0
  1307. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_softcap_sm120.cu +0 -0
  1308. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_softcap_sm90.cu +0 -0
  1309. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_packgqa_sm100.cu +0 -0
  1310. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_packgqa_sm110.cu +0 -0
  1311. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_packgqa_sm120.cu +0 -0
  1312. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_packgqa_sm90.cu +0 -0
  1313. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_sm100.cu +0 -0
  1314. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_sm110.cu +0 -0
  1315. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_sm120.cu +0 -0
  1316. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_sm90.cu +0 -0
  1317. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_softcap_packgqa_sm100.cu +0 -0
  1318. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_softcap_packgqa_sm110.cu +0 -0
  1319. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_softcap_packgqa_sm120.cu +0 -0
  1320. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_softcap_packgqa_sm90.cu +0 -0
  1321. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_softcap_sm100.cu +0 -0
  1322. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_softcap_sm110.cu +0 -0
  1323. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_softcap_sm120.cu +0 -0
  1324. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_paged_split_softcap_sm90.cu +0 -0
  1325. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_sm100.cu +0 -0
  1326. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_sm110.cu +0 -0
  1327. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_sm120.cu +0 -0
  1328. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_sm90.cu +0 -0
  1329. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_softcap_packgqa_sm100.cu +0 -0
  1330. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_softcap_packgqa_sm110.cu +0 -0
  1331. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_softcap_packgqa_sm120.cu +0 -0
  1332. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_softcap_packgqa_sm90.cu +0 -0
  1333. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_softcap_sm100.cu +0 -0
  1334. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_softcap_sm110.cu +0 -0
  1335. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_softcap_sm120.cu +0 -0
  1336. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_softcap_sm90.cu +0 -0
  1337. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_packgqa_sm100.cu +0 -0
  1338. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_packgqa_sm110.cu +0 -0
  1339. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_packgqa_sm120.cu +0 -0
  1340. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_packgqa_sm90.cu +0 -0
  1341. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_sm100.cu +0 -0
  1342. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_sm110.cu +0 -0
  1343. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_sm120.cu +0 -0
  1344. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_sm90.cu +0 -0
  1345. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_softcap_packgqa_sm100.cu +0 -0
  1346. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_softcap_packgqa_sm110.cu +0 -0
  1347. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_softcap_packgqa_sm120.cu +0 -0
  1348. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_softcap_packgqa_sm90.cu +0 -0
  1349. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_softcap_sm100.cu +0 -0
  1350. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_softcap_sm110.cu +0 -0
  1351. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_softcap_sm120.cu +0 -0
  1352. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_e4m3_split_softcap_sm90.cu +0 -0
  1353. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_packgqa_sm100.cu +0 -0
  1354. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_packgqa_sm110.cu +0 -0
  1355. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_packgqa_sm120.cu +0 -0
  1356. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_packgqa_sm80.cu +0 -0
  1357. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_packgqa_sm90.cu +0 -0
  1358. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_packgqa_sm100.cu +0 -0
  1359. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_packgqa_sm110.cu +0 -0
  1360. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_packgqa_sm120.cu +0 -0
  1361. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_packgqa_sm80.cu +0 -0
  1362. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_packgqa_sm90.cu +0 -0
  1363. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_sm100.cu +0 -0
  1364. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_sm110.cu +0 -0
  1365. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_sm120.cu +0 -0
  1366. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_sm80.cu +0 -0
  1367. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_sm90.cu +0 -0
  1368. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcap_packgqa_sm100.cu +0 -0
  1369. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcap_packgqa_sm110.cu +0 -0
  1370. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcap_packgqa_sm120.cu +0 -0
  1371. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcap_packgqa_sm80.cu +0 -0
  1372. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcap_packgqa_sm90.cu +0 -0
  1373. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcap_sm100.cu +0 -0
  1374. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcap_sm110.cu +0 -0
  1375. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcap_sm120.cu +0 -0
  1376. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcap_sm80.cu +0 -0
  1377. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcap_sm90.cu +0 -0
  1378. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_softcapall_sm80.cu +0 -0
  1379. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_packgqa_sm100.cu +0 -0
  1380. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_packgqa_sm110.cu +0 -0
  1381. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_packgqa_sm120.cu +0 -0
  1382. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_packgqa_sm80.cu +0 -0
  1383. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_packgqa_sm90.cu +0 -0
  1384. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_sm100.cu +0 -0
  1385. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_sm110.cu +0 -0
  1386. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_sm120.cu +0 -0
  1387. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_sm80.cu +0 -0
  1388. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_sm90.cu +0 -0
  1389. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcap_packgqa_sm100.cu +0 -0
  1390. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcap_packgqa_sm110.cu +0 -0
  1391. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcap_packgqa_sm120.cu +0 -0
  1392. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcap_packgqa_sm80.cu +0 -0
  1393. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcap_packgqa_sm90.cu +0 -0
  1394. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcap_sm100.cu +0 -0
  1395. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcap_sm110.cu +0 -0
  1396. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcap_sm120.cu +0 -0
  1397. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcap_sm80.cu +0 -0
  1398. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcap_sm90.cu +0 -0
  1399. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_paged_split_softcapall_sm80.cu +0 -0
  1400. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_sm100.cu +0 -0
  1401. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_sm110.cu +0 -0
  1402. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_sm120.cu +0 -0
  1403. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_sm80.cu +0 -0
  1404. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_sm90.cu +0 -0
  1405. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcap_packgqa_sm100.cu +0 -0
  1406. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcap_packgqa_sm110.cu +0 -0
  1407. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcap_packgqa_sm120.cu +0 -0
  1408. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcap_packgqa_sm80.cu +0 -0
  1409. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcap_packgqa_sm90.cu +0 -0
  1410. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcap_sm100.cu +0 -0
  1411. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcap_sm110.cu +0 -0
  1412. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcap_sm120.cu +0 -0
  1413. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcap_sm80.cu +0 -0
  1414. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcap_sm90.cu +0 -0
  1415. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_softcapall_sm80.cu +0 -0
  1416. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_packgqa_sm100.cu +0 -0
  1417. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_packgqa_sm110.cu +0 -0
  1418. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_packgqa_sm120.cu +0 -0
  1419. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_packgqa_sm80.cu +0 -0
  1420. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_packgqa_sm90.cu +0 -0
  1421. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_sm100.cu +0 -0
  1422. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_sm110.cu +0 -0
  1423. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_sm120.cu +0 -0
  1424. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_sm80.cu +0 -0
  1425. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_sm90.cu +0 -0
  1426. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcap_packgqa_sm100.cu +0 -0
  1427. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcap_packgqa_sm110.cu +0 -0
  1428. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcap_packgqa_sm120.cu +0 -0
  1429. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcap_packgqa_sm80.cu +0 -0
  1430. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcap_packgqa_sm90.cu +0 -0
  1431. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcap_sm100.cu +0 -0
  1432. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcap_sm110.cu +0 -0
  1433. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcap_sm120.cu +0 -0
  1434. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcap_sm80.cu +0 -0
  1435. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcap_sm90.cu +0 -0
  1436. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdim96_fp16_split_softcapall_sm80.cu +0 -0
  1437. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_bf16_packgqa_sm90.cu +0 -0
  1438. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_bf16_paged_sm90.cu +0 -0
  1439. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_bf16_paged_softcap_sm90.cu +0 -0
  1440. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_bf16_paged_split_sm90.cu +0 -0
  1441. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_bf16_paged_split_softcap_sm90.cu +0 -0
  1442. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_bf16_sm90.cu +0 -0
  1443. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_bf16_softcap_packgqa_sm90.cu +0 -0
  1444. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_bf16_softcap_sm90.cu +0 -0
  1445. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_bf16_split_sm90.cu +0 -0
  1446. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_bf16_split_softcap_sm90.cu +0 -0
  1447. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_e4m3_packgqa_sm90.cu +0 -0
  1448. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_e4m3_paged_sm90.cu +0 -0
  1449. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_e4m3_paged_softcap_sm90.cu +0 -0
  1450. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_e4m3_paged_split_sm90.cu +0 -0
  1451. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_e4m3_paged_split_softcap_sm90.cu +0 -0
  1452. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_e4m3_sm90.cu +0 -0
  1453. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_e4m3_softcap_packgqa_sm90.cu +0 -0
  1454. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_e4m3_softcap_sm90.cu +0 -0
  1455. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_e4m3_split_sm90.cu +0 -0
  1456. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_e4m3_split_softcap_sm90.cu +0 -0
  1457. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_fp16_packgqa_sm90.cu +0 -0
  1458. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_fp16_paged_sm90.cu +0 -0
  1459. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_fp16_paged_softcap_sm90.cu +0 -0
  1460. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_fp16_paged_split_sm90.cu +0 -0
  1461. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_fp16_paged_split_softcap_sm90.cu +0 -0
  1462. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_fp16_sm90.cu +0 -0
  1463. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_fp16_softcap_packgqa_sm90.cu +0 -0
  1464. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_fp16_softcap_sm90.cu +0 -0
  1465. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_fp16_split_sm90.cu +0 -0
  1466. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimall_fp16_split_softcap_sm90.cu +0 -0
  1467. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_bf16_packgqa_sm90.cu +0 -0
  1468. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_bf16_paged_sm90.cu +0 -0
  1469. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_bf16_paged_softcap_sm90.cu +0 -0
  1470. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_bf16_paged_split_sm90.cu +0 -0
  1471. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_bf16_paged_split_softcap_sm90.cu +0 -0
  1472. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_bf16_sm90.cu +0 -0
  1473. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_bf16_softcap_packgqa_sm90.cu +0 -0
  1474. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_bf16_softcap_sm90.cu +0 -0
  1475. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_bf16_split_sm90.cu +0 -0
  1476. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_bf16_split_softcap_sm90.cu +0 -0
  1477. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_e4m3_packgqa_sm90.cu +0 -0
  1478. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_e4m3_paged_sm90.cu +0 -0
  1479. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_e4m3_paged_softcap_sm90.cu +0 -0
  1480. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_e4m3_paged_split_sm90.cu +0 -0
  1481. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_e4m3_paged_split_softcap_sm90.cu +0 -0
  1482. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_e4m3_sm90.cu +0 -0
  1483. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_e4m3_softcap_packgqa_sm90.cu +0 -0
  1484. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_e4m3_softcap_sm90.cu +0 -0
  1485. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_e4m3_split_sm90.cu +0 -0
  1486. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_e4m3_split_softcap_sm90.cu +0 -0
  1487. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_fp16_packgqa_sm90.cu +0 -0
  1488. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_fp16_paged_sm90.cu +0 -0
  1489. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_fp16_paged_softcap_sm90.cu +0 -0
  1490. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_fp16_paged_split_sm90.cu +0 -0
  1491. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_fp16_paged_split_softcap_sm90.cu +0 -0
  1492. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_fp16_sm90.cu +0 -0
  1493. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_fp16_softcap_packgqa_sm90.cu +0 -0
  1494. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_fp16_softcap_sm90.cu +0 -0
  1495. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_fp16_split_sm90.cu +0 -0
  1496. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/instantiations/flash_fwd_hdimdiff_fp16_split_softcap_sm90.cu +0 -0
  1497. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/mainloop_bwd_sm80.hpp +0 -0
  1498. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/mainloop_bwd_sm90_tma_gmma_ws.hpp +0 -0
  1499. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/mainloop_fwd_sm80.hpp +0 -0
  1500. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/mainloop_fwd_sm90_tma_gmma_ws.hpp +0 -0
  1501. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/mask.h +0 -0
  1502. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/named_barrier.hpp +0 -0
  1503. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/pack_gqa.h +0 -0
  1504. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/paged_kv.h +0 -0
  1505. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/rotary.h +0 -0
  1506. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/seqlen.h +0 -0
  1507. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/sm90_pipeline_no_cluster.hpp +0 -0
  1508. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/softmax.h +0 -0
  1509. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/static_switch.h +0 -0
  1510. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/tile_scheduler.hpp +0 -0
  1511. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/tile_size.h +0 -0
  1512. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/hopper/utils.h +0 -0
  1513. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/include/c10/cuda/CUDAException.h +0 -0
  1514. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/include/ejkernel_flash_attention.h +0 -0
  1515. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/include/ejkernel_flash_attention_cutlass.h +0 -0
  1516. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/alibi.h +0 -0
  1517. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/aten_shim.h +0 -0
  1518. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/block_info.h +0 -0
  1519. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/code_gen.py +0 -0
  1520. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/dropout.h +0 -0
  1521. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash.h +0 -0
  1522. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_attention_ffi.cu +0 -0
  1523. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_bf16_causal_sm100.cu +0 -0
  1524. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_bf16_causal_sm110.cu +0 -0
  1525. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_bf16_causal_sm120.cu +0 -0
  1526. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_bf16_causal_sm80.cu +0 -0
  1527. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_bf16_causal_sm90.cu +0 -0
  1528. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_bf16_sm100.cu +0 -0
  1529. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_bf16_sm110.cu +0 -0
  1530. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_bf16_sm120.cu +0 -0
  1531. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_bf16_sm80.cu +0 -0
  1532. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_bf16_sm90.cu +0 -0
  1533. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_fp16_causal_sm100.cu +0 -0
  1534. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_fp16_causal_sm110.cu +0 -0
  1535. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_fp16_causal_sm120.cu +0 -0
  1536. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_fp16_causal_sm80.cu +0 -0
  1537. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_fp16_causal_sm90.cu +0 -0
  1538. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_fp16_sm100.cu +0 -0
  1539. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_fp16_sm110.cu +0 -0
  1540. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_fp16_sm120.cu +0 -0
  1541. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_fp16_sm80.cu +0 -0
  1542. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim128_fp16_sm90.cu +0 -0
  1543. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_bf16_causal_sm100.cu +0 -0
  1544. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_bf16_causal_sm110.cu +0 -0
  1545. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_bf16_causal_sm120.cu +0 -0
  1546. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_bf16_causal_sm80.cu +0 -0
  1547. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_bf16_causal_sm90.cu +0 -0
  1548. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_bf16_sm100.cu +0 -0
  1549. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_bf16_sm110.cu +0 -0
  1550. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_bf16_sm120.cu +0 -0
  1551. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_bf16_sm80.cu +0 -0
  1552. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_bf16_sm90.cu +0 -0
  1553. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_fp16_causal_sm100.cu +0 -0
  1554. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_fp16_causal_sm110.cu +0 -0
  1555. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_fp16_causal_sm120.cu +0 -0
  1556. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_fp16_causal_sm80.cu +0 -0
  1557. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_fp16_causal_sm90.cu +0 -0
  1558. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_fp16_sm100.cu +0 -0
  1559. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_fp16_sm110.cu +0 -0
  1560. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_fp16_sm120.cu +0 -0
  1561. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_fp16_sm80.cu +0 -0
  1562. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim192_fp16_sm90.cu +0 -0
  1563. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_bf16_causal_sm100.cu +0 -0
  1564. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_bf16_causal_sm110.cu +0 -0
  1565. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_bf16_causal_sm120.cu +0 -0
  1566. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_bf16_causal_sm80.cu +0 -0
  1567. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_bf16_causal_sm90.cu +0 -0
  1568. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_bf16_sm100.cu +0 -0
  1569. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_bf16_sm110.cu +0 -0
  1570. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_bf16_sm120.cu +0 -0
  1571. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_bf16_sm80.cu +0 -0
  1572. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_bf16_sm90.cu +0 -0
  1573. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_fp16_causal_sm100.cu +0 -0
  1574. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_fp16_causal_sm110.cu +0 -0
  1575. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_fp16_causal_sm120.cu +0 -0
  1576. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_fp16_causal_sm80.cu +0 -0
  1577. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_fp16_causal_sm90.cu +0 -0
  1578. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_fp16_sm100.cu +0 -0
  1579. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_fp16_sm110.cu +0 -0
  1580. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_fp16_sm120.cu +0 -0
  1581. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_fp16_sm80.cu +0 -0
  1582. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim256_fp16_sm90.cu +0 -0
  1583. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_bf16_causal_sm100.cu +0 -0
  1584. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_bf16_causal_sm110.cu +0 -0
  1585. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_bf16_causal_sm120.cu +0 -0
  1586. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_bf16_causal_sm80.cu +0 -0
  1587. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_bf16_causal_sm90.cu +0 -0
  1588. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_bf16_sm100.cu +0 -0
  1589. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_bf16_sm110.cu +0 -0
  1590. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_bf16_sm120.cu +0 -0
  1591. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_bf16_sm80.cu +0 -0
  1592. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_bf16_sm90.cu +0 -0
  1593. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_fp16_causal_sm100.cu +0 -0
  1594. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_fp16_causal_sm110.cu +0 -0
  1595. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_fp16_causal_sm120.cu +0 -0
  1596. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_fp16_causal_sm80.cu +0 -0
  1597. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_fp16_causal_sm90.cu +0 -0
  1598. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_fp16_sm100.cu +0 -0
  1599. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_fp16_sm110.cu +0 -0
  1600. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_fp16_sm120.cu +0 -0
  1601. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_fp16_sm80.cu +0 -0
  1602. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim32_fp16_sm90.cu +0 -0
  1603. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_bf16_causal_sm100.cu +0 -0
  1604. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_bf16_causal_sm110.cu +0 -0
  1605. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_bf16_causal_sm120.cu +0 -0
  1606. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_bf16_causal_sm80.cu +0 -0
  1607. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_bf16_causal_sm90.cu +0 -0
  1608. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_bf16_sm100.cu +0 -0
  1609. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_bf16_sm110.cu +0 -0
  1610. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_bf16_sm120.cu +0 -0
  1611. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_bf16_sm80.cu +0 -0
  1612. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_bf16_sm90.cu +0 -0
  1613. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_fp16_causal_sm100.cu +0 -0
  1614. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_fp16_causal_sm110.cu +0 -0
  1615. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_fp16_causal_sm120.cu +0 -0
  1616. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_fp16_causal_sm80.cu +0 -0
  1617. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_fp16_causal_sm90.cu +0 -0
  1618. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_fp16_sm100.cu +0 -0
  1619. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_fp16_sm110.cu +0 -0
  1620. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_fp16_sm120.cu +0 -0
  1621. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_fp16_sm80.cu +0 -0
  1622. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim64_fp16_sm90.cu +0 -0
  1623. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_bf16_causal_sm100.cu +0 -0
  1624. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_bf16_causal_sm110.cu +0 -0
  1625. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_bf16_causal_sm120.cu +0 -0
  1626. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_bf16_causal_sm80.cu +0 -0
  1627. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_bf16_causal_sm90.cu +0 -0
  1628. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_bf16_sm100.cu +0 -0
  1629. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_bf16_sm110.cu +0 -0
  1630. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_bf16_sm120.cu +0 -0
  1631. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_bf16_sm80.cu +0 -0
  1632. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_bf16_sm90.cu +0 -0
  1633. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_fp16_causal_sm100.cu +0 -0
  1634. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_fp16_causal_sm110.cu +0 -0
  1635. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_fp16_causal_sm120.cu +0 -0
  1636. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_fp16_causal_sm80.cu +0 -0
  1637. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_fp16_causal_sm90.cu +0 -0
  1638. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_fp16_sm100.cu +0 -0
  1639. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_fp16_sm110.cu +0 -0
  1640. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_fp16_sm120.cu +0 -0
  1641. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_fp16_sm80.cu +0 -0
  1642. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_hdim96_fp16_sm90.cu +0 -0
  1643. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_kernel.h +0 -0
  1644. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_launch_template.h +0 -0
  1645. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_bwd_preprocess_kernel.h +0 -0
  1646. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_bf16_causal_sm100.cu +0 -0
  1647. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_bf16_causal_sm110.cu +0 -0
  1648. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_bf16_causal_sm120.cu +0 -0
  1649. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_bf16_causal_sm80.cu +0 -0
  1650. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_bf16_causal_sm90.cu +0 -0
  1651. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_bf16_sm100.cu +0 -0
  1652. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_bf16_sm110.cu +0 -0
  1653. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_bf16_sm120.cu +0 -0
  1654. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_bf16_sm80.cu +0 -0
  1655. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_bf16_sm90.cu +0 -0
  1656. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_fp16_causal_sm100.cu +0 -0
  1657. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_fp16_causal_sm110.cu +0 -0
  1658. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_fp16_causal_sm120.cu +0 -0
  1659. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_fp16_causal_sm80.cu +0 -0
  1660. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_fp16_causal_sm90.cu +0 -0
  1661. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_fp16_sm100.cu +0 -0
  1662. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_fp16_sm110.cu +0 -0
  1663. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_fp16_sm120.cu +0 -0
  1664. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_fp16_sm80.cu +0 -0
  1665. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim128_fp16_sm90.cu +0 -0
  1666. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_bf16_causal_sm100.cu +0 -0
  1667. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_bf16_causal_sm110.cu +0 -0
  1668. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_bf16_causal_sm120.cu +0 -0
  1669. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_bf16_causal_sm80.cu +0 -0
  1670. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_bf16_causal_sm90.cu +0 -0
  1671. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_bf16_sm100.cu +0 -0
  1672. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_bf16_sm110.cu +0 -0
  1673. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_bf16_sm120.cu +0 -0
  1674. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_bf16_sm80.cu +0 -0
  1675. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_bf16_sm90.cu +0 -0
  1676. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_fp16_causal_sm100.cu +0 -0
  1677. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_fp16_causal_sm110.cu +0 -0
  1678. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_fp16_causal_sm120.cu +0 -0
  1679. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_fp16_causal_sm80.cu +0 -0
  1680. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_fp16_causal_sm90.cu +0 -0
  1681. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_fp16_sm100.cu +0 -0
  1682. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_fp16_sm110.cu +0 -0
  1683. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_fp16_sm120.cu +0 -0
  1684. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_fp16_sm80.cu +0 -0
  1685. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim192_fp16_sm90.cu +0 -0
  1686. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_bf16_causal_sm100.cu +0 -0
  1687. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_bf16_causal_sm110.cu +0 -0
  1688. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_bf16_causal_sm120.cu +0 -0
  1689. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_bf16_causal_sm80.cu +0 -0
  1690. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_bf16_causal_sm90.cu +0 -0
  1691. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_bf16_sm100.cu +0 -0
  1692. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_bf16_sm110.cu +0 -0
  1693. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_bf16_sm120.cu +0 -0
  1694. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_bf16_sm80.cu +0 -0
  1695. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_bf16_sm90.cu +0 -0
  1696. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_fp16_causal_sm100.cu +0 -0
  1697. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_fp16_causal_sm110.cu +0 -0
  1698. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_fp16_causal_sm120.cu +0 -0
  1699. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_fp16_causal_sm80.cu +0 -0
  1700. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_fp16_causal_sm90.cu +0 -0
  1701. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_fp16_sm100.cu +0 -0
  1702. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_fp16_sm110.cu +0 -0
  1703. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_fp16_sm120.cu +0 -0
  1704. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_fp16_sm80.cu +0 -0
  1705. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim256_fp16_sm90.cu +0 -0
  1706. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_bf16_causal_sm100.cu +0 -0
  1707. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_bf16_causal_sm110.cu +0 -0
  1708. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_bf16_causal_sm120.cu +0 -0
  1709. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_bf16_causal_sm80.cu +0 -0
  1710. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_bf16_causal_sm90.cu +0 -0
  1711. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_bf16_sm100.cu +0 -0
  1712. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_bf16_sm110.cu +0 -0
  1713. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_bf16_sm120.cu +0 -0
  1714. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_bf16_sm80.cu +0 -0
  1715. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_bf16_sm90.cu +0 -0
  1716. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_fp16_causal_sm100.cu +0 -0
  1717. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_fp16_causal_sm110.cu +0 -0
  1718. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_fp16_causal_sm120.cu +0 -0
  1719. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_fp16_causal_sm80.cu +0 -0
  1720. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_fp16_causal_sm90.cu +0 -0
  1721. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_fp16_sm100.cu +0 -0
  1722. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_fp16_sm110.cu +0 -0
  1723. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_fp16_sm120.cu +0 -0
  1724. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_fp16_sm80.cu +0 -0
  1725. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim32_fp16_sm90.cu +0 -0
  1726. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_bf16_causal_sm100.cu +0 -0
  1727. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_bf16_causal_sm110.cu +0 -0
  1728. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_bf16_causal_sm120.cu +0 -0
  1729. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_bf16_causal_sm80.cu +0 -0
  1730. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_bf16_causal_sm90.cu +0 -0
  1731. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_bf16_sm100.cu +0 -0
  1732. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_bf16_sm110.cu +0 -0
  1733. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_bf16_sm120.cu +0 -0
  1734. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_bf16_sm80.cu +0 -0
  1735. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_bf16_sm90.cu +0 -0
  1736. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_fp16_causal_sm100.cu +0 -0
  1737. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_fp16_causal_sm110.cu +0 -0
  1738. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_fp16_causal_sm120.cu +0 -0
  1739. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_fp16_causal_sm80.cu +0 -0
  1740. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_fp16_causal_sm90.cu +0 -0
  1741. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_fp16_sm100.cu +0 -0
  1742. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_fp16_sm110.cu +0 -0
  1743. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_fp16_sm120.cu +0 -0
  1744. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_fp16_sm80.cu +0 -0
  1745. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim64_fp16_sm90.cu +0 -0
  1746. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_bf16_causal_sm100.cu +0 -0
  1747. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_bf16_causal_sm110.cu +0 -0
  1748. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_bf16_causal_sm120.cu +0 -0
  1749. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_bf16_causal_sm80.cu +0 -0
  1750. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_bf16_causal_sm90.cu +0 -0
  1751. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_bf16_sm100.cu +0 -0
  1752. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_bf16_sm110.cu +0 -0
  1753. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_bf16_sm120.cu +0 -0
  1754. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_bf16_sm80.cu +0 -0
  1755. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_bf16_sm90.cu +0 -0
  1756. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_fp16_causal_sm100.cu +0 -0
  1757. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_fp16_causal_sm110.cu +0 -0
  1758. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_fp16_causal_sm120.cu +0 -0
  1759. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_fp16_causal_sm80.cu +0 -0
  1760. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_fp16_causal_sm90.cu +0 -0
  1761. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_fp16_sm100.cu +0 -0
  1762. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_fp16_sm110.cu +0 -0
  1763. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_fp16_sm120.cu +0 -0
  1764. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_fp16_sm80.cu +0 -0
  1765. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_hdim96_fp16_sm90.cu +0 -0
  1766. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_kernel.h +0 -0
  1767. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_launch_template.h +0 -0
  1768. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_bf16_causal_sm100.cu +0 -0
  1769. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_bf16_causal_sm110.cu +0 -0
  1770. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_bf16_causal_sm120.cu +0 -0
  1771. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_bf16_causal_sm80.cu +0 -0
  1772. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_bf16_causal_sm90.cu +0 -0
  1773. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_bf16_sm100.cu +0 -0
  1774. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_bf16_sm110.cu +0 -0
  1775. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_bf16_sm120.cu +0 -0
  1776. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_bf16_sm80.cu +0 -0
  1777. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_bf16_sm90.cu +0 -0
  1778. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_fp16_causal_sm100.cu +0 -0
  1779. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_fp16_causal_sm110.cu +0 -0
  1780. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_fp16_causal_sm120.cu +0 -0
  1781. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_fp16_causal_sm80.cu +0 -0
  1782. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_fp16_causal_sm90.cu +0 -0
  1783. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_fp16_sm100.cu +0 -0
  1784. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_fp16_sm110.cu +0 -0
  1785. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_fp16_sm120.cu +0 -0
  1786. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_fp16_sm80.cu +0 -0
  1787. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim128_fp16_sm90.cu +0 -0
  1788. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_bf16_causal_sm100.cu +0 -0
  1789. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_bf16_causal_sm110.cu +0 -0
  1790. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_bf16_causal_sm120.cu +0 -0
  1791. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_bf16_causal_sm80.cu +0 -0
  1792. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_bf16_causal_sm90.cu +0 -0
  1793. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_bf16_sm100.cu +0 -0
  1794. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_bf16_sm110.cu +0 -0
  1795. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_bf16_sm120.cu +0 -0
  1796. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_bf16_sm80.cu +0 -0
  1797. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_bf16_sm90.cu +0 -0
  1798. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_fp16_causal_sm100.cu +0 -0
  1799. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_fp16_causal_sm110.cu +0 -0
  1800. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_fp16_causal_sm120.cu +0 -0
  1801. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_fp16_causal_sm80.cu +0 -0
  1802. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_fp16_causal_sm90.cu +0 -0
  1803. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_fp16_sm100.cu +0 -0
  1804. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_fp16_sm110.cu +0 -0
  1805. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_fp16_sm120.cu +0 -0
  1806. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_fp16_sm80.cu +0 -0
  1807. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim192_fp16_sm90.cu +0 -0
  1808. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_bf16_causal_sm100.cu +0 -0
  1809. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_bf16_causal_sm110.cu +0 -0
  1810. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_bf16_causal_sm120.cu +0 -0
  1811. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_bf16_causal_sm80.cu +0 -0
  1812. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_bf16_causal_sm90.cu +0 -0
  1813. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_bf16_sm100.cu +0 -0
  1814. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_bf16_sm110.cu +0 -0
  1815. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_bf16_sm120.cu +0 -0
  1816. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_bf16_sm80.cu +0 -0
  1817. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_bf16_sm90.cu +0 -0
  1818. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_fp16_causal_sm100.cu +0 -0
  1819. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_fp16_causal_sm110.cu +0 -0
  1820. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_fp16_causal_sm120.cu +0 -0
  1821. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_fp16_causal_sm80.cu +0 -0
  1822. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_fp16_causal_sm90.cu +0 -0
  1823. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_fp16_sm100.cu +0 -0
  1824. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_fp16_sm110.cu +0 -0
  1825. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_fp16_sm120.cu +0 -0
  1826. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_fp16_sm80.cu +0 -0
  1827. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim256_fp16_sm90.cu +0 -0
  1828. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_bf16_causal_sm100.cu +0 -0
  1829. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_bf16_causal_sm110.cu +0 -0
  1830. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_bf16_causal_sm120.cu +0 -0
  1831. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_bf16_causal_sm80.cu +0 -0
  1832. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_bf16_causal_sm90.cu +0 -0
  1833. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_bf16_sm100.cu +0 -0
  1834. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_bf16_sm110.cu +0 -0
  1835. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_bf16_sm120.cu +0 -0
  1836. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_bf16_sm80.cu +0 -0
  1837. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_bf16_sm90.cu +0 -0
  1838. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_fp16_causal_sm100.cu +0 -0
  1839. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_fp16_causal_sm110.cu +0 -0
  1840. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_fp16_causal_sm120.cu +0 -0
  1841. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_fp16_causal_sm80.cu +0 -0
  1842. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_fp16_causal_sm90.cu +0 -0
  1843. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_fp16_sm100.cu +0 -0
  1844. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_fp16_sm110.cu +0 -0
  1845. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_fp16_sm120.cu +0 -0
  1846. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_fp16_sm80.cu +0 -0
  1847. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim32_fp16_sm90.cu +0 -0
  1848. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_bf16_causal_sm100.cu +0 -0
  1849. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_bf16_causal_sm110.cu +0 -0
  1850. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_bf16_causal_sm120.cu +0 -0
  1851. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_bf16_causal_sm80.cu +0 -0
  1852. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_bf16_causal_sm90.cu +0 -0
  1853. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_bf16_sm100.cu +0 -0
  1854. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_bf16_sm110.cu +0 -0
  1855. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_bf16_sm120.cu +0 -0
  1856. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_bf16_sm80.cu +0 -0
  1857. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_bf16_sm90.cu +0 -0
  1858. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_fp16_causal_sm100.cu +0 -0
  1859. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_fp16_causal_sm110.cu +0 -0
  1860. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_fp16_causal_sm120.cu +0 -0
  1861. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_fp16_causal_sm80.cu +0 -0
  1862. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_fp16_causal_sm90.cu +0 -0
  1863. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_fp16_sm100.cu +0 -0
  1864. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_fp16_sm110.cu +0 -0
  1865. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_fp16_sm120.cu +0 -0
  1866. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_fp16_sm80.cu +0 -0
  1867. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim64_fp16_sm90.cu +0 -0
  1868. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_bf16_causal_sm100.cu +0 -0
  1869. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_bf16_causal_sm110.cu +0 -0
  1870. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_bf16_causal_sm120.cu +0 -0
  1871. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_bf16_causal_sm80.cu +0 -0
  1872. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_bf16_causal_sm90.cu +0 -0
  1873. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_bf16_sm100.cu +0 -0
  1874. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_bf16_sm110.cu +0 -0
  1875. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_bf16_sm120.cu +0 -0
  1876. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_bf16_sm80.cu +0 -0
  1877. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_bf16_sm90.cu +0 -0
  1878. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_fp16_causal_sm100.cu +0 -0
  1879. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_fp16_causal_sm110.cu +0 -0
  1880. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_fp16_causal_sm120.cu +0 -0
  1881. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_fp16_causal_sm80.cu +0 -0
  1882. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_fp16_causal_sm90.cu +0 -0
  1883. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_fp16_sm100.cu +0 -0
  1884. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_fp16_sm110.cu +0 -0
  1885. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_fp16_sm120.cu +0 -0
  1886. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_fp16_sm80.cu +0 -0
  1887. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/flash_fwd_split_hdim96_fp16_sm90.cu +0 -0
  1888. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/hardware_info.h +0 -0
  1889. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/kernel_traits.h +0 -0
  1890. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/mask.h +0 -0
  1891. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/namespace_config.h +0 -0
  1892. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/philox.cuh +0 -0
  1893. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/philox_unpack.cuh +0 -0
  1894. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/rotary.h +0 -0
  1895. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/softmax.h +0 -0
  1896. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/static_switch.h +0 -0
  1897. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/flash_attention/src/utils.h +0 -0
  1898. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/CMakeLists.txt +0 -0
  1899. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/code_gen.py +0 -0
  1900. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_cuda.cu +0 -0
  1901. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_cuda_impl.h +0 -0
  1902. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits2_bf16.cu +0 -0
  1903. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits2_f16.cu +0 -0
  1904. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits2_f32.cu +0 -0
  1905. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits3_bf16.cu +0 -0
  1906. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits3_f16.cu +0 -0
  1907. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits3_f32.cu +0 -0
  1908. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits4_bf16.cu +0 -0
  1909. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits4_f16.cu +0 -0
  1910. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits4_f32.cu +0 -0
  1911. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits5_bf16.cu +0 -0
  1912. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits5_f16.cu +0 -0
  1913. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits5_f32.cu +0 -0
  1914. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits6_bf16.cu +0 -0
  1915. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits6_f16.cu +0 -0
  1916. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits6_f32.cu +0 -0
  1917. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits7_bf16.cu +0 -0
  1918. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits7_f16.cu +0 -0
  1919. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits7_f32.cu +0 -0
  1920. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits8_bf16.cu +0 -0
  1921. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits8_f16.cu +0 -0
  1922. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_affine_bits8_f32.cu +0 -0
  1923. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_dispatch.h +0 -0
  1924. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_kernels.h +0 -0
  1925. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_mxfp4.cu +0 -0
  1926. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_mxfp8.cu +0 -0
  1927. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_nf4_bf16.cu +0 -0
  1928. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_nf4_f16.cu +0 -0
  1929. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_nf4_f32.cu +0 -0
  1930. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_nvfp4.cu +0 -0
  1931. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/quantized_matmul/src/qmm_dequant_nvfp8.cu +0 -0
  1932. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/CMakeLists.txt +0 -0
  1933. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/code_gen.py +0 -0
  1934. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3.h +0 -0
  1935. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_ffi.cu +0 -0
  1936. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_bf16_sm100.cu +0 -0
  1937. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_bf16_sm110.cu +0 -0
  1938. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_bf16_sm120.cu +0 -0
  1939. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_bf16_sm80.cu +0 -0
  1940. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_bf16_sm90.cu +0 -0
  1941. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_fp16_sm100.cu +0 -0
  1942. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_fp16_sm110.cu +0 -0
  1943. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_fp16_sm120.cu +0 -0
  1944. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_fp16_sm80.cu +0 -0
  1945. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_fp16_sm90.cu +0 -0
  1946. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_fp32_sm100.cu +0 -0
  1947. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_fp32_sm110.cu +0 -0
  1948. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_fp32_sm120.cu +0 -0
  1949. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_fp32_sm80.cu +0 -0
  1950. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim128_fp32_sm90.cu +0 -0
  1951. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_bf16_sm100.cu +0 -0
  1952. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_bf16_sm110.cu +0 -0
  1953. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_bf16_sm120.cu +0 -0
  1954. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_bf16_sm80.cu +0 -0
  1955. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_bf16_sm90.cu +0 -0
  1956. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_fp16_sm100.cu +0 -0
  1957. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_fp16_sm110.cu +0 -0
  1958. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_fp16_sm120.cu +0 -0
  1959. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_fp16_sm80.cu +0 -0
  1960. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_fp16_sm90.cu +0 -0
  1961. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_fp32_sm100.cu +0 -0
  1962. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_fp32_sm110.cu +0 -0
  1963. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_fp32_sm120.cu +0 -0
  1964. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_fp32_sm80.cu +0 -0
  1965. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim192_fp32_sm90.cu +0 -0
  1966. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_bf16_sm100.cu +0 -0
  1967. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_bf16_sm110.cu +0 -0
  1968. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_bf16_sm120.cu +0 -0
  1969. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_bf16_sm80.cu +0 -0
  1970. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_bf16_sm90.cu +0 -0
  1971. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_fp16_sm100.cu +0 -0
  1972. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_fp16_sm110.cu +0 -0
  1973. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_fp16_sm120.cu +0 -0
  1974. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_fp16_sm80.cu +0 -0
  1975. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_fp16_sm90.cu +0 -0
  1976. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_fp32_sm100.cu +0 -0
  1977. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_fp32_sm110.cu +0 -0
  1978. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_fp32_sm120.cu +0 -0
  1979. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_fp32_sm80.cu +0 -0
  1980. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim256_fp32_sm90.cu +0 -0
  1981. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_bf16_sm100.cu +0 -0
  1982. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_bf16_sm110.cu +0 -0
  1983. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_bf16_sm120.cu +0 -0
  1984. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_bf16_sm80.cu +0 -0
  1985. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_bf16_sm90.cu +0 -0
  1986. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_fp16_sm100.cu +0 -0
  1987. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_fp16_sm110.cu +0 -0
  1988. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_fp16_sm120.cu +0 -0
  1989. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_fp16_sm80.cu +0 -0
  1990. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_fp16_sm90.cu +0 -0
  1991. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_fp32_sm100.cu +0 -0
  1992. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_fp32_sm110.cu +0 -0
  1993. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_fp32_sm120.cu +0 -0
  1994. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_fp32_sm80.cu +0 -0
  1995. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim32_fp32_sm90.cu +0 -0
  1996. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_bf16_sm100.cu +0 -0
  1997. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_bf16_sm110.cu +0 -0
  1998. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_bf16_sm120.cu +0 -0
  1999. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_bf16_sm80.cu +0 -0
  2000. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_bf16_sm90.cu +0 -0
  2001. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_fp16_sm100.cu +0 -0
  2002. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_fp16_sm110.cu +0 -0
  2003. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_fp16_sm120.cu +0 -0
  2004. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_fp16_sm80.cu +0 -0
  2005. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_fp16_sm90.cu +0 -0
  2006. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_fp32_sm100.cu +0 -0
  2007. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_fp32_sm110.cu +0 -0
  2008. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_fp32_sm120.cu +0 -0
  2009. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_fp32_sm80.cu +0 -0
  2010. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim64_fp32_sm90.cu +0 -0
  2011. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_bf16_sm100.cu +0 -0
  2012. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_bf16_sm110.cu +0 -0
  2013. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_bf16_sm120.cu +0 -0
  2014. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_bf16_sm80.cu +0 -0
  2015. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_bf16_sm90.cu +0 -0
  2016. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_fp16_sm100.cu +0 -0
  2017. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_fp16_sm110.cu +0 -0
  2018. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_fp16_sm120.cu +0 -0
  2019. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_fp16_sm80.cu +0 -0
  2020. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_fp16_sm90.cu +0 -0
  2021. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_fp32_sm100.cu +0 -0
  2022. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_fp32_sm110.cu +0 -0
  2023. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_fp32_sm120.cu +0 -0
  2024. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_fp32_sm80.cu +0 -0
  2025. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_fwd_hdim96_fp32_sm90.cu +0 -0
  2026. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_kernel.h +0 -0
  2027. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/ragged_page_attention_v3/src/rpa_v3_launch_template.h +0 -0
  2028. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/CMakeLists.txt +0 -0
  2029. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/code_gen.py +0 -0
  2030. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua.h +0 -0
  2031. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_cuda.cu +0 -0
  2032. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim128_bf16_sm100.cu +0 -0
  2033. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim128_bf16_sm110.cu +0 -0
  2034. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim128_bf16_sm120.cu +0 -0
  2035. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim128_bf16_sm80.cu +0 -0
  2036. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim128_bf16_sm90.cu +0 -0
  2037. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim128_fp16_sm100.cu +0 -0
  2038. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim128_fp16_sm110.cu +0 -0
  2039. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim128_fp16_sm120.cu +0 -0
  2040. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim128_fp16_sm80.cu +0 -0
  2041. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim128_fp16_sm90.cu +0 -0
  2042. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim192_bf16_sm100.cu +0 -0
  2043. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim192_bf16_sm110.cu +0 -0
  2044. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim192_bf16_sm120.cu +0 -0
  2045. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim192_bf16_sm80.cu +0 -0
  2046. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim192_bf16_sm90.cu +0 -0
  2047. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim192_fp16_sm100.cu +0 -0
  2048. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim192_fp16_sm110.cu +0 -0
  2049. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim192_fp16_sm120.cu +0 -0
  2050. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim192_fp16_sm80.cu +0 -0
  2051. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim192_fp16_sm90.cu +0 -0
  2052. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim256_bf16_sm100.cu +0 -0
  2053. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim256_bf16_sm110.cu +0 -0
  2054. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim256_bf16_sm120.cu +0 -0
  2055. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim256_bf16_sm80.cu +0 -0
  2056. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim256_bf16_sm90.cu +0 -0
  2057. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim256_fp16_sm100.cu +0 -0
  2058. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim256_fp16_sm110.cu +0 -0
  2059. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim256_fp16_sm120.cu +0 -0
  2060. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim256_fp16_sm80.cu +0 -0
  2061. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim256_fp16_sm90.cu +0 -0
  2062. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim32_bf16_sm100.cu +0 -0
  2063. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim32_bf16_sm110.cu +0 -0
  2064. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim32_bf16_sm120.cu +0 -0
  2065. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim32_bf16_sm80.cu +0 -0
  2066. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim32_bf16_sm90.cu +0 -0
  2067. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim32_fp16_sm100.cu +0 -0
  2068. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim32_fp16_sm110.cu +0 -0
  2069. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim32_fp16_sm120.cu +0 -0
  2070. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim32_fp16_sm80.cu +0 -0
  2071. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim32_fp16_sm90.cu +0 -0
  2072. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim64_bf16_sm100.cu +0 -0
  2073. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim64_bf16_sm110.cu +0 -0
  2074. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim64_bf16_sm120.cu +0 -0
  2075. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim64_bf16_sm80.cu +0 -0
  2076. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim64_bf16_sm90.cu +0 -0
  2077. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim64_fp16_sm100.cu +0 -0
  2078. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim64_fp16_sm110.cu +0 -0
  2079. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim64_fp16_sm120.cu +0 -0
  2080. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim64_fp16_sm80.cu +0 -0
  2081. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim64_fp16_sm90.cu +0 -0
  2082. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim96_bf16_sm100.cu +0 -0
  2083. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim96_bf16_sm110.cu +0 -0
  2084. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim96_bf16_sm120.cu +0 -0
  2085. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim96_bf16_sm80.cu +0 -0
  2086. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim96_bf16_sm90.cu +0 -0
  2087. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim96_fp16_sm100.cu +0 -0
  2088. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim96_fp16_sm110.cu +0 -0
  2089. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim96_fp16_sm120.cu +0 -0
  2090. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim96_fp16_sm80.cu +0 -0
  2091. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_fwd_hdim96_fp16_sm90.cu +0 -0
  2092. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_kernel.h +0 -0
  2093. {ejkernel-0.0.76 → ejkernel-0.0.78}/csrc/unified_attention/src/ua_launch_template.h +0 -0
  2094. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/benchmarks.py +0 -0
  2095. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/build_cudalib.py +0 -0
  2096. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/callib/__init__.py +0 -0
  2097. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/callib/_cute_call.py +0 -0
  2098. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/callib/_cute_ffi.py +0 -0
  2099. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/callib/_ejit.py +0 -0
  2100. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/callib/_pallas_call.py +0 -0
  2101. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/callib/_triton_call.py +0 -0
  2102. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/callib/_utils.py +0 -0
  2103. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/errors.py +0 -0
  2104. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/__init__.py +0 -0
  2105. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/__init__.py +0 -0
  2106. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/blocksparse_attention/__init__.py +0 -0
  2107. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/blocksparse_attention/_build.py +0 -0
  2108. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/blocksparse_attention/_cuda_impl.py +0 -0
  2109. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/blocksparse_attention/_interface.py +0 -0
  2110. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/flash_attention/__init__.py +0 -0
  2111. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/flash_attention/_build.py +0 -0
  2112. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/flash_attention/_cuda_impl.py +0 -0
  2113. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/flash_attention/_interface.py +0 -0
  2114. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/quantized_matmul/__init__.py +0 -0
  2115. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/quantized_matmul/_build.py +0 -0
  2116. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/quantized_matmul/_cuda_impl.py +0 -0
  2117. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/quantized_matmul/_cuda_impl_bwd.py +0 -0
  2118. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/quantized_matmul/_cuda_impl_fwd.py +0 -0
  2119. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/quantized_matmul/_interface.py +0 -0
  2120. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/ragged_page_attention_v3/__init__.py +0 -0
  2121. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/ragged_page_attention_v3/_build.py +0 -0
  2122. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/ragged_page_attention_v3/_cuda_impl.py +0 -0
  2123. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/ragged_page_attention_v3/_interface.py +0 -0
  2124. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/unified_attention/__init__.py +0 -0
  2125. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/unified_attention/_build.py +0 -0
  2126. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/unified_attention/_cuda_impl.py +0 -0
  2127. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cuda/unified_attention/_interface.py +0 -0
  2128. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/__init__.py +0 -0
  2129. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/chunked_prefill_paged_decode/__init__.py +0 -0
  2130. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/chunked_prefill_paged_decode/_cute_impl_fwd.py +0 -0
  2131. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/chunked_prefill_paged_decode/_interface.py +0 -0
  2132. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/flash_attention/__init__.py +0 -0
  2133. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/flash_attention/_cute_impl.py +0 -0
  2134. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/flash_attention/_interface.py +0 -0
  2135. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/quantized_matmul/__init__.py +0 -0
  2136. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/quantized_matmul/_cute_impl.py +0 -0
  2137. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/quantized_matmul/_cute_impl_bwd.py +0 -0
  2138. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/quantized_matmul/_cute_impl_fwd.py +0 -0
  2139. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/quantized_matmul/_interface.py +0 -0
  2140. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/ragged_page_attention_v3/__init__.py +0 -0
  2141. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/ragged_page_attention_v3/_cute_impl_fwd.py +0 -0
  2142. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/ragged_page_attention_v3/_interface.py +0 -0
  2143. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/unified_attention/__init__.py +0 -0
  2144. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/unified_attention/_cute_impl.py +0 -0
  2145. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_cute/unified_attention/_interface.py +0 -0
  2146. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/__init__.py +0 -0
  2147. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/gpu/__init__.py +0 -0
  2148. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/gpu/ragged_decode_attention/__init__.py +0 -0
  2149. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/gpu/ragged_decode_attention/_interface.py +0 -0
  2150. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/gpu/ragged_decode_attention/_pallas_impl_fwd.py +0 -0
  2151. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/gpu/scaled_dot_product_attention/__init__.py +0 -0
  2152. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/gpu/scaled_dot_product_attention/_interface.py +0 -0
  2153. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/gpu/scaled_dot_product_attention/_pallas_impl_bwd.py +0 -0
  2154. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/gpu/scaled_dot_product_attention/_pallas_impl_fwd.py +0 -0
  2155. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/__init__.py +0 -0
  2156. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/all_gather_matmul/__init__.py +0 -0
  2157. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/all_gather_matmul/_interface.py +0 -0
  2158. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/all_gather_matmul/_pallas_impl.py +0 -0
  2159. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/blocksparse_attention/__init__.py +0 -0
  2160. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/blocksparse_attention/_info.py +0 -0
  2161. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/blocksparse_attention/_interface.py +0 -0
  2162. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/blocksparse_attention/_kernel.py +0 -0
  2163. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/blocksparse_attention/_masks.py +0 -0
  2164. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/deepseek_attn/__init__.py +0 -0
  2165. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/deepseek_attn/_interface.py +0 -0
  2166. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/deepseek_attn/_pallas_impl_bwd.py +0 -0
  2167. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/deepseek_attn/_pallas_impl_fwd.py +0 -0
  2168. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/flash_attention/__init__.py +0 -0
  2169. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/flash_attention/_interface.py +0 -0
  2170. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/flash_attention/_pallas_impl_bwd.py +0 -0
  2171. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/flash_attention/_pallas_impl_fwd.py +0 -0
  2172. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/flash_attention/_utils.py +0 -0
  2173. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/flash_mla/__init__.py +0 -0
  2174. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/flash_mla/_interface.py +0 -0
  2175. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/flash_mla/_pallas_impl_bwd.py +0 -0
  2176. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/flash_mla/_pallas_impl_fwd.py +0 -0
  2177. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/flash_mla/_utils.py +0 -0
  2178. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/gated_delta_rule/__init__.py +0 -0
  2179. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/gated_delta_rule/_interface.py +0 -0
  2180. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/gated_delta_rule/_pallas_impl_bwd.py +0 -0
  2181. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/grouped_matmul/__init__.py +0 -0
  2182. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/grouped_matmul/_interface.py +0 -0
  2183. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/grouped_matmul/_pallas_impl.py +0 -0
  2184. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/grouped_matmul/_utils.py +0 -0
  2185. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/grouped_matmulv2/__init__.py +0 -0
  2186. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/grouped_matmulv2/_interface.py +0 -0
  2187. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/grouped_matmulv2/_pallas_impl.py +0 -0
  2188. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/grouped_matmulv3/__init__.py +0 -0
  2189. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/grouped_matmulv3/_interface.py +0 -0
  2190. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/grouped_matmulv3/_pallas_impl.py +0 -0
  2191. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/multi_latent_ragged_page_attention/__init__.py +0 -0
  2192. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/multi_latent_ragged_page_attention/_interface.py +0 -0
  2193. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/multi_latent_ragged_page_attention/_pallas_impl_fwd.py +0 -0
  2194. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/multi_latent_ragged_page_attention_v2/__init__.py +0 -0
  2195. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/multi_latent_ragged_page_attention_v2/_interface.py +0 -0
  2196. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/multi_latent_ragged_page_attention_v2/_pallas_impl_fwd.py +0 -0
  2197. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/page_attention/__init__.py +0 -0
  2198. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/page_attention/_interface.py +0 -0
  2199. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/page_attention/_pallas_impl_fwd.py +0 -0
  2200. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/prefill_page_attention/__init__.py +0 -0
  2201. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/prefill_page_attention/_interface.py +0 -0
  2202. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/prefill_page_attention/_pallas_impl_fwd.py +0 -0
  2203. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/quantized_matmul/__init__.py +0 -0
  2204. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/quantized_matmul/_interface.py +0 -0
  2205. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/quantized_matmul/_pallas_impl_bwd.py +0 -0
  2206. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/quantized_matmul/_pallas_impl_core.py +0 -0
  2207. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/quantized_matmul/_pallas_impl_fwd.py +0 -0
  2208. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_decode_attention/__init__.py +0 -0
  2209. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_decode_attention/_interface.py +0 -0
  2210. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_decode_attention/_pallas_impl_fwd.py +0 -0
  2211. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_gated_delta_rule/__init__.py +0 -0
  2212. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_gated_delta_rule/_interface.py +0 -0
  2213. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_gated_delta_rule/_pallas_impl_fwd.py +0 -0
  2214. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_page_attention_v2/__init__.py +0 -0
  2215. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_page_attention_v2/_interface.py +0 -0
  2216. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_page_attention_v2/_pallas_impl_fwd.py +0 -0
  2217. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_page_attention_v2/_utils.py +0 -0
  2218. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_page_attention_v3/__init__.py +0 -0
  2219. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_page_attention_v3/_interface.py +0 -0
  2220. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_page_attention_v3/_pallas_impl_fwd.py +0 -0
  2221. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_page_attention_v3/_pallas_impl_fwd_h64.py +0 -0
  2222. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ragged_page_attention_v3/_utils.py +0 -0
  2223. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/reduce_scatter_matmul/__init__.py +0 -0
  2224. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/reduce_scatter_matmul/_interface.py +0 -0
  2225. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/reduce_scatter_matmul/_pallas_impl.py +0 -0
  2226. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ring_attention/__init__.py +0 -0
  2227. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ring_attention/_interface.py +0 -0
  2228. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ring_attention/_pallas_impl_bwd.py +0 -0
  2229. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_pallas/tpu/ring_attention/_pallas_impl_fwd.py +0 -0
  2230. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_registry.py +0 -0
  2231. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/__init__.py +0 -0
  2232. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/blocksparse_attention/__init__.py +0 -0
  2233. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/blocksparse_attention/_interface.py +0 -0
  2234. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/blocksparse_attention/_mask.py +0 -0
  2235. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/blocksparse_attention/_triton_impl_bwd.py +0 -0
  2236. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/blocksparse_attention/_triton_impl_fwd.py +0 -0
  2237. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/blocksparse_attention/_utilities.py +0 -0
  2238. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/chunked_prefill_paged_decode/__init__.py +0 -0
  2239. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/chunked_prefill_paged_decode/_interface.py +0 -0
  2240. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/chunked_prefill_paged_decode/_triton_impl_fwd.py +0 -0
  2241. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/decode_attention/__init__.py +0 -0
  2242. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/decode_attention/_interface.py +0 -0
  2243. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/decode_attention/_triton_impl_fwd.py +0 -0
  2244. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/flash_attention/__init__.py +0 -0
  2245. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/flash_attention/_interface.py +0 -0
  2246. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/flash_attention/_triton_impl_bwd.py +0 -0
  2247. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/flash_attention/_triton_impl_fwd.py +0 -0
  2248. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/flash_attention/_utilities.py +0 -0
  2249. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/flash_mla/__init__.py +0 -0
  2250. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/flash_mla/_interface.py +0 -0
  2251. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/flash_mla/_triton_impl_bwd.py +0 -0
  2252. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/flash_mla/_triton_impl_fwd.py +0 -0
  2253. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/flash_mla/_utilities.py +0 -0
  2254. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/gla/__init__.py +0 -0
  2255. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/gla/_interface.py +0 -0
  2256. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/gla/_triton_impl_bwd.py +0 -0
  2257. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/gla/_triton_impl_fwd.py +0 -0
  2258. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/lightning_attn/__init__.py +0 -0
  2259. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/lightning_attn/_interface.py +0 -0
  2260. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/lightning_attn/_triton_impl_bwd.py +0 -0
  2261. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/lightning_attn/_triton_impl_fwd.py +0 -0
  2262. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/mean_pooling/__init__.py +0 -0
  2263. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/mean_pooling/_interface.py +0 -0
  2264. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/mean_pooling/_triton_impl_bwd.py +0 -0
  2265. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/mean_pooling/_triton_impl_fwd.py +0 -0
  2266. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/native_sparse_attention/__init__.py +0 -0
  2267. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/native_sparse_attention/_compression.py +0 -0
  2268. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/native_sparse_attention/_interface.py +0 -0
  2269. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/native_sparse_attention/_triton_impl_bwd.py +0 -0
  2270. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/native_sparse_attention/_triton_impl_fwd.py +0 -0
  2271. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/native_sparse_attention/_utilities.py +0 -0
  2272. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/page_attention/__init__.py +0 -0
  2273. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/page_attention/_interface.py +0 -0
  2274. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/page_attention/_triton_impl_fwd.py +0 -0
  2275. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/quantized_matmul/__init__.py +0 -0
  2276. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/quantized_matmul/_interface.py +0 -0
  2277. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/quantized_matmul/_triton_impl.py +0 -0
  2278. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/quantized_matmul/_triton_impl_bwd.py +0 -0
  2279. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/quantized_matmul/_triton_impl_fwd.py +0 -0
  2280. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/quantized_matmul/_triton_impl_gemv.py +0 -0
  2281. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ragged_decode_attention/__init__.py +0 -0
  2282. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ragged_decode_attention/_interface.py +0 -0
  2283. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ragged_decode_attention/_triton_impl_fwd.py +0 -0
  2284. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ragged_page_attention_v2/__init__.py +0 -0
  2285. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ragged_page_attention_v2/_interface.py +0 -0
  2286. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ragged_page_attention_v2/_triton_impl_fwd.py +0 -0
  2287. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ragged_page_attention_v3/__init__.py +0 -0
  2288. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ragged_page_attention_v3/_interface.py +0 -0
  2289. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ragged_page_attention_v3/_triton_impl_fwd.py +0 -0
  2290. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/recurrent/__init__.py +0 -0
  2291. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/recurrent/_interface.py +0 -0
  2292. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/recurrent/_triton_impl_bwd.py +0 -0
  2293. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/recurrent/_triton_impl_fwd.py +0 -0
  2294. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ring_attention/__init__.py +0 -0
  2295. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ring_attention/_interface.py +0 -0
  2296. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ring_attention/_triton_impl_bwd.py +0 -0
  2297. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/ring_attention/_triton_impl_fwd.py +0 -0
  2298. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/rwkv4/__init__.py +0 -0
  2299. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/rwkv4/_interface.py +0 -0
  2300. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/rwkv4/_triton_impl_bwd.py +0 -0
  2301. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/rwkv4/_triton_impl_fwd.py +0 -0
  2302. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/rwkv6/__init__.py +0 -0
  2303. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/rwkv6/_interface.py +0 -0
  2304. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/rwkv6/_triton_impl_fwd.py +0 -0
  2305. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/rwkv7/__init__.py +0 -0
  2306. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/rwkv7/_interface.py +0 -0
  2307. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/rwkv7/_triton_impl_fwd.py +0 -0
  2308. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/unified_attention/__init__.py +0 -0
  2309. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/unified_attention/_interface.py +0 -0
  2310. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_triton/unified_attention/_triton_impl_fwd.py +0 -0
  2311. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/__init__.py +0 -0
  2312. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/all_gather_matmul/__init__.py +0 -0
  2313. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/all_gather_matmul/_interface.py +0 -0
  2314. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/all_gather_matmul/_xla_impl_bwd.py +0 -0
  2315. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/all_gather_matmul/_xla_impl_fwd.py +0 -0
  2316. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/attention/__init__.py +0 -0
  2317. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/attention/_interface.py +0 -0
  2318. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/attention/_xla_impl_bwd.py +0 -0
  2319. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/attention/_xla_impl_fwd.py +0 -0
  2320. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/blocksparse_attention/__init__.py +0 -0
  2321. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/blocksparse_attention/_interface.py +0 -0
  2322. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/blocksparse_attention/_xla_impl_bwd.py +0 -0
  2323. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/blocksparse_attention/_xla_impl_fwd.py +0 -0
  2324. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/chunked_prefill_paged_decode/__init__.py +0 -0
  2325. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/chunked_prefill_paged_decode/_interface.py +0 -0
  2326. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/chunked_prefill_paged_decode/_xla_impl_fwd.py +0 -0
  2327. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/decode_attention/__init__.py +0 -0
  2328. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/decode_attention/_interface.py +0 -0
  2329. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/decode_attention/_xla_impl_fwd.py +0 -0
  2330. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/deepseek_attn/__init__.py +0 -0
  2331. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/deepseek_attn/_interface.py +0 -0
  2332. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/deepseek_attn/_xla_impl_bwd.py +0 -0
  2333. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/deepseek_attn/_xla_impl_fwd.py +0 -0
  2334. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/flash_attention/__init__.py +0 -0
  2335. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/flash_attention/_interface.py +0 -0
  2336. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/flash_attention/_xla_impl_bwd.py +0 -0
  2337. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/flash_attention/_xla_impl_fwd.py +0 -0
  2338. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/flash_mla/__init__.py +0 -0
  2339. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/flash_mla/_interface.py +0 -0
  2340. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/flash_mla/_xla_impl_bwd.py +0 -0
  2341. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/flash_mla/_xla_impl_fwd.py +0 -0
  2342. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/gated_delta_rule/__init__.py +0 -0
  2343. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/gated_delta_rule/_interface.py +0 -0
  2344. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/gated_delta_rule/_xla_impl_bwd.py +0 -0
  2345. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/gla/__init__.py +0 -0
  2346. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/gla/_interface.py +0 -0
  2347. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/gla/_xla_impl_bwd.py +0 -0
  2348. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/gla/_xla_impl_fwd.py +0 -0
  2349. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/grouped_matmul/__init__.py +0 -0
  2350. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/grouped_matmul/_interface.py +0 -0
  2351. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/grouped_matmul/_xla_impl_bwd.py +0 -0
  2352. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/grouped_matmul/_xla_impl_fwd.py +0 -0
  2353. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/grouped_matmulv3/__init__.py +0 -0
  2354. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/grouped_matmulv3/_interface.py +0 -0
  2355. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/kernel_delta_attention/__init__.py +0 -0
  2356. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/kernel_delta_attention/_interface.py +0 -0
  2357. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/kernel_delta_attention/_xla_impl_fwd.py +0 -0
  2358. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/lightning_attn/__init__.py +0 -0
  2359. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/lightning_attn/_interface.py +0 -0
  2360. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/lightning_attn/_xla_impl_bwd.py +0 -0
  2361. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/lightning_attn/_xla_impl_fwd.py +0 -0
  2362. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/mean_pooling/__init__.py +0 -0
  2363. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/mean_pooling/_interface.py +0 -0
  2364. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/mean_pooling/_xla_impl_bwd.py +0 -0
  2365. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/mean_pooling/_xla_impl_fwd.py +0 -0
  2366. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/multi_latent_ragged_page_attention/__init__.py +0 -0
  2367. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/multi_latent_ragged_page_attention/_interface.py +0 -0
  2368. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/multi_latent_ragged_page_attention/_xla_impl_fwd.py +0 -0
  2369. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/multi_latent_ragged_page_attention_v2/__init__.py +0 -0
  2370. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/multi_latent_ragged_page_attention_v2/_interface.py +0 -0
  2371. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/multi_latent_ragged_page_attention_v2/_xla_impl_fwd.py +0 -0
  2372. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/native_sparse_attention/__init__.py +0 -0
  2373. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/native_sparse_attention/_interface.py +0 -0
  2374. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/native_sparse_attention/_xla_impl_bwd.py +0 -0
  2375. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/native_sparse_attention/_xla_impl_fwd.py +0 -0
  2376. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/page_attention/__init__.py +0 -0
  2377. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/page_attention/_interface.py +0 -0
  2378. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/page_attention/_xla_impl_fwd.py +0 -0
  2379. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/prefill_page_attention/__init__.py +0 -0
  2380. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/prefill_page_attention/_impl.py +0 -0
  2381. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/prefill_page_attention/_interface.py +0 -0
  2382. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/quantized_matmul/__init__.py +0 -0
  2383. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/quantized_matmul/_interface.py +0 -0
  2384. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/quantized_matmul/_xla_impl_bwd.py +0 -0
  2385. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/quantized_matmul/_xla_impl_fwd.py +0 -0
  2386. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_decode_attention/__init__.py +0 -0
  2387. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_decode_attention/_interface.py +0 -0
  2388. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_decode_attention/_xla_impl_fwd.py +0 -0
  2389. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_gated_delta_rule/__init__.py +0 -0
  2390. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_gated_delta_rule/_interface.py +0 -0
  2391. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_gated_delta_rule/_xla_impl_fwd.py +0 -0
  2392. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v2/__init__.py +0 -0
  2393. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v2/_interface.py +0 -0
  2394. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v2/_xla_impl_fwd.py +0 -0
  2395. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v2_turboquant/__init__.py +0 -0
  2396. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v2_turboquant/_interface.py +0 -0
  2397. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v2_turboquant/_xla_impl_fwd.py +0 -0
  2398. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v3/__init__.py +0 -0
  2399. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v3/_interface.py +0 -0
  2400. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v3/_xla_impl_bwd.py +0 -0
  2401. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v3/_xla_impl_fwd.py +0 -0
  2402. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v3_turboquant/__init__.py +0 -0
  2403. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v3_turboquant/_interface.py +0 -0
  2404. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ragged_page_attention_v3_turboquant/_xla_impl_fwd.py +0 -0
  2405. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/recurrent/__init__.py +0 -0
  2406. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/recurrent/_interface.py +0 -0
  2407. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/recurrent/_xla_impl_bwd.py +0 -0
  2408. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/recurrent/_xla_impl_fwd.py +0 -0
  2409. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/reduce_scatter_matmul/__init__.py +0 -0
  2410. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/reduce_scatter_matmul/_interface.py +0 -0
  2411. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/reduce_scatter_matmul/_xla_impl_bwd.py +0 -0
  2412. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/reduce_scatter_matmul/_xla_impl_fwd.py +0 -0
  2413. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ring_attention/__init__.py +0 -0
  2414. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ring_attention/_interface.py +0 -0
  2415. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ring_attention/_utils.py +0 -0
  2416. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ring_attention/_xla_impl_bwd.py +0 -0
  2417. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/ring_attention/_xla_impl_fwd.py +0 -0
  2418. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv4/__init__.py +0 -0
  2419. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv4/_interface.py +0 -0
  2420. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv4/_xla_impl_bwd.py +0 -0
  2421. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv4/_xla_impl_fwd.py +0 -0
  2422. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv6/__init__.py +0 -0
  2423. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv6/_interface.py +0 -0
  2424. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv6/_xla_impl_bwd.py +0 -0
  2425. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv6/_xla_impl_fwd.py +0 -0
  2426. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv7/__init__.py +0 -0
  2427. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv7/_interface.py +0 -0
  2428. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv7/_xla_impl_bwd.py +0 -0
  2429. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/rwkv7/_xla_impl_fwd.py +0 -0
  2430. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/scaled_dot_product_attention/__init__.py +0 -0
  2431. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/scaled_dot_product_attention/_interface.py +0 -0
  2432. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/scaled_dot_product_attention/_xla_impl_bwd.py +0 -0
  2433. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/scaled_dot_product_attention/_xla_impl_fwd.py +0 -0
  2434. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/state_space_v1/__init__.py +0 -0
  2435. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/state_space_v1/_interface.py +0 -0
  2436. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/state_space_v1/_xla_impl_bwd.py +0 -0
  2437. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/state_space_v1/_xla_impl_fwd.py +0 -0
  2438. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/state_space_v2/__init__.py +0 -0
  2439. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/state_space_v2/_interface.py +0 -0
  2440. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/state_space_v2/_xla_impl_bwd.py +0 -0
  2441. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/state_space_v2/_xla_impl_fwd.py +0 -0
  2442. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/unified_attention/__init__.py +0 -0
  2443. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/unified_attention/_interface.py +0 -0
  2444. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/kernels/_xla/unified_attention/_xla_impl_fwd.py +0 -0
  2445. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/loggings.py +0 -0
  2446. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/__init__.py +0 -0
  2447. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/base.py +0 -0
  2448. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/__init__.py +0 -0
  2449. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/all_gather_matmul.py +0 -0
  2450. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/attention.py +0 -0
  2451. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/blocksparse_attention.py +0 -0
  2452. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/chunked_prefill_paged_decode.py +0 -0
  2453. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/configs.py +0 -0
  2454. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/decode_attention.py +0 -0
  2455. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/deepseek_attn.py +0 -0
  2456. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/flash_attention.py +0 -0
  2457. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/gated_delta_rule.py +0 -0
  2458. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/gated_linear_attention.py +0 -0
  2459. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/grouped_matmul.py +0 -0
  2460. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/kernel_delta_attention.py +0 -0
  2461. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/lightning_attention.py +0 -0
  2462. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/multi_head_latent_attention.py +0 -0
  2463. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/multi_latent_ragged_page_attention.py +0 -0
  2464. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/multi_latent_ragged_page_attention_v2.py +0 -0
  2465. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/native_sparse_attention.py +0 -0
  2466. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/page_attention.py +0 -0
  2467. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/pooling.py +0 -0
  2468. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/prefill_page_attention.py +0 -0
  2469. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/quantized_matmul.py +0 -0
  2470. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/ragged_decode_attention.py +0 -0
  2471. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/ragged_gated_delta_rule.py +0 -0
  2472. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/ragged_page_attention_v2.py +0 -0
  2473. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/ragged_page_attention_v2_turboquant.py +0 -0
  2474. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/ragged_page_attention_v3.py +0 -0
  2475. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/ragged_page_attention_v3_turboquant.py +0 -0
  2476. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/recurrent.py +0 -0
  2477. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/reduce_scatter_matmul.py +0 -0
  2478. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/ring_attention.py +0 -0
  2479. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/rwkv4.py +0 -0
  2480. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/rwkv6.py +0 -0
  2481. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/rwkv7.py +0 -0
  2482. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/scaled_dot_product_attention.py +0 -0
  2483. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/state_space_v1.py +0 -0
  2484. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/state_space_v2.py +0 -0
  2485. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/modules/operations/unified_attention.py +0 -0
  2486. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/__init__.py +0 -0
  2487. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/config/__init__.py +0 -0
  2488. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/config/cache.py +0 -0
  2489. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/config/persistent.py +0 -0
  2490. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/config/selection.py +0 -0
  2491. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/core/__init__.py +0 -0
  2492. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/core/kernel.py +0 -0
  2493. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/core/types.py +0 -0
  2494. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/execution/__init__.py +0 -0
  2495. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/execution/batch.py +0 -0
  2496. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/execution/executor.py +0 -0
  2497. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/execution/offline.py +0 -0
  2498. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/execution/profiler.py +0 -0
  2499. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/execution/tuning.py +0 -0
  2500. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/registry.py +0 -0
  2501. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/utils/__init__.py +0 -0
  2502. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/utils/datacarrier.py +0 -0
  2503. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/utils/fingerprint.py +0 -0
  2504. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/utils/meta.py +0 -0
  2505. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/ops/utils/serialize.py +0 -0
  2506. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/__init__.py +0 -0
  2507. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/_quants/__init__.py +0 -0
  2508. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/_quants/quantizations.py +0 -0
  2509. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/_utils/__init__.py +0 -0
  2510. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/_utils/bitpack.py +0 -0
  2511. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/_utils/fp_tables.py +0 -0
  2512. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/_utils/grouping.py +0 -0
  2513. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/_utils/qparams.py +0 -0
  2514. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/quantized_array.py +0 -0
  2515. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/runtime.py +0 -0
  2516. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/turboquant/__init__.py +0 -0
  2517. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/turboquant/codebook.py +0 -0
  2518. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/turboquant/matrices.py +0 -0
  2519. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/turboquant/ops.py +0 -0
  2520. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/quantization/turboquant/packing.py +0 -0
  2521. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/types/__init__.py +0 -0
  2522. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/types/mask.py +0 -0
  2523. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/utils.py +0 -0
  2524. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/xla_utils/__init__.py +0 -0
  2525. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/xla_utils/cumsum.py +0 -0
  2526. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/xla_utils/shardings.py +0 -0
  2527. {ejkernel-0.0.76 → ejkernel-0.0.78}/ejkernel/xla_utils/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: ejkernel
3
- Version: 0.0.76
3
+ Version: 0.0.78
4
4
  Summary: Accelerate, Optimize performance with streamlined training and serving options with JAX.
5
5
  Keywords: Deep Learning,Machine Learning,JAX,CUDA,XLA,Triton,Pallas
6
6
  Author: Erfan Zare Chavoshi
@@ -43,7 +43,7 @@ import os as _os
43
43
  _os.environ.setdefault("TF_GPU_ALLOCATOR", "cuda_malloc_async")
44
44
  _os.environ.setdefault("CUTE_DSL_ENABLE_TVM_FFI", "1")
45
45
 
46
- __version__ = "0.0.76"
46
+ __version__ = "0.0.78"
47
47
 
48
48
  from . import errors, kernels, modules, types, utils, xla_utils
49
49
  from .errors import EjkernelRuntimeError
@@ -34,7 +34,7 @@ from jax.experimental import pallas as pl
34
34
  from jax.experimental.pallas import tpu as pltpu
35
35
  from jaxtyping import Array, Float
36
36
 
37
- from ...._xla.gated_delta_rule._xla_impl_fwd import _l2norm_with_inv
37
+ from ...._xla.gated_delta_rule._xla_impl_fwd import _l2norm_with_inv, _recurrent_gdr_fwd
38
38
 
39
39
  _P = lax.Precision.DEFAULT
40
40
  _N_FUSE = 1
@@ -53,7 +53,15 @@ def _chunk_blockspec(shape: tuple[int, ...]) -> pl.BlockSpec:
53
53
  def _neumann_inv(A, C, strict_lower=None, lower_mask=None):
54
54
  """Compute (I - A)^{-1} via repeated squaring. Input must be pre-sanitized."""
55
55
  _hp = lax.Precision.HIGHEST
56
- num_iters = min(math.ceil(math.log2(C)), 4) if C > 1 else 0
56
+ # ``A`` is strict-lower triangular, so the Neumann series terminates
57
+ # exactly after at most ``C - 1`` powers. Repeated squaring needs
58
+ # ``ceil(log2(C))`` stages to materialize all terms up to ``A^(C-1)``.
59
+ #
60
+ # Clipping this to 4 only reconstructs powers through ``A^15``. That
61
+ # makes partially-filled chunks numerically wrong once the valid prefix
62
+ # exceeds ~16 tokens, which shows up most clearly on padded-heavy SFT
63
+ # batches where the last chunk is only partially active.
64
+ num_iters = math.ceil(math.log2(C)) if C > 1 else 0
57
65
  if strict_lower is None:
58
66
  strict_lower = jnp.tril(jnp.ones((C, C), dtype=jnp.float32), k=-1)
59
67
  if lower_mask is None:
@@ -511,6 +519,37 @@ def _chunk_gdr_bwd_rule(chunk_size, use_qk_l2norm, res, g):
511
519
  _chunk_gdr_fwd.defvjp(_chunk_gdr_fwd_rule, _chunk_gdr_bwd_rule)
512
520
 
513
521
 
522
+ def _chunk_gdr_fwd(
523
+ query: Float[Array, "batch num_heads seq_len head_dim"],
524
+ key: Float[Array, "batch num_heads seq_len head_dim"],
525
+ value: Float[Array, "batch num_heads seq_len d_state"],
526
+ beta: Float[Array, "batch num_heads seq_len"],
527
+ decay: Float[Array, "batch num_heads seq_len"] | None,
528
+ chunk_size: int = 64,
529
+ initial_state: Float[Array, "batch num_heads head_dim d_state"] | None = None,
530
+ use_qk_l2norm: bool = True,
531
+ ) -> tuple[
532
+ Float[Array, "batch num_heads seq_len d_state"],
533
+ Float[Array, "batch num_heads head_dim d_state"],
534
+ ]:
535
+ """Exact multi-token chunked GDR path for TPU.
536
+
537
+ Keep the optimized Pallas single-token decode kernel, but route the
538
+ unstable multi-token training/prefill path through the exact chunked
539
+ triangular-solve implementation.
540
+ """
541
+ return _recurrent_gdr_fwd(
542
+ query=query,
543
+ key=key,
544
+ value=value,
545
+ beta=beta,
546
+ decay=decay,
547
+ initial_state=initial_state,
548
+ use_qk_l2norm=use_qk_l2norm,
549
+ chunk_size=chunk_size,
550
+ )
551
+
552
+
514
553
  def _gdr_single_step_fwd_kernel(q_ref, k_ref, v_ref, beta_ref, decay_ref, state_ref, out_ref, final_state_ref):
515
554
  q_t = q_ref[0, 0, 0].astype(jnp.float32)
516
555
  k_t = k_ref[0, 0, 0].astype(jnp.float32)
@@ -174,9 +174,9 @@ def _recurrent_gdr_fwd(
174
174
  initial_state = initial_state.astype(jnp.float32)
175
175
 
176
176
  if decay is None:
177
- decay = jnp.zeros((B, H, L), dtype=jnp.float32)
177
+ decay = jnp.zeros((B, H, L), dtype=input_dtype)
178
178
  else:
179
- decay = decay.astype(jnp.float32)
179
+ decay = decay.astype(input_dtype)
180
180
 
181
181
  pad_size = (C - L % C) % C
182
182
  if pad_size > 0:
@@ -205,7 +205,7 @@ def _recurrent_gdr_fwd(
205
205
  strict_lower = jnp.tril(jnp.ones((C, C), dtype=jnp.bool_), k=-1)
206
206
  lower_mask = jnp.tril(jnp.ones((C, C), dtype=jnp.bool_))
207
207
  g_diff = jnp.where(strict_lower, g_diff, -1e30)
208
- S = jnp.where(strict_lower, S * jnp.exp(g_diff), 0.0)
208
+ S = jnp.where(strict_lower, S * jnp.exp(jnp.clip(g_diff, -20.0, 20.0)), 0.0)
209
209
 
210
210
  eye = jnp.eye(C, dtype=jnp.float32)
211
211
  lhs = jnp.broadcast_to(eye, S.shape) + S
@@ -223,17 +223,17 @@ def _recurrent_gdr_fwd(
223
223
  input_dtype
224
224
  )
225
225
 
226
- k_beta_g = k_beta.astype(jnp.float32) * jnp.exp(g_cumsum)[..., None]
226
+ k_beta_g = k_beta.astype(jnp.float32) * jnp.exp(jnp.clip(g_cumsum, -20.0, 20.0))[..., None]
227
227
  w_chunks = jnp.einsum("bhcij,bhcjk->bhcik", A, k_beta_g, precision=_MATMUL_PRECISION).astype(input_dtype)
228
228
 
229
229
  attn_qk = jnp.einsum("bhcik,bhcjk->bhcij", q_c, k_c, precision=_MATMUL_PRECISION).astype(jnp.float32)
230
230
  g_diff_intra = g_cumsum[..., :, None] - g_cumsum[..., None, :]
231
231
  g_diff_intra = jnp.where(lower_mask, g_diff_intra, -1e30)
232
- attn_i = jnp.where(lower_mask, attn_qk * jnp.exp(g_diff_intra), 0.0).astype(input_dtype)
232
+ attn_i = jnp.where(lower_mask, attn_qk * jnp.exp(jnp.clip(g_diff_intra, -20.0, 20.0)), 0.0).astype(input_dtype)
233
233
 
234
- q_g = (q_c.astype(jnp.float32) * jnp.exp(g_cumsum)[..., None]).astype(input_dtype)
235
- g_end_exp = jnp.exp(g_cumsum[..., -1])[..., None, None]
236
- g_diff_state = jnp.exp(g_cumsum[..., -1, None] - g_cumsum)[..., None]
234
+ q_g = (q_c.astype(jnp.float32) * jnp.exp(jnp.clip(g_cumsum, -20.0, 20.0))[..., None]).astype(input_dtype)
235
+ g_end_exp = jnp.exp(jnp.clip(g_cumsum[..., -1], -20.0, 20.0))[..., None, None]
236
+ g_diff_state = jnp.exp(jnp.clip(g_cumsum[..., -1, None] - g_cumsum, -20.0, 20.0))[..., None]
237
237
  k_g_diff = (k_c.astype(jnp.float32) * g_diff_state).astype(input_dtype)
238
238
 
239
239
  xs = (
@@ -339,9 +339,9 @@ def _chunk_gdr_fwd_core(
339
339
  key, k_inv_norm = _l2norm_with_inv(key, axis=-1, eps=1e-6)
340
340
 
341
341
  if decay is None:
342
- decay = jnp.zeros((B, H, L), dtype=input_dtype)
342
+ decay = jnp.zeros((B, H, L), dtype=jnp.float32)
343
343
  else:
344
- decay = decay.astype(input_dtype)
344
+ decay = decay.astype(jnp.float32)
345
345
 
346
346
  pad_size = (chunk_size - L % chunk_size) % chunk_size
347
347
  if pad_size > 0:
@@ -374,7 +374,7 @@ def _chunk_gdr_fwd_core(
374
374
 
375
375
  g_diff = g_cumsum[:, :, :, :, None] - g_cumsum[:, :, :, None, :]
376
376
  g_diff = jnp.tril(g_diff)
377
- decay_mask = jnp.exp(g_diff)
377
+ decay_mask = jnp.exp(jnp.clip(g_diff, -20.0, 20.0))
378
378
  decay_mask = jnp.tril(decay_mask)
379
379
 
380
380
  attn = jnp.einsum("bhcik,bhcjk->bhcij", k_beta, key, precision=_MATMUL_PRECISION)
@@ -387,10 +387,10 @@ def _chunk_gdr_fwd_core(
387
387
 
388
388
  attn = jnp.nan_to_num(inv, nan=0.0, posinf=0.0, neginf=0.0).astype(input_dtype)
389
389
 
390
- g_cumsum_exp = jnp.exp(g_cumsum).astype(input_dtype)
390
+ g_cumsum_exp = jnp.exp(jnp.clip(g_cumsum, -20.0, 20.0)).astype(input_dtype)
391
391
  g_end = g_cumsum[:, :, :, -1]
392
- g_end_exp = jnp.exp(g_end).astype(input_dtype)
393
- g_diff_state_exp = jnp.exp(g_end[:, :, :, None] - g_cumsum).astype(input_dtype)
392
+ g_end_exp = jnp.exp(jnp.clip(g_end, -20.0, 20.0)).astype(input_dtype)
393
+ g_diff_state_exp = jnp.exp(jnp.clip(g_end[:, :, :, None] - g_cumsum, -20.0, 20.0)).astype(input_dtype)
394
394
 
395
395
  value_local = jnp.einsum("bhcij,bhcjv->bhciv", attn, v_beta, precision=_MATMUL_PRECISION)
396
396
  k_beta_scaled = k_beta * g_cumsum_exp[:, :, :, :, None]
@@ -424,15 +424,21 @@ def _chunk_gdr_fwd_core(
424
424
  q_scaled = q_i * g_exp_i[:, :, :, None]
425
425
  qk_fused = jnp.stack([k_cumdecay_i, q_scaled], axis=0)
426
426
  both = jnp.einsum("nbhik,bhkv->nbhiv", qk_fused, state, precision=_MATMUL_PRECISION)
427
- v_prime, attn_inter = both[0], both[1]
428
-
429
- v_new = v_i - v_prime
430
- core_out = attn_inter + jnp.einsum("bhij,bhjv->bhiv", attn_qk, v_new, precision=_MATMUL_PRECISION)
427
+ v_prime = jnp.nan_to_num(both[0], nan=0.0, posinf=0.0, neginf=0.0)
428
+ attn_inter = jnp.nan_to_num(both[1], nan=0.0, posinf=0.0, neginf=0.0)
429
+
430
+ v_new = jnp.nan_to_num(v_i - v_prime, nan=0.0, posinf=0.0, neginf=0.0)
431
+ core_out = jnp.nan_to_num(
432
+ attn_inter + jnp.einsum("bhij,bhjv->bhiv", attn_qk, v_new, precision=_MATMUL_PRECISION),
433
+ nan=0.0,
434
+ posinf=0.0,
435
+ neginf=0.0,
436
+ )
431
437
 
432
438
  state_decayed = state * g_end_exp_i[:, :, None, None]
433
439
  k_scaled = k_i * g_diff_exp_i[:, :, :, None]
434
440
  state_update = jnp.einsum("bhik,bhiv->bhkv", k_scaled, v_new, precision=_MATMUL_PRECISION)
435
- new_state = (state_decayed + state_update).astype(state.dtype)
441
+ new_state = jnp.nan_to_num(state_decayed + state_update, nan=0.0, posinf=0.0, neginf=0.0).astype(state.dtype)
436
442
 
437
443
  return new_state, core_out.astype(input_dtype)
438
444
 
@@ -537,6 +543,38 @@ def _chunk_gdr_bwd_rule(chunk_size, use_qk_l2norm, res, g):
537
543
  _chunk_gdr_fwd.defvjp(_chunk_gdr_fwd_rule, _chunk_gdr_bwd_rule)
538
544
 
539
545
 
546
+ def _chunk_gdr_fwd(
547
+ query: Float[Array, "batch num_heads seq_len head_dim"],
548
+ key: Float[Array, "batch num_heads seq_len head_dim"],
549
+ value: Float[Array, "batch num_heads seq_len d_state"],
550
+ beta: Float[Array, "batch num_heads seq_len"],
551
+ decay: Float[Array, "batch num_heads seq_len"] | None,
552
+ chunk_size: int = 64,
553
+ initial_state: Float[Array, "batch num_heads head_dim d_state"] | None = None,
554
+ use_qk_l2norm: bool = True,
555
+ ) -> tuple[
556
+ Float[Array, "batch num_heads seq_len d_state"],
557
+ Float[Array, "batch num_heads head_dim d_state"],
558
+ ]:
559
+ """Exact multi-token chunked GDR path.
560
+
561
+ The previous Neumann/custom-VJP implementation diverges catastrophically on
562
+ real padded SFT batches even though isolated tensor probes looked small.
563
+ Use the exact triangular-solve chunked formulation for the production
564
+ multi-token path and rely on standard autodiff through it.
565
+ """
566
+ return _recurrent_gdr_fwd(
567
+ query=query,
568
+ key=key,
569
+ value=value,
570
+ beta=beta,
571
+ decay=decay,
572
+ initial_state=initial_state,
573
+ use_qk_l2norm=use_qk_l2norm,
574
+ chunk_size=chunk_size,
575
+ )
576
+
577
+
540
578
  def _single_step_gdr_fwd(
541
579
  query: Float[Array, "batch num_heads 1 head_dim"],
542
580
  key: Float[Array, "batch num_heads 1 head_dim"],
@@ -4,7 +4,7 @@ build-backend = "uv_build"
4
4
 
5
5
  [project]
6
6
  name = "ejkernel"
7
- version = "0.0.76"
7
+ version = "0.0.78"
8
8
  authors = [{ name = "Erfan Zare Chavoshi", email = "Erfanzare810@gmail.com" }]
9
9
  description = "Accelerate, Optimize performance with streamlined training and serving options with JAX."
10
10
  readme = "README.md"
File without changes
File without changes