sequenzo 0.1.31__cp310-cp310-macosx_10_9_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (299) hide show
  1. _sequenzo_fastcluster.cpython-310-darwin.so +0 -0
  2. sequenzo/__init__.py +349 -0
  3. sequenzo/big_data/__init__.py +12 -0
  4. sequenzo/big_data/clara/__init__.py +26 -0
  5. sequenzo/big_data/clara/clara.py +476 -0
  6. sequenzo/big_data/clara/utils/__init__.py +27 -0
  7. sequenzo/big_data/clara/utils/aggregatecases.py +92 -0
  8. sequenzo/big_data/clara/utils/davies_bouldin.py +91 -0
  9. sequenzo/big_data/clara/utils/get_weighted_diss.cpython-310-darwin.so +0 -0
  10. sequenzo/big_data/clara/utils/wfcmdd.py +205 -0
  11. sequenzo/big_data/clara/visualization.py +88 -0
  12. sequenzo/clustering/KMedoids.py +178 -0
  13. sequenzo/clustering/__init__.py +30 -0
  14. sequenzo/clustering/clustering_c_code.cpython-310-darwin.so +0 -0
  15. sequenzo/clustering/hierarchical_clustering.py +1256 -0
  16. sequenzo/clustering/sequenzo_fastcluster/fastcluster.py +495 -0
  17. sequenzo/clustering/sequenzo_fastcluster/src/fastcluster.cpp +1877 -0
  18. sequenzo/clustering/sequenzo_fastcluster/src/fastcluster_python.cpp +1264 -0
  19. sequenzo/clustering/src/KMedoid.cpp +263 -0
  20. sequenzo/clustering/src/PAM.cpp +237 -0
  21. sequenzo/clustering/src/PAMonce.cpp +265 -0
  22. sequenzo/clustering/src/cluster_quality.cpp +496 -0
  23. sequenzo/clustering/src/cluster_quality.h +128 -0
  24. sequenzo/clustering/src/cluster_quality_backup.cpp +570 -0
  25. sequenzo/clustering/src/module.cpp +228 -0
  26. sequenzo/clustering/src/weightedinertia.cpp +111 -0
  27. sequenzo/clustering/utils/__init__.py +27 -0
  28. sequenzo/clustering/utils/disscenter.py +122 -0
  29. sequenzo/data_preprocessing/__init__.py +22 -0
  30. sequenzo/data_preprocessing/helpers.py +303 -0
  31. sequenzo/datasets/__init__.py +41 -0
  32. sequenzo/datasets/biofam.csv +2001 -0
  33. sequenzo/datasets/biofam_child_domain.csv +2001 -0
  34. sequenzo/datasets/biofam_left_domain.csv +2001 -0
  35. sequenzo/datasets/biofam_married_domain.csv +2001 -0
  36. sequenzo/datasets/chinese_colonial_territories.csv +12 -0
  37. sequenzo/datasets/country_co2_emissions.csv +194 -0
  38. sequenzo/datasets/country_co2_emissions_global_deciles.csv +195 -0
  39. sequenzo/datasets/country_co2_emissions_global_quintiles.csv +195 -0
  40. sequenzo/datasets/country_co2_emissions_local_deciles.csv +195 -0
  41. sequenzo/datasets/country_co2_emissions_local_quintiles.csv +195 -0
  42. sequenzo/datasets/country_gdp_per_capita.csv +194 -0
  43. sequenzo/datasets/dyadic_children.csv +61 -0
  44. sequenzo/datasets/dyadic_parents.csv +61 -0
  45. sequenzo/datasets/mvad.csv +713 -0
  46. sequenzo/datasets/pairfam_activity_by_month.csv +1028 -0
  47. sequenzo/datasets/pairfam_activity_by_year.csv +1028 -0
  48. sequenzo/datasets/pairfam_family_by_month.csv +1028 -0
  49. sequenzo/datasets/pairfam_family_by_year.csv +1028 -0
  50. sequenzo/datasets/political_science_aid_shock.csv +166 -0
  51. sequenzo/datasets/political_science_donor_fragmentation.csv +157 -0
  52. sequenzo/define_sequence_data.py +1400 -0
  53. sequenzo/dissimilarity_measures/__init__.py +31 -0
  54. sequenzo/dissimilarity_measures/c_code.cpython-310-darwin.so +0 -0
  55. sequenzo/dissimilarity_measures/get_distance_matrix.py +762 -0
  56. sequenzo/dissimilarity_measures/get_substitution_cost_matrix.py +246 -0
  57. sequenzo/dissimilarity_measures/src/DHDdistance.cpp +148 -0
  58. sequenzo/dissimilarity_measures/src/LCPdistance.cpp +114 -0
  59. sequenzo/dissimilarity_measures/src/LCPspellDistance.cpp +215 -0
  60. sequenzo/dissimilarity_measures/src/OMdistance.cpp +247 -0
  61. sequenzo/dissimilarity_measures/src/OMspellDistance.cpp +281 -0
  62. sequenzo/dissimilarity_measures/src/__init__.py +0 -0
  63. sequenzo/dissimilarity_measures/src/dist2matrix.cpp +63 -0
  64. sequenzo/dissimilarity_measures/src/dp_utils.h +160 -0
  65. sequenzo/dissimilarity_measures/src/module.cpp +40 -0
  66. sequenzo/dissimilarity_measures/src/setup.py +30 -0
  67. sequenzo/dissimilarity_measures/src/utils.h +25 -0
  68. sequenzo/dissimilarity_measures/src/xsimd/.github/cmake-test/main.cpp +6 -0
  69. sequenzo/dissimilarity_measures/src/xsimd/benchmark/main.cpp +159 -0
  70. sequenzo/dissimilarity_measures/src/xsimd/benchmark/xsimd_benchmark.hpp +565 -0
  71. sequenzo/dissimilarity_measures/src/xsimd/docs/source/conf.py +37 -0
  72. sequenzo/dissimilarity_measures/src/xsimd/examples/mandelbrot.cpp +330 -0
  73. sequenzo/dissimilarity_measures/src/xsimd/examples/pico_bench.hpp +246 -0
  74. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/common/xsimd_common_arithmetic.hpp +266 -0
  75. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/common/xsimd_common_complex.hpp +112 -0
  76. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/common/xsimd_common_details.hpp +323 -0
  77. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/common/xsimd_common_logical.hpp +218 -0
  78. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/common/xsimd_common_math.hpp +2583 -0
  79. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/common/xsimd_common_memory.hpp +880 -0
  80. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/common/xsimd_common_rounding.hpp +72 -0
  81. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/common/xsimd_common_swizzle.hpp +174 -0
  82. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/common/xsimd_common_trigo.hpp +978 -0
  83. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx.hpp +1924 -0
  84. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx2.hpp +1144 -0
  85. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512bw.hpp +656 -0
  86. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512cd.hpp +28 -0
  87. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512dq.hpp +244 -0
  88. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512er.hpp +20 -0
  89. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512f.hpp +2650 -0
  90. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512ifma.hpp +20 -0
  91. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512pf.hpp +20 -0
  92. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512vbmi.hpp +77 -0
  93. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512vbmi2.hpp +131 -0
  94. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512vnni_avx512bw.hpp +20 -0
  95. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avx512vnni_avx512vbmi2.hpp +20 -0
  96. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_avxvnni.hpp +20 -0
  97. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_common.hpp +24 -0
  98. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_common_fwd.hpp +77 -0
  99. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_constants.hpp +393 -0
  100. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_emulated.hpp +788 -0
  101. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_fma3_avx.hpp +93 -0
  102. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_fma3_avx2.hpp +46 -0
  103. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_fma3_sse.hpp +97 -0
  104. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_fma4.hpp +92 -0
  105. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_i8mm_neon64.hpp +17 -0
  106. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_isa.hpp +142 -0
  107. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_neon.hpp +3142 -0
  108. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_neon64.hpp +1543 -0
  109. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_rvv.hpp +1513 -0
  110. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_scalar.hpp +1260 -0
  111. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_sse2.hpp +2024 -0
  112. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_sse3.hpp +67 -0
  113. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_sse4_1.hpp +339 -0
  114. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_sse4_2.hpp +44 -0
  115. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_ssse3.hpp +186 -0
  116. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_sve.hpp +1155 -0
  117. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_vsx.hpp +892 -0
  118. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/arch/xsimd_wasm.hpp +1780 -0
  119. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/config/xsimd_arch.hpp +240 -0
  120. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/config/xsimd_config.hpp +484 -0
  121. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/config/xsimd_cpuid.hpp +269 -0
  122. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/config/xsimd_inline.hpp +27 -0
  123. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/math/xsimd_rem_pio2.hpp +719 -0
  124. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/memory/xsimd_aligned_allocator.hpp +349 -0
  125. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/memory/xsimd_alignment.hpp +91 -0
  126. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_all_registers.hpp +55 -0
  127. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_api.hpp +2765 -0
  128. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx2_register.hpp +44 -0
  129. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512bw_register.hpp +51 -0
  130. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512cd_register.hpp +51 -0
  131. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512dq_register.hpp +51 -0
  132. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512er_register.hpp +51 -0
  133. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512f_register.hpp +77 -0
  134. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512ifma_register.hpp +51 -0
  135. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512pf_register.hpp +51 -0
  136. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512vbmi2_register.hpp +51 -0
  137. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512vbmi_register.hpp +51 -0
  138. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512vnni_avx512bw_register.hpp +54 -0
  139. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx512vnni_avx512vbmi2_register.hpp +53 -0
  140. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avx_register.hpp +64 -0
  141. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_avxvnni_register.hpp +44 -0
  142. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_batch.hpp +1524 -0
  143. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_batch_constant.hpp +300 -0
  144. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_common_arch.hpp +47 -0
  145. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_emulated_register.hpp +80 -0
  146. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_fma3_avx2_register.hpp +50 -0
  147. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_fma3_avx_register.hpp +50 -0
  148. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_fma3_sse_register.hpp +50 -0
  149. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_fma4_register.hpp +50 -0
  150. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_i8mm_neon64_register.hpp +55 -0
  151. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_neon64_register.hpp +55 -0
  152. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_neon_register.hpp +154 -0
  153. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_register.hpp +94 -0
  154. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_rvv_register.hpp +506 -0
  155. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_sse2_register.hpp +59 -0
  156. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_sse3_register.hpp +49 -0
  157. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_sse4_1_register.hpp +48 -0
  158. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_sse4_2_register.hpp +48 -0
  159. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_ssse3_register.hpp +48 -0
  160. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_sve_register.hpp +156 -0
  161. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_traits.hpp +337 -0
  162. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_utils.hpp +536 -0
  163. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_vsx_register.hpp +77 -0
  164. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/types/xsimd_wasm_register.hpp +59 -0
  165. sequenzo/dissimilarity_measures/src/xsimd/include/xsimd/xsimd.hpp +75 -0
  166. sequenzo/dissimilarity_measures/src/xsimd/test/architectures/dummy.cpp +7 -0
  167. sequenzo/dissimilarity_measures/src/xsimd/test/doc/explicit_use_of_an_instruction_set.cpp +13 -0
  168. sequenzo/dissimilarity_measures/src/xsimd/test/doc/explicit_use_of_an_instruction_set_mean.cpp +24 -0
  169. sequenzo/dissimilarity_measures/src/xsimd/test/doc/explicit_use_of_an_instruction_set_mean_aligned.cpp +25 -0
  170. sequenzo/dissimilarity_measures/src/xsimd/test/doc/explicit_use_of_an_instruction_set_mean_arch_independent.cpp +28 -0
  171. sequenzo/dissimilarity_measures/src/xsimd/test/doc/explicit_use_of_an_instruction_set_mean_tag_dispatch.cpp +25 -0
  172. sequenzo/dissimilarity_measures/src/xsimd/test/doc/manipulating_abstract_batches.cpp +7 -0
  173. sequenzo/dissimilarity_measures/src/xsimd/test/doc/manipulating_parametric_batches.cpp +8 -0
  174. sequenzo/dissimilarity_measures/src/xsimd/test/doc/sum.hpp +31 -0
  175. sequenzo/dissimilarity_measures/src/xsimd/test/doc/sum_avx2.cpp +3 -0
  176. sequenzo/dissimilarity_measures/src/xsimd/test/doc/sum_sse2.cpp +3 -0
  177. sequenzo/dissimilarity_measures/src/xsimd/test/doc/writing_vectorized_code.cpp +11 -0
  178. sequenzo/dissimilarity_measures/src/xsimd/test/main.cpp +31 -0
  179. sequenzo/dissimilarity_measures/src/xsimd/test/test_api.cpp +230 -0
  180. sequenzo/dissimilarity_measures/src/xsimd/test/test_arch.cpp +217 -0
  181. sequenzo/dissimilarity_measures/src/xsimd/test/test_basic_math.cpp +183 -0
  182. sequenzo/dissimilarity_measures/src/xsimd/test/test_batch.cpp +1049 -0
  183. sequenzo/dissimilarity_measures/src/xsimd/test/test_batch_bool.cpp +508 -0
  184. sequenzo/dissimilarity_measures/src/xsimd/test/test_batch_cast.cpp +409 -0
  185. sequenzo/dissimilarity_measures/src/xsimd/test/test_batch_complex.cpp +712 -0
  186. sequenzo/dissimilarity_measures/src/xsimd/test/test_batch_constant.cpp +286 -0
  187. sequenzo/dissimilarity_measures/src/xsimd/test/test_batch_float.cpp +141 -0
  188. sequenzo/dissimilarity_measures/src/xsimd/test/test_batch_int.cpp +365 -0
  189. sequenzo/dissimilarity_measures/src/xsimd/test/test_batch_manip.cpp +308 -0
  190. sequenzo/dissimilarity_measures/src/xsimd/test/test_bitwise_cast.cpp +222 -0
  191. sequenzo/dissimilarity_measures/src/xsimd/test/test_complex_exponential.cpp +226 -0
  192. sequenzo/dissimilarity_measures/src/xsimd/test/test_complex_hyperbolic.cpp +183 -0
  193. sequenzo/dissimilarity_measures/src/xsimd/test/test_complex_power.cpp +265 -0
  194. sequenzo/dissimilarity_measures/src/xsimd/test/test_complex_trigonometric.cpp +236 -0
  195. sequenzo/dissimilarity_measures/src/xsimd/test/test_conversion.cpp +248 -0
  196. sequenzo/dissimilarity_measures/src/xsimd/test/test_custom_default_arch.cpp +28 -0
  197. sequenzo/dissimilarity_measures/src/xsimd/test/test_error_gamma.cpp +170 -0
  198. sequenzo/dissimilarity_measures/src/xsimd/test/test_explicit_batch_instantiation.cpp +32 -0
  199. sequenzo/dissimilarity_measures/src/xsimd/test/test_exponential.cpp +202 -0
  200. sequenzo/dissimilarity_measures/src/xsimd/test/test_extract_pair.cpp +92 -0
  201. sequenzo/dissimilarity_measures/src/xsimd/test/test_fp_manipulation.cpp +77 -0
  202. sequenzo/dissimilarity_measures/src/xsimd/test/test_gnu_source.cpp +30 -0
  203. sequenzo/dissimilarity_measures/src/xsimd/test/test_hyperbolic.cpp +167 -0
  204. sequenzo/dissimilarity_measures/src/xsimd/test/test_load_store.cpp +304 -0
  205. sequenzo/dissimilarity_measures/src/xsimd/test/test_memory.cpp +61 -0
  206. sequenzo/dissimilarity_measures/src/xsimd/test/test_poly_evaluation.cpp +64 -0
  207. sequenzo/dissimilarity_measures/src/xsimd/test/test_power.cpp +184 -0
  208. sequenzo/dissimilarity_measures/src/xsimd/test/test_rounding.cpp +199 -0
  209. sequenzo/dissimilarity_measures/src/xsimd/test/test_select.cpp +101 -0
  210. sequenzo/dissimilarity_measures/src/xsimd/test/test_shuffle.cpp +760 -0
  211. sequenzo/dissimilarity_measures/src/xsimd/test/test_sum.cpp +4 -0
  212. sequenzo/dissimilarity_measures/src/xsimd/test/test_sum.hpp +34 -0
  213. sequenzo/dissimilarity_measures/src/xsimd/test/test_traits.cpp +172 -0
  214. sequenzo/dissimilarity_measures/src/xsimd/test/test_trigonometric.cpp +208 -0
  215. sequenzo/dissimilarity_measures/src/xsimd/test/test_utils.hpp +611 -0
  216. sequenzo/dissimilarity_measures/src/xsimd/test/test_wasm/test_wasm_playwright.py +123 -0
  217. sequenzo/dissimilarity_measures/src/xsimd/test/test_xsimd_api.cpp +1460 -0
  218. sequenzo/dissimilarity_measures/utils/__init__.py +16 -0
  219. sequenzo/dissimilarity_measures/utils/get_LCP_length_for_2_seq.py +44 -0
  220. sequenzo/dissimilarity_measures/utils/get_sm_trate_substitution_cost_matrix.cpython-310-darwin.so +0 -0
  221. sequenzo/dissimilarity_measures/utils/seqconc.cpython-310-darwin.so +0 -0
  222. sequenzo/dissimilarity_measures/utils/seqdss.cpython-310-darwin.so +0 -0
  223. sequenzo/dissimilarity_measures/utils/seqdur.cpython-310-darwin.so +0 -0
  224. sequenzo/dissimilarity_measures/utils/seqlength.cpython-310-darwin.so +0 -0
  225. sequenzo/multidomain/__init__.py +23 -0
  226. sequenzo/multidomain/association_between_domains.py +311 -0
  227. sequenzo/multidomain/cat.py +597 -0
  228. sequenzo/multidomain/combt.py +519 -0
  229. sequenzo/multidomain/dat.py +81 -0
  230. sequenzo/multidomain/idcd.py +139 -0
  231. sequenzo/multidomain/linked_polyad.py +292 -0
  232. sequenzo/openmp_setup.py +233 -0
  233. sequenzo/prefix_tree/__init__.py +62 -0
  234. sequenzo/prefix_tree/hub.py +114 -0
  235. sequenzo/prefix_tree/individual_level_indicators.py +1321 -0
  236. sequenzo/prefix_tree/spell_individual_level_indicators.py +580 -0
  237. sequenzo/prefix_tree/spell_level_indicators.py +297 -0
  238. sequenzo/prefix_tree/system_level_indicators.py +544 -0
  239. sequenzo/prefix_tree/utils.py +54 -0
  240. sequenzo/seqhmm/__init__.py +95 -0
  241. sequenzo/seqhmm/advanced_optimization.py +305 -0
  242. sequenzo/seqhmm/bootstrap.py +411 -0
  243. sequenzo/seqhmm/build_hmm.py +142 -0
  244. sequenzo/seqhmm/build_mhmm.py +136 -0
  245. sequenzo/seqhmm/build_nhmm.py +121 -0
  246. sequenzo/seqhmm/fit_mhmm.py +62 -0
  247. sequenzo/seqhmm/fit_model.py +61 -0
  248. sequenzo/seqhmm/fit_nhmm.py +76 -0
  249. sequenzo/seqhmm/formulas.py +289 -0
  250. sequenzo/seqhmm/forward_backward_nhmm.py +276 -0
  251. sequenzo/seqhmm/gradients_nhmm.py +306 -0
  252. sequenzo/seqhmm/hmm.py +291 -0
  253. sequenzo/seqhmm/mhmm.py +314 -0
  254. sequenzo/seqhmm/model_comparison.py +238 -0
  255. sequenzo/seqhmm/multichannel_em.py +282 -0
  256. sequenzo/seqhmm/multichannel_utils.py +138 -0
  257. sequenzo/seqhmm/nhmm.py +270 -0
  258. sequenzo/seqhmm/nhmm_utils.py +191 -0
  259. sequenzo/seqhmm/predict.py +137 -0
  260. sequenzo/seqhmm/predict_mhmm.py +142 -0
  261. sequenzo/seqhmm/simulate.py +878 -0
  262. sequenzo/seqhmm/utils.py +218 -0
  263. sequenzo/seqhmm/visualization.py +910 -0
  264. sequenzo/sequence_characteristics/__init__.py +40 -0
  265. sequenzo/sequence_characteristics/complexity_index.py +49 -0
  266. sequenzo/sequence_characteristics/overall_cross_sectional_entropy.py +220 -0
  267. sequenzo/sequence_characteristics/plot_characteristics.py +593 -0
  268. sequenzo/sequence_characteristics/simple_characteristics.py +311 -0
  269. sequenzo/sequence_characteristics/state_frequencies_and_entropy_per_sequence.py +39 -0
  270. sequenzo/sequence_characteristics/turbulence.py +155 -0
  271. sequenzo/sequence_characteristics/variance_of_spell_durations.py +86 -0
  272. sequenzo/sequence_characteristics/within_sequence_entropy.py +43 -0
  273. sequenzo/suffix_tree/__init__.py +66 -0
  274. sequenzo/suffix_tree/hub.py +114 -0
  275. sequenzo/suffix_tree/individual_level_indicators.py +1679 -0
  276. sequenzo/suffix_tree/spell_individual_level_indicators.py +493 -0
  277. sequenzo/suffix_tree/spell_level_indicators.py +248 -0
  278. sequenzo/suffix_tree/system_level_indicators.py +535 -0
  279. sequenzo/suffix_tree/utils.py +56 -0
  280. sequenzo/version_check.py +283 -0
  281. sequenzo/visualization/__init__.py +29 -0
  282. sequenzo/visualization/plot_mean_time.py +222 -0
  283. sequenzo/visualization/plot_modal_state.py +276 -0
  284. sequenzo/visualization/plot_most_frequent_sequences.py +147 -0
  285. sequenzo/visualization/plot_relative_frequency.py +405 -0
  286. sequenzo/visualization/plot_sequence_index.py +1175 -0
  287. sequenzo/visualization/plot_single_medoid.py +153 -0
  288. sequenzo/visualization/plot_state_distribution.py +651 -0
  289. sequenzo/visualization/plot_transition_matrix.py +190 -0
  290. sequenzo/visualization/utils/__init__.py +23 -0
  291. sequenzo/visualization/utils/utils.py +310 -0
  292. sequenzo/with_event_history_analysis/__init__.py +35 -0
  293. sequenzo/with_event_history_analysis/sequence_analysis_multi_state_model.py +850 -0
  294. sequenzo/with_event_history_analysis/sequence_history_analysis.py +283 -0
  295. sequenzo-0.1.31.dist-info/METADATA +286 -0
  296. sequenzo-0.1.31.dist-info/RECORD +299 -0
  297. sequenzo-0.1.31.dist-info/WHEEL +5 -0
  298. sequenzo-0.1.31.dist-info/licenses/LICENSE +28 -0
  299. sequenzo-0.1.31.dist-info/top_level.txt +2 -0
@@ -0,0 +1,281 @@
1
+ #include <pybind11/pybind11.h>
2
+ #include <pybind11/numpy.h>
3
+ #include <vector>
4
+ #include <cmath>
5
+ #include <iostream>
6
+ #include "utils.h"
7
+ #include "dp_utils.h"
8
+ #ifdef _OPENMP
9
+ #include <omp.h>
10
+ #endif
11
+ #include <xsimd/xsimd.hpp>
12
+
13
+ namespace py = pybind11;
14
+
15
+ class OMspellDistance {
16
+ public:
17
+ OMspellDistance(py::array_t<int> sequences, py::array_t<double> sm, double indel, int norm, py::array_t<int> refseqS,
18
+ double timecost, py::array_t<double> seqdur, py::array_t<double> indellist, py::array_t<int> seqlength)
19
+ : indel(indel), norm(norm), timecost(timecost) {
20
+
21
+ py::print("[>] Starting Optimal Matching with spell(OMspell)...");
22
+ std::cout << std::flush;
23
+
24
+ try {
25
+ // ============================================
26
+ // parameter : sequences, sm, seqdur, indellist
27
+ // ============================================
28
+ this->sequences = sequences;
29
+ this->sm = sm;
30
+
31
+ this->seqdur = seqdur;
32
+ this->indellist = indellist;
33
+
34
+ this->seqlength = seqlength;
35
+
36
+ // ====================================================
37
+ // initialize nseq, seqlen, dist_matrix, fmatsize, fmat
38
+ // ====================================================
39
+ auto seq_shape = sequences.shape();
40
+ nseq = seq_shape[0];
41
+ len = seq_shape[1];
42
+
43
+ dist_matrix = py::array_t<double>({nseq, nseq});
44
+
45
+ fmatsize = len + 1;
46
+
47
+ // ====================
48
+ // initialize alphasize
49
+ // ====================
50
+ auto sm_shape = sm.shape();
51
+ alphasize = sm_shape[0];
52
+
53
+ // ==================
54
+ // initialize maxcost
55
+ // ==================
56
+ auto ptr = sm.mutable_unchecked<2>();
57
+
58
+ if(norm == 4){
59
+ maxscost = 2 * indel;
60
+ }else{
61
+ for(int i = 0; i < alphasize; i++){
62
+ for(int j = i+1; j < alphasize; j++){
63
+ if(ptr(i, j) > maxscost){
64
+ maxscost = ptr(i, j);
65
+ }
66
+ }
67
+ }
68
+ maxscost = std::min(maxscost, 2 * indel);
69
+ }
70
+
71
+ // about reference sequences :
72
+ nans = nseq;
73
+
74
+ rseq1 = refseqS.at(0);
75
+ rseq2 = refseqS.at(1);
76
+ if(rseq1 < rseq2){
77
+ nseq = rseq1;
78
+ nans = nseq * (rseq2 - rseq1);
79
+ }else{
80
+ rseq1 = rseq1 - 1;
81
+ }
82
+ refdist_matrix = py::array_t<double>({nseq, (rseq2-rseq1)});
83
+ } catch (const std::exception& e) {
84
+ py::print("Error in constructor: ", e.what());
85
+ throw;
86
+ }
87
+ }
88
+
89
+ // 对齐分配函数 moved to dp_utils.h
90
+
91
+ double getIndel(int i, int j, int state){
92
+ auto ptr_indel = indellist.mutable_unchecked<1>();
93
+ auto ptr_dur = seqdur.mutable_unchecked<2>();
94
+
95
+ return ptr_indel(state) + timecost * ptr_dur(i, j);
96
+ }
97
+
98
+ double getSubCost(int i_state, int j_state, int i_x, int i_y, int j_x, int j_y){
99
+ auto ptr_dur = seqdur.mutable_unchecked<2>();
100
+
101
+ if(i_state == j_state){
102
+ double diffdur = ptr_dur(i_x, i_y) - ptr_dur(j_x, j_y);
103
+
104
+ return abs(timecost * diffdur);
105
+ }else{
106
+ auto ptr_sm = sm.mutable_unchecked<2>();
107
+
108
+ return ptr_sm(i_state, j_state) +
109
+ (ptr_dur(i_x, i_y) + ptr_dur(j_x, j_y)) * timecost;
110
+ }
111
+ }
112
+
113
+ double compute_distance(int is, int js, double* prev, double* curr) {
114
+ try {
115
+ auto ptr_seq = sequences.unchecked<2>();
116
+ auto ptr_len = seqlength.unchecked<1>();
117
+ auto ptr_sm = sm.unchecked<2>();
118
+ auto ptr_dur = seqdur.unchecked<2>();
119
+ auto ptr_indel = indellist.unchecked<1>();
120
+
121
+ int i_state = 0, j_state = 0;
122
+ int mm = ptr_len(is);
123
+ int nn = ptr_len(js);
124
+ int mSuf = mm + 1;
125
+ int nSuf = nn + 1;
126
+
127
+ prev[0] = 0;
128
+ curr[0] = 0;
129
+
130
+ // initialize first row: cumulative insertions into js along columns
131
+ for (int jj = 1; jj < nSuf; jj++) {
132
+ int bj = ptr_seq(js, jj - 1);
133
+ prev[jj] = prev[jj - 1] + (ptr_indel(bj) + timecost * ptr_dur(js, jj - 1));
134
+ }
135
+
136
+ using batch_t = xsimd::batch<double>;
137
+ constexpr std::size_t B = batch_t::size;
138
+
139
+ for (int i = 1; i < mSuf; i++) {
140
+ i_state = ptr_seq(is, i - 1);
141
+ // per-row deletion cost (depends only on i_state and i position)
142
+ double dur_i = ptr_dur(is, i - 1);
143
+ double del_cost_i = ptr_indel(i_state) + timecost * dur_i;
144
+
145
+ // first column: cumulative deletions D[i][0] = D[i-1][0] + del_cost_i
146
+ curr[0] = prev[0] + del_cost_i;
147
+
148
+ int j = 1;
149
+ for (; j + (int)B <= nSuf; j += (int)B) {
150
+ const double* prev_ptr = prev + j;
151
+ const double* prevm1_ptr = prev + (j - 1);
152
+
153
+ batch_t prevj = batch_t::load_unaligned(prev_ptr);
154
+ batch_t prevjm1 = batch_t::load_unaligned(prevm1_ptr);
155
+
156
+ alignas(64) double subs[B];
157
+ alignas(64) double ins[B];
158
+ for (std::size_t b = 0; b < B; ++b) {
159
+ int jj_idx = j + (int)b - 1;
160
+ int bj = ptr_seq(js, jj_idx);
161
+ double dur_j = ptr_dur(js, jj_idx);
162
+
163
+ if (i_state == bj) {
164
+ subs[b] = std::abs(timecost * (dur_i - dur_j));
165
+ } else {
166
+ subs[b] = ptr_sm(i_state, bj) + (dur_i + dur_j) * timecost;
167
+ }
168
+ ins[b] = ptr_indel(bj) + timecost * dur_j;
169
+ }
170
+
171
+ batch_t sub_batch = batch_t::load_unaligned(subs);
172
+ batch_t cand_del = prevj + batch_t(del_cost_i);
173
+ batch_t cand_sub = prevjm1 + sub_batch;
174
+ batch_t vert = xsimd::min(cand_del, cand_sub);
175
+
176
+ double running = curr[j - 1] + ins[0];
177
+ for (std::size_t b = 0; b < B; ++b) {
178
+ double v = vert.get(b);
179
+ double c = std::min(v, running);
180
+ curr[j + (int)b] = c;
181
+ if (b + 1 < B) running = c + ins[b + 1];
182
+ }
183
+ }
184
+
185
+ // tail scalar handling
186
+ for (; j < nSuf; ++j) {
187
+ j_state = ptr_seq(js, j - 1);
188
+ double minimum = prev[j] + del_cost_i;
189
+ double j_indel = curr[j - 1] + (ptr_indel(j_state) + timecost * ptr_dur(js, j - 1));
190
+ double sub = prev[j - 1] + (
191
+ (i_state == j_state)
192
+ ? std::abs(timecost * (dur_i - ptr_dur(js, j - 1)))
193
+ : (ptr_sm(i_state, j_state) + (dur_i + ptr_dur(js, j - 1)) * timecost)
194
+ );
195
+ curr[j] = std::min({ minimum, j_indel, sub });
196
+ }
197
+
198
+ std::swap(prev, curr);
199
+ }
200
+
201
+ double maxpossiblecost = std::abs(nn - mm) * indel + maxscost * std::min(mm, nn);
202
+ double ml = double(mm) * indel;
203
+ double nl = double(nn) * indel;
204
+
205
+ return normalize_distance(prev[nSuf - 1], maxpossiblecost, ml, nl, norm);
206
+ } catch (const std::exception& e) {
207
+ py::print("Error in compute_distance: ", e.what());
208
+ throw;
209
+ }
210
+ }
211
+
212
+ py::array_t<double> compute_all_distances() {
213
+ try {
214
+ return dp_utils::compute_all_distances(
215
+ nseq,
216
+ fmatsize,
217
+ dist_matrix,
218
+ [this](int i, int j, double* prev, double* curr) {
219
+ return this->compute_distance(i, j, prev, curr);
220
+ }
221
+ );
222
+ } catch (const std::exception& e) {
223
+ py::print("Error in compute_all_distances: ", e.what());
224
+ throw;
225
+ }
226
+ }
227
+
228
+ py::array_t<double> compute_refseq_distances() {
229
+ try {
230
+ auto buffer = refdist_matrix.mutable_unchecked<2>();
231
+
232
+ #pragma omp parallel
233
+ {
234
+ double* prev = dp_utils::aligned_alloc_double(static_cast<size_t>(fmatsize));
235
+ double* curr = dp_utils::aligned_alloc_double(static_cast<size_t>(fmatsize));
236
+
237
+ #pragma omp for schedule(static)
238
+ for (int rseq = rseq1; rseq < rseq2; rseq ++) {
239
+ for (int is = 0; is < nseq; is ++) {
240
+ double cmpres = 0;
241
+ if(is != rseq){
242
+ cmpres = compute_distance(is, rseq, prev, curr);
243
+ }
244
+
245
+ buffer(is, rseq - rseq1) = cmpres;
246
+ }
247
+ }
248
+ dp_utils::aligned_free_double(prev);
249
+ dp_utils::aligned_free_double(curr);
250
+ }
251
+
252
+ return refdist_matrix;
253
+ } catch (const std::exception& e) {
254
+ py::print("Error in compute_all_distances: ", e.what());
255
+ throw;
256
+ }
257
+ }
258
+
259
+ private:
260
+ py::array_t<int> sequences;
261
+ py::array_t<int> seqlength;
262
+ py::array_t<double> sm;
263
+ double indel;
264
+ int norm;
265
+ int nseq;
266
+ int len;
267
+ int alphasize;
268
+ int fmatsize;
269
+ py::array_t<double> dist_matrix;
270
+ double maxscost;
271
+
272
+ double timecost;
273
+ py::array_t<double> seqdur;
274
+ py::array_t<double> indellist;
275
+
276
+ // about reference sequences :
277
+ int nans = -1;
278
+ int rseq1 = -1;
279
+ int rseq2 = -1;
280
+ py::array_t<double> refdist_matrix;
281
+ };
File without changes
@@ -0,0 +1,63 @@
1
+ #include <pybind11/pybind11.h>
2
+ #include <pybind11/numpy.h>
3
+ #include <vector>
4
+ #include <iostream>
5
+ #ifdef _OPENMP
6
+ #include <omp.h>
7
+ #endif
8
+
9
+ namespace py = pybind11;
10
+
11
+ class dist2matrix {
12
+ public:
13
+ dist2matrix(int nseq, py::array_t<int> seqdata_didxs, py::array_t<double> dist_dseqs_num)
14
+ : nseq(nseq) {
15
+
16
+ py::print("[>] Computing all pairwise distances...");
17
+ std::cout << std::flush;
18
+
19
+ try {
20
+ this->seqdata_didxs = seqdata_didxs;
21
+ this->dist_dseqs_num = dist_dseqs_num;
22
+
23
+ dist_matrix = py::array_t<double>({nseq, nseq});
24
+ } catch (const std::exception& e) {
25
+ py::print("Error in constructor: ", e.what());
26
+ throw;
27
+ }
28
+ }
29
+
30
+ py::array_t<double> padding_matrix() {
31
+ try {
32
+ auto idxs_buf = seqdata_didxs.unchecked<1>();
33
+ auto dist_buf = dist_dseqs_num.unchecked<2>();
34
+ auto buffer = dist_matrix.mutable_unchecked<2>();
35
+
36
+ #pragma omp parallel for schedule(static)
37
+ for (int i = 0; i < nseq; ++i) {
38
+ for (int j = i; j < nseq; ++j) {
39
+ buffer(i, j) = dist_buf(idxs_buf(i), idxs_buf(j));
40
+ }
41
+ }
42
+
43
+ #pragma omp parallel for schedule(static)
44
+ for (int i = 0; i < nseq; ++i) {
45
+ for (int j = i + 1; j < nseq; ++j) {
46
+ buffer(j, i) = buffer(i, j);
47
+ }
48
+ }
49
+
50
+ return dist_matrix;
51
+ } catch (const std::exception& e) {
52
+ py::print("Error in compute_all_distances: ", e.what());
53
+ throw;
54
+ }
55
+ }
56
+
57
+ private:
58
+ py::array_t<int> seqdata_didxs;
59
+ py::array_t<double> dist_dseqs_num;
60
+ int nseq = 0;
61
+
62
+ py::array_t<double> dist_matrix;
63
+ };
@@ -0,0 +1,160 @@
1
+ #pragma once
2
+
3
#include <pybind11/pybind11.h>
#include <pybind11/numpy.h>
#ifdef _OPENMP
#include <omp.h>
#endif
#include <cstdlib>
#include <exception>
#include <new>
10
+
11
+ namespace dp_utils {
12
+
13
+ // Cross-platform aligned allocation for double buffers
14
+ #ifdef _WIN32
15
+ inline double* aligned_alloc_double(size_t size, size_t align = 64) {
16
+ return reinterpret_cast<double*>(_aligned_malloc(size * sizeof(double), align));
17
+ }
18
+ inline void aligned_free_double(double* ptr) {
19
+ _aligned_free(ptr);
20
+ }
21
+ #else
22
+ inline double* aligned_alloc_double(size_t size, size_t align = 64) {
23
+ void* ptr = nullptr;
24
+ if (posix_memalign(&ptr, align, size * sizeof(double)) != 0) throw std::bad_alloc();
25
+ return reinterpret_cast<double*>(ptr);
26
+ }
27
+ inline void aligned_free_double(double* ptr) { free(ptr); }
28
+ #endif
29
+
30
+ // Generic pairwise symmetric computation helper
31
+ // ComputeFn signature: double(int i, int j, double* prev, double* curr)
32
+ template <typename ComputeFn>
33
+ inline pybind11::array_t<double> compute_all_distances(
34
+ int nseq,
35
+ int fmatsize,
36
+ pybind11::array_t<double>& dist_matrix,
37
+ ComputeFn&& compute_fn
38
+ ) {
39
+ auto buffer = dist_matrix.mutable_unchecked<2>();
40
+
41
+ #pragma omp parallel
42
+ {
43
+ double* prev = aligned_alloc_double(static_cast<size_t>(fmatsize));
44
+ double* curr = aligned_alloc_double(static_cast<size_t>(fmatsize));
45
+
46
+ #pragma omp for schedule(static)
47
+ for (int i = 0; i < nseq; i++) {
48
+ for (int j = i; j < nseq; j++) {
49
+ buffer(i, j) = compute_fn(i, j, prev, curr);
50
+ }
51
+ }
52
+
53
+ aligned_free_double(prev);
54
+ aligned_free_double(curr);
55
+ }
56
+
57
+ #pragma omp parallel for schedule(static)
58
+ for (int i = 0; i < nseq; i++) {
59
+ for (int j = i + 1; j < nseq; j++) {
60
+ buffer(j, i) = buffer(i, j);
61
+ }
62
+ }
63
+
64
+ return dist_matrix;
65
+ }
66
+
67
+ // Generic pairwise symmetric computation helper (no buffers)
68
+ // ComputeFn signature: double(int i, int j)
69
+ template <typename ComputeFn>
70
+ inline pybind11::array_t<double> compute_all_distances_simple(
71
+ int nseq,
72
+ pybind11::array_t<double>& dist_matrix,
73
+ ComputeFn&& compute_fn
74
+ ) {
75
+ auto buffer = dist_matrix.mutable_unchecked<2>();
76
+
77
+ #pragma omp parallel
78
+ {
79
+ #pragma omp for schedule(static)
80
+ for (int i = 0; i < nseq; i++) {
81
+ for (int j = i; j < nseq; j++) {
82
+ buffer(i, j) = compute_fn(i, j);
83
+ }
84
+ }
85
+ }
86
+
87
+ #pragma omp parallel for schedule(static)
88
+ for (int i = 0; i < nseq; ++i) {
89
+ for (int j = i + 1; j < nseq; ++j) {
90
+ buffer(j, i) = buffer(i, j);
91
+ }
92
+ }
93
+
94
+ return dist_matrix;
95
+ }
96
+
97
+ // Generic reference-sequence computation helper (no buffers)
98
+ // ComputeFn signature: double(int is, int rseq)
99
+ template <typename ComputeFn>
100
+ inline pybind11::array_t<double> compute_refseq_distances_simple(
101
+ int nseq,
102
+ int rseq1,
103
+ int rseq2,
104
+ pybind11::array_t<double>& refdist_matrix,
105
+ ComputeFn&& compute_fn
106
+ ) {
107
+ auto buffer = refdist_matrix.mutable_unchecked<2>();
108
+
109
+ #pragma omp parallel
110
+ {
111
+ #pragma omp for schedule(guided)
112
+ for (int rseq = rseq1; rseq < rseq2; rseq++) {
113
+ for (int is = 0; is < nseq; is++) {
114
+ buffer(is, rseq - rseq1) = (is == rseq) ? 0.0 : compute_fn(is, rseq);
115
+ }
116
+ }
117
+ }
118
+
119
+ return refdist_matrix;
120
+ }
121
+
122
+ // Generic reference-sequence computation helper (with DP buffers)
123
+ // ComputeFn signature: double(int is, int rseq, double* prev, double* curr)
124
+ template <typename ComputeFn>
125
+ inline pybind11::array_t<double> compute_refseq_distances_buffered(
126
+ int nseq,
127
+ int rseq1,
128
+ int rseq2,
129
+ int fmatsize,
130
+ pybind11::array_t<double>& refdist_matrix,
131
+ ComputeFn&& compute_fn
132
+ ) {
133
+ auto buffer = refdist_matrix.mutable_unchecked<2>();
134
+
135
+ #pragma omp parallel
136
+ {
137
+ double* prev = aligned_alloc_double(static_cast<size_t>(fmatsize));
138
+ double* curr = aligned_alloc_double(static_cast<size_t>(fmatsize));
139
+
140
+ #pragma omp for schedule(static)
141
+ for (int rseq = rseq1; rseq < rseq2; rseq++) {
142
+ for (int is = 0; is < nseq; is++) {
143
+ double cmpres = 0.0;
144
+ if (is != rseq) {
145
+ cmpres = compute_fn(is, rseq, prev, curr);
146
+ }
147
+ buffer(is, rseq - rseq1) = cmpres;
148
+ }
149
+ }
150
+
151
+ aligned_free_double(prev);
152
+ aligned_free_double(curr);
153
+ }
154
+
155
+ return refdist_matrix;
156
+ }
157
+
158
+ } // namespace dp_utils
159
+
160
+
@@ -0,0 +1,40 @@
1
+ #include <pybind11/pybind11.h>
2
+ #include "OMdistance.cpp"
3
+ #include "OMspellDistance.cpp"
4
+ #include "dist2matrix.cpp"
5
+ #include "DHDdistance.cpp"
6
+ #include "LCPdistance.cpp"
7
+ #include "LCPspellDistance.cpp"
8
+
9
+ namespace py = pybind11;
10
+
11
+ PYBIND11_MODULE(c_code, m) {
12
+ py::class_<dist2matrix>(m, "dist2matrix")
13
+ .def(py::init<int, py::array_t<int>, py::array_t<double>>())
14
+ .def("padding_matrix", &dist2matrix::padding_matrix);
15
+
16
+ py::class_<LCPdistance>(m, "LCPdistance")
17
+ .def(py::init<py::array_t<int>, int, int, py::array_t<int>>())
18
+ .def("compute_all_distances", &LCPdistance::compute_all_distances)
19
+ .def("compute_refseq_distances", &LCPdistance::compute_refseq_distances);
20
+
21
+ py::class_<LCPspellDistance>(m, "LCPspellDistance")
22
+ .def(py::init<py::array_t<int>, py::array_t<double>, py::array_t<int>, int, int, py::array_t<int>, double>())
23
+ .def("compute_all_distances", &LCPspellDistance::compute_all_distances)
24
+ .def("compute_refseq_distances", &LCPspellDistance::compute_refseq_distances);
25
+
26
+ py::class_<DHDdistance>(m, "DHDdistance")
27
+ .def(py::init<py::array_t<int>, py::array_t<double>, int, double, py::array_t<int>>())
28
+ .def("compute_all_distances", &DHDdistance::compute_all_distances)
29
+ .def("compute_refseq_distances", &DHDdistance::compute_refseq_distances);
30
+
31
+ py::class_<OMspellDistance>(m, "OMspellDistance")
32
+ .def(py::init<py::array_t<int>, py::array_t<double>, double, int, py::array_t<int>, double, py::array_t<double>, py::array_t<double>, py::array_t<int>>())
33
+ .def("compute_all_distances", &OMspellDistance::compute_all_distances)
34
+ .def("compute_refseq_distances", &OMspellDistance::compute_refseq_distances);
35
+
36
+ py::class_<OMdistance>(m, "OMdistance")
37
+ .def(py::init<py::array_t<int>, py::array_t<double>, double, int, py::array_t<int>, py::array_t<int>>())
38
+ .def("compute_all_distances", &OMdistance::compute_all_distances)
39
+ .def("compute_refseq_distances", &OMdistance::compute_refseq_distances);
40
+ }
@@ -0,0 +1,30 @@
1
"""
@Author  : Xinyi Li
@File    : setup.py
@Time    : 2025/3/30 18:55
@Desc    : Standalone build script for the ``c_code`` pybind11 extension.

Run it from the directory that contains this file, e.g.
``python setup.py build_ext --inplace``.
"""
from pathlib import Path

from setuptools import setup, Extension
import pybind11

# Directory containing this script. Paths are resolved from here so the build
# does not depend on one developer's home directory.
# NOTE(review): assumes module.cpp and the xsimd/ checkout sit next to this
# file, as they did under the previously hard-coded directory - confirm.
SRC_DIR = Path(__file__).resolve().parent

pybind11_include = pybind11.get_include()

ext_modules = [
    Extension(
        'c_code',
        # setuptools expects source paths relative to the setup script.
        ['module.cpp'],
        include_dirs=[
            pybind11_include,
            str(SRC_DIR / 'xsimd' / 'include'),
        ],
        language='c++',
        extra_compile_args=['-O2', '-std=c++17'],
    ),
]

setup(
    name='c_code',
    version='0.1',
    ext_modules=ext_modules,
    zip_safe=False,
)
@@ -0,0 +1,25 @@
1
+ #ifndef CC_CODE_UTILS_H
2
+ #define CC_CODE_UTILS_H
3
+
4
+ #include <cmath>
5
+
6
// Normalize a raw distance according to the scheme selected by `norm`.
//
//   rawdist : distance to normalize
//   maxdist : largest possible distance for the pair (used by schemes 2, 3, 4)
//   l1, l2  : lengths of the two sequences (used by schemes 1 and 2)
//   norm    : 0 (or any unlisted value) returns rawdist unchanged
//             1 divides by the larger of l1 and l2 (0 when neither is positive)
//             2 returns 1 - (maxdist - rawdist) / (2 * sqrt(l1) * sqrt(l2));
//               when l1 * l2 is 0 the result is 1 if l1 != l2, else 0
//             3 returns rawdist / maxdist (1 when maxdist is 0)
//             4 returns 2 * rawdist / (rawdist + maxdist) (1 when maxdist is 0)
//
// A raw distance of exactly 0 is returned as 0 under every scheme.
static inline double normalize_distance(double rawdist, double maxdist, double l1, double l2, int norm){
    if (rawdist == 0.0) {
        return 0.0;
    }

    if (norm == 1) {
        if (l1 > l2) {
            return rawdist / l1;
        }
        if (l2 > 0.0) {
            return rawdist / l2;
        }
        return 0.0;
    }

    if (norm == 2) {
        if (l1 * l2 == 0.0) {
            // At least one length is zero: the formula below would divide by 0.
            if (l1 != l2) {
                return 1.0;
            }
            return 0.0;
        }
        return 1.0 - ((maxdist - rawdist) / (2.0 * std::sqrt(l1) * std::sqrt(l2)));
    }

    if (norm == 3) {
        if (maxdist == 0.0) {
            return 1.0;
        }
        return rawdist / maxdist;
    }

    if (norm == 4) {
        if (maxdist == 0.0) {
            return 1.0;
        }
        return (2.0 * rawdist) / (rawdist + maxdist);
    }

    // norm == 0 and every unrecognised value: no normalization.
    return rawdist;
}
24
+
25
+ #endif //CC_CODE_UTILS_H
@@ -0,0 +1,6 @@
1
+ #include "xsimd/xsimd.hpp"
2
+
3
// Intentionally empty entry point: the program does no work at run time and
// exits with status 0.
int main() { return 0; }
+ }