scitex 2.5.0__py3-none-any.whl → 2.7.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (1091) hide show
  1. scitex/__init__.py +19 -8
  2. scitex/__main__.py +2 -1
  3. scitex/__version__.py +1 -1
  4. scitex/_optional_deps.py +13 -20
  5. scitex/ai/__init__.py +5 -0
  6. scitex/ai/_gen_ai/_Anthropic.py +3 -1
  7. scitex/ai/_gen_ai/_BaseGenAI.py +3 -2
  8. scitex/ai/_gen_ai/_DeepSeek.py +1 -1
  9. scitex/ai/_gen_ai/_Google.py +3 -2
  10. scitex/ai/_gen_ai/_Llama.py +4 -2
  11. scitex/ai/_gen_ai/_OpenAI.py +3 -1
  12. scitex/ai/_gen_ai/_PARAMS.py +1 -0
  13. scitex/ai/_gen_ai/_Perplexity.py +3 -1
  14. scitex/ai/_gen_ai/__init__.py +1 -0
  15. scitex/ai/_gen_ai/_format_output_func.py +3 -1
  16. scitex/ai/classification/CrossValidationExperiment.py +8 -14
  17. scitex/ai/classification/examples/timeseries_cv_demo.py +128 -112
  18. scitex/ai/classification/reporters/_BaseClassificationReporter.py +2 -0
  19. scitex/ai/classification/reporters/_ClassificationReporter.py +30 -45
  20. scitex/ai/classification/reporters/_MultiClassificationReporter.py +8 -11
  21. scitex/ai/classification/reporters/_SingleClassificationReporter.py +126 -182
  22. scitex/ai/classification/reporters/__init__.py +1 -1
  23. scitex/ai/classification/reporters/reporter_utils/_Plotter.py +213 -119
  24. scitex/ai/classification/reporters/reporter_utils/__init__.py +28 -36
  25. scitex/ai/classification/reporters/reporter_utils/aggregation.py +125 -143
  26. scitex/ai/classification/reporters/reporter_utils/data_models.py +128 -120
  27. scitex/ai/classification/reporters/reporter_utils/reporting.py +507 -340
  28. scitex/ai/classification/reporters/reporter_utils/storage.py +4 -1
  29. scitex/ai/classification/reporters/reporter_utils/validation.py +141 -154
  30. scitex/ai/classification/timeseries/_TimeSeriesBlockingSplit.py +204 -129
  31. scitex/ai/classification/timeseries/_TimeSeriesCalendarSplit.py +215 -171
  32. scitex/ai/classification/timeseries/_TimeSeriesMetadata.py +17 -17
  33. scitex/ai/classification/timeseries/_TimeSeriesSlidingWindowSplit.py +67 -143
  34. scitex/ai/classification/timeseries/_TimeSeriesSlidingWindowSplit_v01-not-using-n_splits.py +67 -143
  35. scitex/ai/classification/timeseries/_TimeSeriesStrategy.py +12 -13
  36. scitex/ai/classification/timeseries/_TimeSeriesStratifiedSplit.py +231 -144
  37. scitex/ai/classification/timeseries/__init__.py +2 -4
  38. scitex/ai/classification/timeseries/_normalize_timestamp.py +3 -0
  39. scitex/ai/clustering/_pca.py +0 -1
  40. scitex/ai/clustering/_umap.py +1 -2
  41. scitex/ai/feature_extraction/__init__.py +10 -8
  42. scitex/ai/feature_extraction/vit.py +0 -1
  43. scitex/ai/feature_selection/feature_selection.py +3 -8
  44. scitex/ai/metrics/_calc_conf_mat.py +2 -0
  45. scitex/ai/metrics/_calc_feature_importance.py +3 -7
  46. scitex/ai/metrics/_calc_pre_rec_auc.py +5 -5
  47. scitex/ai/metrics/_calc_roc_auc.py +4 -2
  48. scitex/ai/metrics/_calc_seizure_prediction_metrics.py +35 -20
  49. scitex/ai/metrics/_calc_silhouette_score.py +1 -3
  50. scitex/ai/optim/Ranger_Deep_Learning_Optimizer/ranger/ranger.py +0 -3
  51. scitex/ai/optim/Ranger_Deep_Learning_Optimizer/ranger/ranger2020.py +0 -3
  52. scitex/ai/optim/Ranger_Deep_Learning_Optimizer/ranger/ranger913A.py +0 -3
  53. scitex/ai/optim/_optimizers.py +1 -1
  54. scitex/ai/plt/__init__.py +6 -1
  55. scitex/ai/plt/_plot_feature_importance.py +1 -3
  56. scitex/ai/plt/_plot_learning_curve.py +9 -24
  57. scitex/ai/plt/_plot_optuna_study.py +4 -3
  58. scitex/ai/plt/_plot_pre_rec_curve.py +9 -15
  59. scitex/ai/plt/_plot_roc_curve.py +6 -8
  60. scitex/ai/plt/_stx_conf_mat.py +121 -122
  61. scitex/ai/sampling/undersample.py +3 -2
  62. scitex/ai/sklearn/__init__.py +2 -2
  63. scitex/ai/training/_LearningCurveLogger.py +23 -10
  64. scitex/ai/utils/_check_params.py +0 -1
  65. scitex/benchmark/__init__.py +15 -25
  66. scitex/benchmark/benchmark.py +124 -117
  67. scitex/benchmark/monitor.py +117 -107
  68. scitex/benchmark/profiler.py +61 -58
  69. scitex/bridge/__init__.py +110 -0
  70. scitex/bridge/_helpers.py +149 -0
  71. scitex/bridge/_plt_vis.py +529 -0
  72. scitex/bridge/_protocol.py +283 -0
  73. scitex/bridge/_stats_plt.py +261 -0
  74. scitex/bridge/_stats_vis.py +265 -0
  75. scitex/browser/__init__.py +0 -2
  76. scitex/browser/auth/__init__.py +0 -0
  77. scitex/browser/auth/google.py +16 -11
  78. scitex/browser/automation/CookieHandler.py +2 -3
  79. scitex/browser/collaboration/__init__.py +3 -0
  80. scitex/browser/collaboration/auth_helpers.py +3 -1
  81. scitex/browser/collaboration/collaborative_agent.py +2 -0
  82. scitex/browser/collaboration/interactive_panel.py +2 -2
  83. scitex/browser/collaboration/shared_session.py +20 -11
  84. scitex/browser/collaboration/standard_interactions.py +1 -0
  85. scitex/browser/core/BrowserMixin.py +12 -30
  86. scitex/browser/core/ChromeProfileManager.py +9 -24
  87. scitex/browser/debugging/_browser_logger.py +15 -25
  88. scitex/browser/debugging/_failure_capture.py +9 -2
  89. scitex/browser/debugging/_highlight_element.py +15 -6
  90. scitex/browser/debugging/_show_grid.py +5 -6
  91. scitex/browser/debugging/_sync_session.py +4 -3
  92. scitex/browser/debugging/_test_monitor.py +14 -5
  93. scitex/browser/debugging/_visual_cursor.py +46 -35
  94. scitex/browser/interaction/click_center.py +4 -3
  95. scitex/browser/interaction/click_with_fallbacks.py +7 -10
  96. scitex/browser/interaction/close_popups.py +79 -66
  97. scitex/browser/interaction/fill_with_fallbacks.py +8 -8
  98. scitex/browser/pdf/__init__.py +3 -1
  99. scitex/browser/pdf/click_download_for_chrome_pdf_viewer.py +11 -10
  100. scitex/browser/pdf/detect_chrome_pdf_viewer.py +3 -6
  101. scitex/browser/remote/CaptchaHandler.py +109 -96
  102. scitex/browser/remote/ZenRowsAPIClient.py +91 -97
  103. scitex/browser/remote/ZenRowsBrowserManager.py +138 -112
  104. scitex/browser/stealth/HumanBehavior.py +4 -9
  105. scitex/browser/stealth/StealthManager.py +11 -26
  106. scitex/capture/__init__.py +17 -17
  107. scitex/capture/__main__.py +2 -3
  108. scitex/capture/capture.py +23 -51
  109. scitex/capture/cli.py +14 -39
  110. scitex/capture/gif.py +5 -9
  111. scitex/capture/mcp_server.py +7 -20
  112. scitex/capture/session.py +4 -3
  113. scitex/capture/utils.py +18 -53
  114. scitex/cli/__init__.py +1 -1
  115. scitex/cli/cloud.py +158 -116
  116. scitex/cli/config.py +224 -0
  117. scitex/cli/main.py +41 -40
  118. scitex/cli/scholar.py +60 -27
  119. scitex/cli/security.py +14 -20
  120. scitex/cli/web.py +87 -90
  121. scitex/cli/writer.py +51 -45
  122. scitex/cloud/__init__.py +14 -11
  123. scitex/cloud/_matplotlib_hook.py +6 -6
  124. scitex/config/README.md +313 -0
  125. scitex/config/{PriorityConfig.py → _PriorityConfig.py} +114 -17
  126. scitex/config/_ScitexConfig.py +319 -0
  127. scitex/config/__init__.py +41 -9
  128. scitex/config/_paths.py +325 -0
  129. scitex/config/default.yaml +81 -0
  130. scitex/context/_suppress_output.py +2 -3
  131. scitex/db/_BaseMixins/_BaseBackupMixin.py +3 -1
  132. scitex/db/_BaseMixins/_BaseBatchMixin.py +3 -1
  133. scitex/db/_BaseMixins/_BaseBlobMixin.py +3 -1
  134. scitex/db/_BaseMixins/_BaseImportExportMixin.py +1 -3
  135. scitex/db/_BaseMixins/_BaseIndexMixin.py +3 -1
  136. scitex/db/_BaseMixins/_BaseMaintenanceMixin.py +1 -3
  137. scitex/db/_BaseMixins/_BaseQueryMixin.py +3 -1
  138. scitex/db/_BaseMixins/_BaseRowMixin.py +3 -1
  139. scitex/db/_BaseMixins/_BaseTableMixin.py +3 -1
  140. scitex/db/_BaseMixins/_BaseTransactionMixin.py +1 -3
  141. scitex/db/_BaseMixins/__init__.py +1 -1
  142. scitex/db/__init__.py +9 -1
  143. scitex/db/__main__.py +8 -21
  144. scitex/db/_check_health.py +15 -31
  145. scitex/db/_delete_duplicates.py +7 -4
  146. scitex/db/_inspect.py +22 -38
  147. scitex/db/_inspect_optimized.py +89 -85
  148. scitex/db/_postgresql/_PostgreSQL.py +0 -1
  149. scitex/db/_postgresql/_PostgreSQLMixins/_BlobMixin.py +3 -1
  150. scitex/db/_postgresql/_PostgreSQLMixins/_ConnectionMixin.py +1 -3
  151. scitex/db/_postgresql/_PostgreSQLMixins/_ImportExportMixin.py +1 -3
  152. scitex/db/_postgresql/_PostgreSQLMixins/_MaintenanceMixin.py +1 -4
  153. scitex/db/_postgresql/_PostgreSQLMixins/_QueryMixin.py +3 -3
  154. scitex/db/_postgresql/_PostgreSQLMixins/_RowMixin.py +3 -1
  155. scitex/db/_postgresql/_PostgreSQLMixins/_TransactionMixin.py +1 -3
  156. scitex/db/_postgresql/__init__.py +1 -1
  157. scitex/db/_sqlite3/_SQLite3.py +2 -4
  158. scitex/db/_sqlite3/_SQLite3Mixins/_ArrayMixin.py +11 -12
  159. scitex/db/_sqlite3/_SQLite3Mixins/_ArrayMixin_v01-need-_hash-col.py +19 -14
  160. scitex/db/_sqlite3/_SQLite3Mixins/_BatchMixin.py +3 -1
  161. scitex/db/_sqlite3/_SQLite3Mixins/_BlobMixin.py +7 -7
  162. scitex/db/_sqlite3/_SQLite3Mixins/_ColumnMixin.py +118 -111
  163. scitex/db/_sqlite3/_SQLite3Mixins/_ConnectionMixin.py +8 -10
  164. scitex/db/_sqlite3/_SQLite3Mixins/_GitMixin.py +17 -45
  165. scitex/db/_sqlite3/_SQLite3Mixins/_ImportExportMixin.py +1 -3
  166. scitex/db/_sqlite3/_SQLite3Mixins/_IndexMixin.py +3 -1
  167. scitex/db/_sqlite3/_SQLite3Mixins/_QueryMixin.py +3 -4
  168. scitex/db/_sqlite3/_SQLite3Mixins/_RowMixin.py +9 -9
  169. scitex/db/_sqlite3/_SQLite3Mixins/_TableMixin.py +18 -11
  170. scitex/db/_sqlite3/_SQLite3Mixins/__init__.py +1 -0
  171. scitex/db/_sqlite3/__init__.py +1 -1
  172. scitex/db/_sqlite3/_delete_duplicates.py +13 -11
  173. scitex/decorators/__init__.py +29 -4
  174. scitex/decorators/_auto_order.py +43 -43
  175. scitex/decorators/_batch_fn.py +12 -6
  176. scitex/decorators/_cache_disk.py +8 -9
  177. scitex/decorators/_cache_disk_async.py +8 -7
  178. scitex/decorators/_combined.py +19 -13
  179. scitex/decorators/_converters.py +16 -3
  180. scitex/decorators/_deprecated.py +32 -22
  181. scitex/decorators/_numpy_fn.py +18 -4
  182. scitex/decorators/_pandas_fn.py +17 -5
  183. scitex/decorators/_signal_fn.py +17 -3
  184. scitex/decorators/_torch_fn.py +32 -15
  185. scitex/decorators/_xarray_fn.py +23 -9
  186. scitex/dev/_analyze_code_flow.py +0 -2
  187. scitex/dict/_DotDict.py +15 -19
  188. scitex/dict/_flatten.py +1 -0
  189. scitex/dict/_listed_dict.py +1 -0
  190. scitex/dict/_pop_keys.py +1 -0
  191. scitex/dict/_replace.py +1 -0
  192. scitex/dict/_safe_merge.py +1 -0
  193. scitex/dict/_to_str.py +2 -3
  194. scitex/dsp/__init__.py +13 -4
  195. scitex/dsp/_crop.py +3 -1
  196. scitex/dsp/_detect_ripples.py +3 -1
  197. scitex/dsp/_modulation_index.py +3 -1
  198. scitex/dsp/_time.py +3 -1
  199. scitex/dsp/_wavelet.py +0 -1
  200. scitex/dsp/example.py +0 -5
  201. scitex/dsp/filt.py +4 -0
  202. scitex/dsp/utils/__init__.py +4 -1
  203. scitex/dsp/utils/pac.py +3 -3
  204. scitex/dt/_normalize_timestamp.py +4 -1
  205. scitex/errors.py +3 -6
  206. scitex/etc/__init__.py +1 -1
  207. scitex/gen/_DimHandler.py +6 -6
  208. scitex/gen/__init__.py +5 -1
  209. scitex/gen/_deprecated_close.py +1 -0
  210. scitex/gen/_deprecated_start.py +5 -3
  211. scitex/gen/_detect_environment.py +44 -41
  212. scitex/gen/_detect_notebook_path.py +51 -47
  213. scitex/gen/_embed.py +1 -1
  214. scitex/gen/_get_notebook_path.py +81 -62
  215. scitex/gen/_inspect_module.py +0 -1
  216. scitex/gen/_norm.py +16 -7
  217. scitex/gen/_norm_cache.py +78 -65
  218. scitex/gen/_print_config.py +0 -3
  219. scitex/gen/_src.py +2 -3
  220. scitex/gen/_title_case.py +3 -2
  221. scitex/gen/_to_even.py +8 -8
  222. scitex/gen/_transpose.py +3 -3
  223. scitex/gen/misc.py +0 -3
  224. scitex/gists/_SigMacro_processFigure_S.py +2 -2
  225. scitex/gists/_SigMacro_toBlue.py +2 -2
  226. scitex/gists/__init__.py +4 -1
  227. scitex/git/_branch.py +19 -11
  228. scitex/git/_clone.py +23 -15
  229. scitex/git/_commit.py +10 -12
  230. scitex/git/_init.py +15 -38
  231. scitex/git/_remote.py +9 -3
  232. scitex/git/_result.py +3 -0
  233. scitex/git/_retry.py +2 -5
  234. scitex/git/_types.py +4 -0
  235. scitex/git/_validation.py +8 -8
  236. scitex/git/_workflow.py +4 -4
  237. scitex/io/__init__.py +2 -1
  238. scitex/io/_glob.py +2 -2
  239. scitex/io/_json2md.py +3 -3
  240. scitex/io/_load.py +6 -8
  241. scitex/io/_load_cache.py +71 -71
  242. scitex/io/_load_configs.py +2 -3
  243. scitex/io/_load_modules/_H5Explorer.py +6 -12
  244. scitex/io/_load_modules/_ZarrExplorer.py +3 -3
  245. scitex/io/_load_modules/_bibtex.py +62 -63
  246. scitex/io/_load_modules/_canvas.py +4 -9
  247. scitex/io/_load_modules/_catboost.py +7 -2
  248. scitex/io/_load_modules/_hdf5.py +2 -0
  249. scitex/io/_load_modules/_image.py +5 -1
  250. scitex/io/_load_modules/_matlab.py +3 -1
  251. scitex/io/_load_modules/_optuna.py +0 -1
  252. scitex/io/_load_modules/_pdf.py +38 -29
  253. scitex/io/_load_modules/_sqlite3.py +1 -0
  254. scitex/io/_load_modules/_txt.py +2 -0
  255. scitex/io/_load_modules/_xml.py +9 -9
  256. scitex/io/_load_modules/_zarr.py +12 -10
  257. scitex/io/_metadata.py +76 -37
  258. scitex/io/_qr_utils.py +18 -13
  259. scitex/io/_save.py +220 -63
  260. scitex/io/_save_modules/__init__.py +7 -2
  261. scitex/io/_save_modules/_bibtex.py +66 -61
  262. scitex/io/_save_modules/_canvas.py +5 -6
  263. scitex/io/_save_modules/_catboost.py +2 -2
  264. scitex/io/_save_modules/_csv.py +4 -4
  265. scitex/io/_save_modules/_excel.py +5 -9
  266. scitex/io/_save_modules/_hdf5.py +9 -21
  267. scitex/io/_save_modules/_html.py +5 -5
  268. scitex/io/_save_modules/_image.py +105 -8
  269. scitex/io/_save_modules/_joblib.py +2 -2
  270. scitex/io/_save_modules/_json.py +51 -6
  271. scitex/io/_save_modules/_listed_dfs_as_csv.py +2 -1
  272. scitex/io/_save_modules/_listed_scalars_as_csv.py +2 -1
  273. scitex/io/_save_modules/_matlab.py +2 -2
  274. scitex/io/_save_modules/_numpy.py +6 -8
  275. scitex/io/_save_modules/_pickle.py +4 -4
  276. scitex/io/_save_modules/_plotly.py +3 -3
  277. scitex/io/_save_modules/_tex.py +23 -25
  278. scitex/io/_save_modules/_text.py +2 -2
  279. scitex/io/_save_modules/_yaml.py +9 -9
  280. scitex/io/_save_modules/_zarr.py +15 -15
  281. scitex/io/utils/__init__.py +2 -1
  282. scitex/io/utils/h5_to_zarr.py +173 -155
  283. scitex/linalg/__init__.py +1 -1
  284. scitex/linalg/_geometric_median.py +4 -3
  285. scitex/logging/_Tee.py +5 -7
  286. scitex/logging/__init__.py +18 -19
  287. scitex/logging/_config.py +4 -1
  288. scitex/logging/_context.py +6 -5
  289. scitex/logging/_formatters.py +2 -3
  290. scitex/logging/_handlers.py +19 -20
  291. scitex/logging/_levels.py +9 -17
  292. scitex/logging/_logger.py +74 -15
  293. scitex/logging/_print_capture.py +17 -17
  294. scitex/nn/_BNet.py +1 -3
  295. scitex/nn/_Filters.py +6 -2
  296. scitex/nn/_ModulationIndex.py +3 -1
  297. scitex/nn/_PAC.py +3 -2
  298. scitex/nn/_PSD.py +0 -1
  299. scitex/nn/__init__.py +16 -3
  300. scitex/path/_clean.py +10 -8
  301. scitex/path/_find.py +1 -1
  302. scitex/path/_get_spath.py +1 -2
  303. scitex/path/_mk_spath.py +1 -1
  304. scitex/path/_symlink.py +5 -10
  305. scitex/pd/__init__.py +4 -1
  306. scitex/pd/_force_df.py +24 -24
  307. scitex/pd/_get_unique.py +1 -0
  308. scitex/pd/_merge_columns.py +1 -1
  309. scitex/pd/_round.py +11 -7
  310. scitex/pd/_to_xy.py +0 -1
  311. scitex/plt/REQUESTS.md +191 -0
  312. scitex/plt/__init__.py +185 -87
  313. scitex/plt/_subplots/_AxesWrapper.py +22 -6
  314. scitex/plt/_subplots/_AxisWrapper.py +100 -39
  315. scitex/plt/_subplots/_AxisWrapperMixins/_AdjustmentMixin.py +74 -52
  316. scitex/plt/_subplots/_AxisWrapperMixins/_MatplotlibPlotMixin.py +183 -73
  317. scitex/plt/_subplots/_AxisWrapperMixins/_SeabornMixin.py +61 -45
  318. scitex/plt/_subplots/_AxisWrapperMixins/_TrackingMixin.py +26 -14
  319. scitex/plt/_subplots/_AxisWrapperMixins/_UnitAwareMixin.py +80 -73
  320. scitex/plt/_subplots/_FigWrapper.py +93 -60
  321. scitex/plt/_subplots/_SubplotsWrapper.py +135 -68
  322. scitex/plt/_subplots/__init__.py +10 -0
  323. scitex/plt/_subplots/_export_as_csv.py +89 -47
  324. scitex/plt/_subplots/_export_as_csv_formatters/__init__.py +1 -0
  325. scitex/plt/_subplots/_export_as_csv_formatters/_format_annotate.py +6 -4
  326. scitex/plt/_subplots/_export_as_csv_formatters/_format_bar.py +88 -38
  327. scitex/plt/_subplots/_export_as_csv_formatters/_format_barh.py +25 -31
  328. scitex/plt/_subplots/_export_as_csv_formatters/_format_boxplot.py +53 -23
  329. scitex/plt/_subplots/_export_as_csv_formatters/_format_contour.py +38 -25
  330. scitex/plt/_subplots/_export_as_csv_formatters/_format_contourf.py +17 -9
  331. scitex/plt/_subplots/_export_as_csv_formatters/_format_errorbar.py +70 -124
  332. scitex/plt/_subplots/_export_as_csv_formatters/_format_eventplot.py +12 -10
  333. scitex/plt/_subplots/_export_as_csv_formatters/_format_fill.py +31 -17
  334. scitex/plt/_subplots/_export_as_csv_formatters/_format_fill_between.py +33 -21
  335. scitex/plt/_subplots/_export_as_csv_formatters/_format_hexbin.py +14 -4
  336. scitex/plt/_subplots/_export_as_csv_formatters/_format_hist.py +43 -29
  337. scitex/plt/_subplots/_export_as_csv_formatters/_format_hist2d.py +14 -4
  338. scitex/plt/_subplots/_export_as_csv_formatters/_format_imshow.py +27 -11
  339. scitex/plt/_subplots/_export_as_csv_formatters/_format_imshow2d.py +7 -5
  340. scitex/plt/_subplots/_export_as_csv_formatters/_format_matshow.py +9 -7
  341. scitex/plt/_subplots/_export_as_csv_formatters/_format_pie.py +15 -6
  342. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot.py +85 -46
  343. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_box.py +52 -27
  344. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_imshow.py +1 -0
  345. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_kde.py +16 -17
  346. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_scatter.py +7 -5
  347. scitex/plt/_subplots/_export_as_csv_formatters/_format_quiver.py +10 -8
  348. scitex/plt/_subplots/_export_as_csv_formatters/_format_scatter.py +17 -6
  349. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_barplot.py +43 -26
  350. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_boxplot.py +68 -47
  351. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_heatmap.py +52 -64
  352. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_histplot.py +55 -50
  353. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_jointplot.py +9 -11
  354. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_kdeplot.py +63 -29
  355. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_lineplot.py +4 -4
  356. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_pairplot.py +6 -4
  357. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_scatterplot.py +44 -40
  358. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_stripplot.py +46 -39
  359. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_swarmplot.py +46 -39
  360. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_violinplot.py +75 -94
  361. scitex/plt/_subplots/_export_as_csv_formatters/_format_stem.py +12 -3
  362. scitex/plt/_subplots/_export_as_csv_formatters/_format_step.py +12 -3
  363. scitex/plt/_subplots/_export_as_csv_formatters/_format_streamplot.py +10 -8
  364. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_conf_mat.py +17 -15
  365. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_ecdf.py +10 -9
  366. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_fillv.py +35 -31
  367. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_heatmap.py +18 -18
  368. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_image.py +24 -18
  369. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_joyplot.py +9 -7
  370. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_line.py +34 -23
  371. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_mean_ci.py +15 -13
  372. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_mean_std.py +12 -10
  373. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_median_iqr.py +15 -13
  374. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_raster.py +11 -9
  375. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_rectangle.py +84 -56
  376. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_scatter_hist.py +35 -32
  377. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_shaded_line.py +46 -30
  378. scitex/plt/_subplots/_export_as_csv_formatters/_format_stx_violin.py +51 -51
  379. scitex/plt/_subplots/_export_as_csv_formatters/_format_text.py +32 -31
  380. scitex/plt/_subplots/_export_as_csv_formatters/_format_violin.py +34 -31
  381. scitex/plt/_subplots/_export_as_csv_formatters/_format_violinplot.py +44 -37
  382. scitex/plt/_subplots/_export_as_csv_formatters/verify_formatters.py +91 -74
  383. scitex/plt/_tpl.py +6 -5
  384. scitex/plt/ax/_plot/__init__.py +24 -0
  385. scitex/plt/ax/_plot/_add_fitted_line.py +12 -11
  386. scitex/plt/ax/_plot/_plot_circular_hist.py +3 -1
  387. scitex/plt/ax/_plot/_plot_statistical_shaded_line.py +25 -19
  388. scitex/plt/ax/_plot/_stx_conf_mat.py +6 -3
  389. scitex/plt/ax/_plot/_stx_ecdf.py +5 -3
  390. scitex/plt/ax/_plot/_stx_fillv.py +4 -2
  391. scitex/plt/ax/_plot/_stx_heatmap.py +7 -4
  392. scitex/plt/ax/_plot/_stx_image.py +7 -5
  393. scitex/plt/ax/_plot/_stx_joyplot.py +32 -10
  394. scitex/plt/ax/_plot/_stx_raster.py +26 -11
  395. scitex/plt/ax/_plot/_stx_rectangle.py +2 -2
  396. scitex/plt/ax/_plot/_stx_shaded_line.py +15 -11
  397. scitex/plt/ax/_plot/_stx_violin.py +3 -1
  398. scitex/plt/ax/_style/_add_marginal_ax.py +6 -4
  399. scitex/plt/ax/_style/_auto_scale_axis.py +14 -10
  400. scitex/plt/ax/_style/_extend.py +3 -1
  401. scitex/plt/ax/_style/_force_aspect.py +5 -3
  402. scitex/plt/ax/_style/_format_units.py +2 -2
  403. scitex/plt/ax/_style/_hide_spines.py +5 -1
  404. scitex/plt/ax/_style/_map_ticks.py +5 -3
  405. scitex/plt/ax/_style/_rotate_labels.py +5 -4
  406. scitex/plt/ax/_style/_rotate_labels_v01.py +73 -63
  407. scitex/plt/ax/_style/_set_log_scale.py +120 -85
  408. scitex/plt/ax/_style/_set_meta.py +99 -76
  409. scitex/plt/ax/_style/_set_supxyt.py +33 -16
  410. scitex/plt/ax/_style/_set_xyt.py +27 -18
  411. scitex/plt/ax/_style/_share_axes.py +15 -5
  412. scitex/plt/ax/_style/_show_spines.py +58 -57
  413. scitex/plt/ax/_style/_style_barplot.py +1 -1
  414. scitex/plt/ax/_style/_style_boxplot.py +25 -14
  415. scitex/plt/ax/_style/_style_errorbar.py +0 -0
  416. scitex/plt/ax/_style/_style_scatter.py +1 -1
  417. scitex/plt/ax/_style/_style_suptitles.py +3 -3
  418. scitex/plt/ax/_style/_style_violinplot.py +8 -2
  419. scitex/plt/color/__init__.py +34 -2
  420. scitex/plt/color/_add_hue_col.py +1 -0
  421. scitex/plt/color/_colors.py +0 -1
  422. scitex/plt/color/_get_colors_from_conf_matap.py +3 -1
  423. scitex/plt/color/_vizualize_colors.py +0 -1
  424. scitex/plt/docs/FIGURE_ARCHITECTURE.md +155 -97
  425. scitex/plt/gallery/README.md +75 -0
  426. scitex/plt/gallery/__init__.py +29 -0
  427. scitex/plt/gallery/_generate.py +153 -0
  428. scitex/plt/gallery/_plots.py +594 -0
  429. scitex/plt/gallery/_registry.py +153 -0
  430. scitex/plt/styles/__init__.py +9 -9
  431. scitex/plt/styles/_plot_defaults.py +62 -61
  432. scitex/plt/styles/_plot_postprocess.py +126 -77
  433. scitex/plt/styles/_style_loader.py +0 -0
  434. scitex/plt/styles/presets.py +43 -18
  435. scitex/plt/templates/research-master/scitex/vis/gallery/area/fill_between.json +110 -0
  436. scitex/plt/templates/research-master/scitex/vis/gallery/area/fill_betweenx.json +88 -0
  437. scitex/plt/templates/research-master/scitex/vis/gallery/area/stx_fill_between.json +103 -0
  438. scitex/plt/templates/research-master/scitex/vis/gallery/area/stx_fillv.json +106 -0
  439. scitex/plt/templates/research-master/scitex/vis/gallery/categorical/bar.json +92 -0
  440. scitex/plt/templates/research-master/scitex/vis/gallery/categorical/barh.json +92 -0
  441. scitex/plt/templates/research-master/scitex/vis/gallery/categorical/boxplot.json +92 -0
  442. scitex/plt/templates/research-master/scitex/vis/gallery/categorical/stx_bar.json +84 -0
  443. scitex/plt/templates/research-master/scitex/vis/gallery/categorical/stx_barh.json +84 -0
  444. scitex/plt/templates/research-master/scitex/vis/gallery/categorical/stx_box.json +83 -0
  445. scitex/plt/templates/research-master/scitex/vis/gallery/categorical/stx_boxplot.json +93 -0
  446. scitex/plt/templates/research-master/scitex/vis/gallery/categorical/stx_violin.json +91 -0
  447. scitex/plt/templates/research-master/scitex/vis/gallery/categorical/stx_violinplot.json +91 -0
  448. scitex/plt/templates/research-master/scitex/vis/gallery/categorical/violinplot.json +91 -0
  449. scitex/plt/templates/research-master/scitex/vis/gallery/contour/contour.json +97 -0
  450. scitex/plt/templates/research-master/scitex/vis/gallery/contour/contourf.json +98 -0
  451. scitex/plt/templates/research-master/scitex/vis/gallery/contour/stx_contour.json +84 -0
  452. scitex/plt/templates/research-master/scitex/vis/gallery/distribution/hist.json +101 -0
  453. scitex/plt/templates/research-master/scitex/vis/gallery/distribution/hist2d.json +96 -0
  454. scitex/plt/templates/research-master/scitex/vis/gallery/distribution/stx_ecdf.json +95 -0
  455. scitex/plt/templates/research-master/scitex/vis/gallery/distribution/stx_joyplot.json +95 -0
  456. scitex/plt/templates/research-master/scitex/vis/gallery/distribution/stx_kde.json +93 -0
  457. scitex/plt/templates/research-master/scitex/vis/gallery/grid/imshow.json +95 -0
  458. scitex/plt/templates/research-master/scitex/vis/gallery/grid/matshow.json +95 -0
  459. scitex/plt/templates/research-master/scitex/vis/gallery/grid/stx_conf_mat.json +83 -0
  460. scitex/plt/templates/research-master/scitex/vis/gallery/grid/stx_heatmap.json +92 -0
  461. scitex/plt/templates/research-master/scitex/vis/gallery/grid/stx_image.json +121 -0
  462. scitex/plt/templates/research-master/scitex/vis/gallery/grid/stx_imshow.json +84 -0
  463. scitex/plt/templates/research-master/scitex/vis/gallery/line/plot.json +110 -0
  464. scitex/plt/templates/research-master/scitex/vis/gallery/line/step.json +92 -0
  465. scitex/plt/templates/research-master/scitex/vis/gallery/line/stx_line.json +95 -0
  466. scitex/plt/templates/research-master/scitex/vis/gallery/line/stx_shaded_line.json +96 -0
  467. scitex/plt/templates/research-master/scitex/vis/gallery/scatter/hexbin.json +95 -0
  468. scitex/plt/templates/research-master/scitex/vis/gallery/scatter/scatter.json +95 -0
  469. scitex/plt/templates/research-master/scitex/vis/gallery/scatter/stem.json +92 -0
  470. scitex/plt/templates/research-master/scitex/vis/gallery/scatter/stx_scatter.json +84 -0
  471. scitex/plt/templates/research-master/scitex/vis/gallery/special/pie.json +94 -0
  472. scitex/plt/templates/research-master/scitex/vis/gallery/special/stx_raster.json +109 -0
  473. scitex/plt/templates/research-master/scitex/vis/gallery/special/stx_rectangle.json +108 -0
  474. scitex/plt/templates/research-master/scitex/vis/gallery/statistical/errorbar.json +93 -0
  475. scitex/plt/templates/research-master/scitex/vis/gallery/statistical/stx_errorbar.json +84 -0
  476. scitex/plt/templates/research-master/scitex/vis/gallery/statistical/stx_mean_ci.json +96 -0
  477. scitex/plt/templates/research-master/scitex/vis/gallery/statistical/stx_mean_std.json +96 -0
  478. scitex/plt/templates/research-master/scitex/vis/gallery/statistical/stx_median_iqr.json +96 -0
  479. scitex/plt/templates/research-master/scitex/vis/gallery/vector/quiver.json +99 -0
  480. scitex/plt/templates/research-master/scitex/vis/gallery/vector/streamplot.json +100 -0
  481. scitex/plt/utils/__init__.py +29 -2
  482. scitex/plt/utils/_close.py +8 -3
  483. scitex/plt/utils/_collect_figure_metadata.py +3031 -265
  484. scitex/plt/utils/_colorbar.py +15 -17
  485. scitex/plt/utils/_configure_mpl.py +22 -14
  486. scitex/plt/utils/_crop.py +60 -27
  487. scitex/plt/utils/_csv_column_naming.py +123 -72
  488. scitex/plt/utils/_dimension_viewer.py +7 -19
  489. scitex/plt/utils/_figure_from_axes_mm.py +70 -16
  490. scitex/plt/utils/_figure_mm.py +3 -2
  491. scitex/plt/utils/_get_actual_font.py +5 -4
  492. scitex/plt/utils/_histogram_utils.py +52 -48
  493. scitex/plt/utils/_is_valid_axis.py +19 -13
  494. scitex/plt/utils/_mk_colorbar.py +3 -3
  495. scitex/plt/utils/_scientific_captions.py +202 -139
  496. scitex/plt/utils/_scitex_config.py +98 -98
  497. scitex/plt/utils/_units.py +0 -0
  498. scitex/plt/utils/metadata/__init__.py +36 -0
  499. scitex/plt/utils/metadata/_artist_extraction.py +119 -0
  500. scitex/plt/utils/metadata/_axes_metadata.py +93 -0
  501. scitex/plt/utils/metadata/_collection_artists.py +292 -0
  502. scitex/plt/utils/metadata/_core.py +208 -0
  503. scitex/plt/utils/metadata/_csv_column_extraction.py +186 -0
  504. scitex/plt/utils/metadata/_csv_hash.py +115 -0
  505. scitex/plt/utils/metadata/_csv_verification.py +95 -0
  506. scitex/plt/utils/metadata/_data_linkage.py +263 -0
  507. scitex/plt/utils/metadata/_dimensions.py +239 -0
  508. scitex/plt/utils/metadata/_figure_metadata.py +58 -0
  509. scitex/plt/utils/metadata/_image_text_artists.py +168 -0
  510. scitex/plt/utils/metadata/_label_parsing.py +82 -0
  511. scitex/plt/utils/metadata/_legend_extraction.py +120 -0
  512. scitex/plt/utils/metadata/_line_artists.py +367 -0
  513. scitex/plt/utils/metadata/_line_semantic_handling.py +173 -0
  514. scitex/plt/utils/metadata/_patch_artists.py +211 -0
  515. scitex/plt/utils/metadata/_plot_content.py +26 -0
  516. scitex/plt/utils/metadata/_plot_type_detection.py +184 -0
  517. scitex/plt/utils/metadata/_precision.py +134 -0
  518. scitex/plt/utils/metadata/_precision_config.py +68 -0
  519. scitex/plt/utils/metadata/_precision_sections.py +211 -0
  520. scitex/plt/utils/metadata/_recipe_extraction.py +267 -0
  521. scitex/plt/utils/metadata/_style_parsing.py +174 -0
  522. scitex/repro/_RandomStateManager.py +33 -38
  523. scitex/repro/__init__.py +16 -7
  524. scitex/repro/_gen_ID.py +7 -9
  525. scitex/repro/_gen_timestamp.py +7 -6
  526. scitex/repro/_hash_array.py +8 -12
  527. scitex/reproduce/__init__.py +1 -1
  528. scitex/resource/_get_processor_usages.py +3 -1
  529. scitex/resource/_log_processor_usages.py +3 -1
  530. scitex/rng/__init__.py +1 -1
  531. scitex/schema/README.md +178 -0
  532. scitex/schema/__init__.py +144 -0
  533. scitex/schema/_canvas.py +444 -0
  534. scitex/schema/_stats.py +762 -0
  535. scitex/schema/_validation.py +590 -0
  536. scitex/scholar/.legacy/Scholar.py +5 -12
  537. scitex/scholar/.legacy/_Scholar.py +66 -99
  538. scitex/scholar/.legacy/_ScholarAPI.py +75 -66
  539. scitex/scholar/.legacy/_tmp/search_engine/_BaseSearchEngine.py +3 -3
  540. scitex/scholar/.legacy/_tmp/search_engine/_UnifiedSearcher.py +4 -9
  541. scitex/scholar/.legacy/_tmp/search_engine/__init__.py +14 -21
  542. scitex/scholar/.legacy/_tmp/search_engine/local/_LocalSearchEngine.py +40 -37
  543. scitex/scholar/.legacy/_tmp/search_engine/local/_VectorSearchEngine.py +31 -28
  544. scitex/scholar/.legacy/_tmp/search_engine/web/_ArxivSearchEngine.py +74 -65
  545. scitex/scholar/.legacy/_tmp/search_engine/web/_CrossRefSearchEngine.py +122 -116
  546. scitex/scholar/.legacy/_tmp/search_engine/web/_GoogleScholarSearchEngine.py +65 -59
  547. scitex/scholar/.legacy/_tmp/search_engine/web/_PubMedSearchEngine.py +121 -107
  548. scitex/scholar/.legacy/_tmp/search_engine/web/_SemanticScholarSearchEngine.py +5 -12
  549. scitex/scholar/.legacy/database/_DatabaseEntry.py +49 -45
  550. scitex/scholar/.legacy/database/_DatabaseIndex.py +131 -94
  551. scitex/scholar/.legacy/database/_LibraryManager.py +65 -63
  552. scitex/scholar/.legacy/database/_PaperDatabase.py +138 -124
  553. scitex/scholar/.legacy/database/_ScholarDatabaseIntegration.py +14 -36
  554. scitex/scholar/.legacy/database/_StorageIntegratedDB.py +192 -156
  555. scitex/scholar/.legacy/database/_ZoteroCompatibleDB.py +300 -237
  556. scitex/scholar/.legacy/database/__init__.py +2 -1
  557. scitex/scholar/.legacy/database/manage.py +92 -84
  558. scitex/scholar/.legacy/lookup/_LookupIndex.py +157 -101
  559. scitex/scholar/.legacy/lookup/__init__.py +2 -1
  560. scitex/scholar/.legacy/metadata/doi/batch/_MetadataHandlerForBatchDOIResolution.py +4 -9
  561. scitex/scholar/.legacy/metadata/doi/batch/_ProgressManagerForBatchDOIResolution.py +10 -23
  562. scitex/scholar/.legacy/metadata/doi/batch/_SourceStatsManagerForBatchDOIResolution.py +4 -9
  563. scitex/scholar/.legacy/metadata/doi/batch/__init__.py +3 -1
  564. scitex/scholar/.legacy/metadata/doi/resolvers/_BatchDOIResolver.py +10 -25
  565. scitex/scholar/.legacy/metadata/doi/resolvers/_BibTeXDOIResolver.py +19 -49
  566. scitex/scholar/.legacy/metadata/doi/resolvers/_DOIResolver.py +1 -0
  567. scitex/scholar/.legacy/metadata/doi/resolvers/_SingleDOIResolver.py +8 -20
  568. scitex/scholar/.legacy/metadata/doi/sources/.combined-SemanticScholarSource/_SemanticScholarSource.py +37 -35
  569. scitex/scholar/.legacy/metadata/doi/sources/.combined-SemanticScholarSource/_SemanticScholarSourceEnhanced.py +49 -37
  570. scitex/scholar/.legacy/metadata/doi/sources/_ArXivSource.py +11 -30
  571. scitex/scholar/.legacy/metadata/doi/sources/_BaseDOISource.py +19 -47
  572. scitex/scholar/.legacy/metadata/doi/sources/_CrossRefLocalSource.py +1 -0
  573. scitex/scholar/.legacy/metadata/doi/sources/_CrossRefSource.py +12 -33
  574. scitex/scholar/.legacy/metadata/doi/sources/_OpenAlexSource.py +8 -20
  575. scitex/scholar/.legacy/metadata/doi/sources/_PubMedSource.py +10 -27
  576. scitex/scholar/.legacy/metadata/doi/sources/_SemanticScholarSource.py +11 -29
  577. scitex/scholar/.legacy/metadata/doi/sources/_SourceManager.py +8 -21
  578. scitex/scholar/.legacy/metadata/doi/sources/_SourceResolutionStrategy.py +24 -55
  579. scitex/scholar/.legacy/metadata/doi/sources/_SourceRotationManager.py +8 -21
  580. scitex/scholar/.legacy/metadata/doi/sources/_URLDOISource.py +9 -16
  581. scitex/scholar/.legacy/metadata/doi/sources/_UnifiedSource.py +8 -22
  582. scitex/scholar/.legacy/metadata/doi/sources/__init__.py +1 -0
  583. scitex/scholar/.legacy/metadata/doi/utils/_PubMedConverter.py +4 -8
  584. scitex/scholar/.legacy/metadata/doi/utils/_RateLimitHandler.py +17 -43
  585. scitex/scholar/.legacy/metadata/doi/utils/_TextNormalizer.py +8 -18
  586. scitex/scholar/.legacy/metadata/doi/utils/_URLDOIExtractor.py +4 -8
  587. scitex/scholar/.legacy/metadata/doi/utils/__init__.py +1 -0
  588. scitex/scholar/.legacy/metadata/doi/utils/_to_complete_metadata_structure.py +1 -0
  589. scitex/scholar/.legacy/metadata/enrichment/_LibraryEnricher.py +2 -3
  590. scitex/scholar/.legacy/metadata/enrichment/enrichers/_ImpactFactorEnricher.py +6 -12
  591. scitex/scholar/.legacy/metadata/enrichment/enrichers/_SmartEnricher.py +5 -10
  592. scitex/scholar/.legacy/metadata/enrichment/sources/_UnifiedMetadataSource.py +4 -5
  593. scitex/scholar/.legacy/metadata/query_to_full_meta_json.py +8 -12
  594. scitex/scholar/.legacy/metadata/urls/_URLMetadataHandler.py +3 -3
  595. scitex/scholar/.legacy/metadata/urls/_ZoteroTranslatorRunner.py +15 -21
  596. scitex/scholar/.legacy/metadata/urls/__init__.py +3 -3
  597. scitex/scholar/.legacy/metadata/urls/_finder.py +4 -6
  598. scitex/scholar/.legacy/metadata/urls/_handler.py +7 -15
  599. scitex/scholar/.legacy/metadata/urls/_resolver.py +6 -12
  600. scitex/scholar/.legacy/search/_Embedder.py +74 -69
  601. scitex/scholar/.legacy/search/_SemanticSearch.py +91 -90
  602. scitex/scholar/.legacy/search/_SemanticSearchEngine.py +104 -109
  603. scitex/scholar/.legacy/search/_UnifiedSearcher.py +530 -471
  604. scitex/scholar/.legacy/search/_VectorDatabase.py +111 -92
  605. scitex/scholar/.legacy/search/__init__.py +1 -0
  606. scitex/scholar/.legacy/storage/_EnhancedStorageManager.py +182 -154
  607. scitex/scholar/.legacy/storage/__init__.py +2 -1
  608. scitex/scholar/__init__.py +0 -2
  609. scitex/scholar/__main__.py +1 -3
  610. scitex/scholar/auth/ScholarAuthManager.py +13 -36
  611. scitex/scholar/auth/core/AuthenticationGateway.py +15 -29
  612. scitex/scholar/auth/core/BrowserAuthenticator.py +22 -57
  613. scitex/scholar/auth/core/StrategyResolver.py +10 -27
  614. scitex/scholar/auth/core/__init__.py +5 -1
  615. scitex/scholar/auth/gateway/_OpenURLLinkFinder.py +11 -21
  616. scitex/scholar/auth/gateway/_OpenURLResolver.py +10 -18
  617. scitex/scholar/auth/gateway/_resolve_functions.py +3 -3
  618. scitex/scholar/auth/providers/BaseAuthenticator.py +1 -0
  619. scitex/scholar/auth/providers/EZProxyAuthenticator.py +7 -14
  620. scitex/scholar/auth/providers/OpenAthensAuthenticator.py +29 -57
  621. scitex/scholar/auth/providers/ShibbolethAuthenticator.py +87 -73
  622. scitex/scholar/auth/session/AuthCacheManager.py +12 -22
  623. scitex/scholar/auth/session/SessionManager.py +4 -6
  624. scitex/scholar/auth/sso/BaseSSOAutomator.py +13 -19
  625. scitex/scholar/auth/sso/OpenAthensSSOAutomator.py +16 -45
  626. scitex/scholar/auth/sso/SSOAutomator.py +8 -15
  627. scitex/scholar/auth/sso/UniversityOfMelbourneSSOAutomator.py +13 -23
  628. scitex/scholar/browser/ScholarBrowserManager.py +31 -56
  629. scitex/scholar/browser/__init__.py +1 -0
  630. scitex/scholar/browser/utils/click_and_wait.py +3 -4
  631. scitex/scholar/browser/utils/close_unwanted_pages.py +4 -7
  632. scitex/scholar/browser/utils/wait_redirects.py +15 -40
  633. scitex/scholar/citation_graph/__init__.py +0 -0
  634. scitex/scholar/citation_graph/builder.py +3 -7
  635. scitex/scholar/citation_graph/database.py +4 -11
  636. scitex/scholar/citation_graph/example.py +5 -10
  637. scitex/scholar/citation_graph/models.py +0 -0
  638. scitex/scholar/cli/_url_utils.py +1 -1
  639. scitex/scholar/cli/chrome.py +5 -3
  640. scitex/scholar/cli/download_pdf.py +13 -14
  641. scitex/scholar/cli/handlers/bibtex_handler.py +4 -12
  642. scitex/scholar/cli/handlers/doi_handler.py +1 -3
  643. scitex/scholar/cli/handlers/project_handler.py +6 -20
  644. scitex/scholar/cli/open_browser.py +41 -39
  645. scitex/scholar/cli/open_browser_auto.py +31 -39
  646. scitex/scholar/cli/open_browser_monitored.py +27 -24
  647. scitex/scholar/config/ScholarConfig.py +5 -8
  648. scitex/scholar/config/__init__.py +1 -0
  649. scitex/scholar/config/core/_CascadeConfig.py +3 -3
  650. scitex/scholar/config/core/_PathManager.py +16 -28
  651. scitex/scholar/core/Paper.py +79 -78
  652. scitex/scholar/core/Papers.py +16 -27
  653. scitex/scholar/core/Scholar.py +98 -229
  654. scitex/scholar/core/journal_normalizer.py +52 -49
  655. scitex/scholar/core/oa_cache.py +27 -23
  656. scitex/scholar/core/open_access.py +17 -8
  657. scitex/scholar/docs/template.py +4 -3
  658. scitex/scholar/docs/to_claude/examples/example-python-project-scitex/scripts/mnist/clf_svm.py +0 -0
  659. scitex/scholar/docs/to_claude/examples/example-python-project-scitex/scripts/mnist/download.py +0 -0
  660. scitex/scholar/docs/to_claude/examples/example-python-project-scitex/scripts/mnist/plot_conf_mat.py +0 -0
  661. scitex/scholar/docs/to_claude/examples/example-python-project-scitex/scripts/mnist/plot_digits.py +0 -0
  662. scitex/scholar/docs/to_claude/examples/example-python-project-scitex/scripts/mnist/plot_umap_space.py +0 -0
  663. scitex/scholar/examples/00_config.py +10 -9
  664. scitex/scholar/examples/01_auth.py +3 -0
  665. scitex/scholar/examples/02_browser.py +14 -10
  666. scitex/scholar/examples/03_01-engine.py +3 -0
  667. scitex/scholar/examples/03_02-engine-for-bibtex.py +4 -3
  668. scitex/scholar/examples/04_01-url.py +9 -9
  669. scitex/scholar/examples/04_02-url-for-bibtex.py +7 -3
  670. scitex/scholar/examples/04_02-url-for-dois.py +87 -97
  671. scitex/scholar/examples/05_download_pdf.py +10 -4
  672. scitex/scholar/examples/06_find_and_download.py +6 -6
  673. scitex/scholar/examples/06_parse_bibtex.py +17 -17
  674. scitex/scholar/examples/07_storage_integration.py +6 -9
  675. scitex/scholar/examples/99_fullpipeline-for-bibtex.py +14 -15
  676. scitex/scholar/examples/99_fullpipeline-for-one-entry.py +31 -23
  677. scitex/scholar/examples/99_maintenance.py +3 -0
  678. scitex/scholar/examples/dev.py +2 -3
  679. scitex/scholar/examples/zotero_integration.py +11 -18
  680. scitex/scholar/impact_factor/ImpactFactorEngine.py +7 -9
  681. scitex/scholar/impact_factor/estimation/__init__.py +4 -4
  682. scitex/scholar/impact_factor/estimation/core/__init__.py +3 -7
  683. scitex/scholar/impact_factor/estimation/core/cache_manager.py +223 -211
  684. scitex/scholar/impact_factor/estimation/core/calculator.py +165 -131
  685. scitex/scholar/impact_factor/estimation/core/journal_matcher.py +217 -172
  686. scitex/scholar/impact_factor/jcr/ImpactFactorJCREngine.py +6 -14
  687. scitex/scholar/impact_factor/jcr/build_database.py +4 -3
  688. scitex/scholar/integration/base.py +9 -17
  689. scitex/scholar/integration/mendeley/exporter.py +2 -4
  690. scitex/scholar/integration/mendeley/importer.py +3 -3
  691. scitex/scholar/integration/mendeley/linker.py +3 -3
  692. scitex/scholar/integration/mendeley/mapper.py +9 -6
  693. scitex/scholar/integration/zotero/__main__.py +26 -43
  694. scitex/scholar/integration/zotero/exporter.py +15 -11
  695. scitex/scholar/integration/zotero/importer.py +12 -10
  696. scitex/scholar/integration/zotero/linker.py +8 -12
  697. scitex/scholar/integration/zotero/mapper.py +17 -12
  698. scitex/scholar/metadata_engines/.combined-SemanticScholarSource/_SemanticScholarSource.py +37 -35
  699. scitex/scholar/metadata_engines/.combined-SemanticScholarSource/_SemanticScholarSourceEnhanced.py +47 -35
  700. scitex/scholar/metadata_engines/ScholarEngine.py +21 -43
  701. scitex/scholar/metadata_engines/__init__.py +1 -0
  702. scitex/scholar/metadata_engines/individual/ArXivEngine.py +15 -37
  703. scitex/scholar/metadata_engines/individual/CrossRefEngine.py +15 -42
  704. scitex/scholar/metadata_engines/individual/CrossRefLocalEngine.py +24 -45
  705. scitex/scholar/metadata_engines/individual/OpenAlexEngine.py +11 -21
  706. scitex/scholar/metadata_engines/individual/PubMedEngine.py +10 -27
  707. scitex/scholar/metadata_engines/individual/SemanticScholarEngine.py +28 -35
  708. scitex/scholar/metadata_engines/individual/URLDOIEngine.py +11 -22
  709. scitex/scholar/metadata_engines/individual/_BaseDOIEngine.py +20 -49
  710. scitex/scholar/metadata_engines/utils/_PubMedConverter.py +4 -8
  711. scitex/scholar/metadata_engines/utils/_URLDOIExtractor.py +5 -10
  712. scitex/scholar/metadata_engines/utils/__init__.py +2 -0
  713. scitex/scholar/metadata_engines/utils/_metadata2bibtex.py +3 -0
  714. scitex/scholar/metadata_engines/utils/_standardize_metadata.py +2 -3
  715. scitex/scholar/pdf_download/ScholarPDFDownloader.py +25 -37
  716. scitex/scholar/pdf_download/strategies/chrome_pdf_viewer.py +11 -19
  717. scitex/scholar/pdf_download/strategies/direct_download.py +5 -9
  718. scitex/scholar/pdf_download/strategies/manual_download_fallback.py +3 -3
  719. scitex/scholar/pdf_download/strategies/manual_download_utils.py +6 -13
  720. scitex/scholar/pdf_download/strategies/open_access_download.py +49 -31
  721. scitex/scholar/pdf_download/strategies/response_body.py +8 -19
  722. scitex/scholar/pipelines/ScholarPipelineBibTeX.py +9 -18
  723. scitex/scholar/pipelines/ScholarPipelineMetadataParallel.py +25 -26
  724. scitex/scholar/pipelines/ScholarPipelineMetadataSingle.py +62 -23
  725. scitex/scholar/pipelines/ScholarPipelineParallel.py +13 -30
  726. scitex/scholar/pipelines/ScholarPipelineSearchParallel.py +299 -220
  727. scitex/scholar/pipelines/ScholarPipelineSearchSingle.py +202 -165
  728. scitex/scholar/pipelines/ScholarPipelineSingle.py +25 -51
  729. scitex/scholar/pipelines/SearchQueryParser.py +55 -55
  730. scitex/scholar/search_engines/ScholarSearchEngine.py +31 -27
  731. scitex/scholar/search_engines/_BaseSearchEngine.py +20 -23
  732. scitex/scholar/search_engines/individual/ArXivSearchEngine.py +53 -35
  733. scitex/scholar/search_engines/individual/CrossRefSearchEngine.py +47 -40
  734. scitex/scholar/search_engines/individual/OpenAlexSearchEngine.py +55 -50
  735. scitex/scholar/search_engines/individual/PubMedSearchEngine.py +8 -10
  736. scitex/scholar/search_engines/individual/SemanticScholarSearchEngine.py +55 -49
  737. scitex/scholar/storage/BibTeXHandler.py +150 -95
  738. scitex/scholar/storage/PaperIO.py +3 -6
  739. scitex/scholar/storage/ScholarLibrary.py +70 -49
  740. scitex/scholar/storage/_DeduplicationManager.py +52 -25
  741. scitex/scholar/storage/_LibraryCacheManager.py +19 -46
  742. scitex/scholar/storage/_LibraryManager.py +65 -175
  743. scitex/scholar/url_finder/ScholarURLFinder.py +9 -25
  744. scitex/scholar/url_finder/strategies/find_pdf_urls_by_direct_links.py +1 -1
  745. scitex/scholar/url_finder/strategies/find_pdf_urls_by_href.py +6 -10
  746. scitex/scholar/url_finder/strategies/find_pdf_urls_by_navigation.py +4 -6
  747. scitex/scholar/url_finder/strategies/find_pdf_urls_by_publisher_patterns.py +8 -15
  748. scitex/scholar/url_finder/strategies/find_pdf_urls_by_zotero_translators.py +3 -3
  749. scitex/scholar/url_finder/strategies/find_supplementary_urls_by_href.py +3 -3
  750. scitex/scholar/url_finder/translators/core/patterns.py +6 -4
  751. scitex/scholar/url_finder/translators/core/registry.py +6 -9
  752. scitex/scholar/url_finder/translators/individual/BOFiP_Impots.py +60 -52
  753. scitex/scholar/url_finder/translators/individual/Baidu_Scholar.py +54 -62
  754. scitex/scholar/url_finder/translators/individual/Bangkok_Post.py +38 -44
  755. scitex/scholar/url_finder/translators/individual/Baruch_Foundation.py +43 -47
  756. scitex/scholar/url_finder/translators/individual/Beobachter.py +46 -50
  757. scitex/scholar/url_finder/translators/individual/Bezneng_Gajit.py +37 -41
  758. scitex/scholar/url_finder/translators/individual/BibLaTeX.py +59 -52
  759. scitex/scholar/url_finder/translators/individual/BibTeX.py +83 -79
  760. scitex/scholar/url_finder/translators/individual/Biblio_com.py +48 -51
  761. scitex/scholar/url_finder/translators/individual/Bibliontology_RDF.py +58 -56
  762. scitex/scholar/url_finder/translators/individual/Camara_Brasileira_do_Livro_ISBN.py +102 -99
  763. scitex/scholar/url_finder/translators/individual/CanLII.py +49 -43
  764. scitex/scholar/url_finder/translators/individual/Canada_com.py +36 -40
  765. scitex/scholar/url_finder/translators/individual/Canadian_Letters_and_Images.py +43 -43
  766. scitex/scholar/url_finder/translators/individual/Canadiana_ca.py +77 -66
  767. scitex/scholar/url_finder/translators/individual/Cascadilla_Proceedings_Project.py +68 -62
  768. scitex/scholar/url_finder/translators/individual/Central_and_Eastern_European_Online_Library_Journals.py +60 -60
  769. scitex/scholar/url_finder/translators/individual/Champlain_Society_Collection.py +63 -61
  770. scitex/scholar/url_finder/translators/individual/Chicago_Journal_of_Theoretical_Computer_Science.py +74 -58
  771. scitex/scholar/url_finder/translators/individual/Christian_Science_Monitor.py +32 -38
  772. scitex/scholar/url_finder/translators/individual/Columbia_University_Press.py +51 -47
  773. scitex/scholar/url_finder/translators/individual/Common_Place.py +66 -57
  774. scitex/scholar/url_finder/translators/individual/Cornell_LII.py +66 -62
  775. scitex/scholar/url_finder/translators/individual/Cornell_University_Press.py +38 -45
  776. scitex/scholar/url_finder/translators/individual/CourtListener.py +52 -56
  777. scitex/scholar/url_finder/translators/individual/DAI_Zenon.py +53 -54
  778. scitex/scholar/url_finder/translators/individual/access_medicine.py +27 -33
  779. scitex/scholar/url_finder/translators/individual/acm.py +1 -1
  780. scitex/scholar/url_finder/translators/individual/acm_digital_library.py +93 -63
  781. scitex/scholar/url_finder/translators/individual/airiti.py +3 -1
  782. scitex/scholar/url_finder/translators/individual/aosic.py +3 -1
  783. scitex/scholar/url_finder/translators/individual/archive_ouverte_aosic.py +3 -1
  784. scitex/scholar/url_finder/translators/individual/archive_ouverte_en_sciences_de_l_information_et_de_la_communication___aosic_.py +6 -2
  785. scitex/scholar/url_finder/translators/individual/artforum.py +35 -27
  786. scitex/scholar/url_finder/translators/individual/arxiv.py +1 -1
  787. scitex/scholar/url_finder/translators/individual/arxiv_org.py +8 -4
  788. scitex/scholar/url_finder/translators/individual/atlanta_journal_constitution.py +22 -18
  789. scitex/scholar/url_finder/translators/individual/atypon_journals.py +19 -11
  790. scitex/scholar/url_finder/translators/individual/austlii_and_nzlii.py +48 -44
  791. scitex/scholar/url_finder/translators/individual/australian_dictionary_of_biography.py +21 -17
  792. scitex/scholar/url_finder/translators/individual/bailii.py +22 -19
  793. scitex/scholar/url_finder/translators/individual/bbc.py +46 -42
  794. scitex/scholar/url_finder/translators/individual/bbc_genome.py +37 -25
  795. scitex/scholar/url_finder/translators/individual/biblioteca_nacional_de_maestros.py +24 -20
  796. scitex/scholar/url_finder/translators/individual/bibliotheque_archives_nationale_quebec_pistard.py +42 -43
  797. scitex/scholar/url_finder/translators/individual/bibliotheque_archives_nationales_quebec.py +87 -81
  798. scitex/scholar/url_finder/translators/individual/bibliotheque_nationale_france.py +39 -37
  799. scitex/scholar/url_finder/translators/individual/bibsys.py +32 -28
  800. scitex/scholar/url_finder/translators/individual/bioconductor.py +58 -52
  801. scitex/scholar/url_finder/translators/individual/biomed_central.py +23 -15
  802. scitex/scholar/url_finder/translators/individual/biorxiv.py +26 -13
  803. scitex/scholar/url_finder/translators/individual/blogger.py +39 -43
  804. scitex/scholar/url_finder/translators/individual/bloomberg.py +48 -52
  805. scitex/scholar/url_finder/translators/individual/bloomsbury_food_library.py +37 -37
  806. scitex/scholar/url_finder/translators/individual/bluesky.py +30 -28
  807. scitex/scholar/url_finder/translators/individual/bnf_isbn.py +1 -1
  808. scitex/scholar/url_finder/translators/individual/bocc.py +66 -60
  809. scitex/scholar/url_finder/translators/individual/boe.py +52 -52
  810. scitex/scholar/url_finder/translators/individual/brill.py +3 -1
  811. scitex/scholar/url_finder/translators/individual/business_standard.py +36 -38
  812. scitex/scholar/url_finder/translators/individual/cabi_cab_abstracts.py +39 -41
  813. scitex/scholar/url_finder/translators/individual/cambridge.py +3 -1
  814. scitex/scholar/url_finder/translators/individual/cambridge_core.py +30 -24
  815. scitex/scholar/url_finder/translators/individual/caod.py +50 -46
  816. scitex/scholar/url_finder/translators/individual/cbc.py +91 -67
  817. scitex/scholar/url_finder/translators/individual/ccfr_bnf.py +49 -53
  818. scitex/scholar/url_finder/translators/individual/cia_world_factbook.py +43 -33
  819. scitex/scholar/url_finder/translators/individual/crossref_rest.py +208 -174
  820. scitex/scholar/url_finder/translators/individual/current_affairs.py +29 -35
  821. scitex/scholar/url_finder/translators/individual/dabi.py +70 -66
  822. scitex/scholar/url_finder/translators/individual/dagens_nyheter.py +3 -1
  823. scitex/scholar/url_finder/translators/individual/dagstuhl.py +10 -15
  824. scitex/scholar/url_finder/translators/individual/dar_almandumah.py +13 -9
  825. scitex/scholar/url_finder/translators/individual/dart_europe.py +19 -22
  826. scitex/scholar/url_finder/translators/individual/data_gov.py +2 -2
  827. scitex/scholar/url_finder/translators/individual/databrary.py +27 -28
  828. scitex/scholar/url_finder/translators/individual/datacite_json.py +152 -137
  829. scitex/scholar/url_finder/translators/individual/dataverse.py +68 -64
  830. scitex/scholar/url_finder/translators/individual/daum_news.py +38 -38
  831. scitex/scholar/url_finder/translators/individual/dblp.py +4 -8
  832. scitex/scholar/url_finder/translators/individual/dblp_computer_science_bibliography.py +8 -3
  833. scitex/scholar/url_finder/translators/individual/dbpia.py +5 -3
  834. scitex/scholar/url_finder/translators/individual/defense_technical_information_center.py +30 -28
  835. scitex/scholar/url_finder/translators/individual/delpher.py +102 -79
  836. scitex/scholar/url_finder/translators/individual/demographic_research.py +35 -31
  837. scitex/scholar/url_finder/translators/individual/denik_cz.py +58 -54
  838. scitex/scholar/url_finder/translators/individual/depatisnet.py +7 -10
  839. scitex/scholar/url_finder/translators/individual/der_freitag.py +81 -66
  840. scitex/scholar/url_finder/translators/individual/der_spiegel.py +56 -54
  841. scitex/scholar/url_finder/translators/individual/digibib_net.py +3 -1
  842. scitex/scholar/url_finder/translators/individual/digizeitschriften.py +3 -1
  843. scitex/scholar/url_finder/translators/individual/dpla.py +13 -14
  844. scitex/scholar/url_finder/translators/individual/dspace.py +2 -2
  845. scitex/scholar/url_finder/translators/individual/ebrary.py +3 -1
  846. scitex/scholar/url_finder/translators/individual/ebscohost.py +3 -1
  847. scitex/scholar/url_finder/translators/individual/electronic_colloquium_on_computational_complexity.py +3 -1
  848. scitex/scholar/url_finder/translators/individual/elife.py +3 -1
  849. scitex/scholar/url_finder/translators/individual/elsevier_health_journals.py +3 -1
  850. scitex/scholar/url_finder/translators/individual/emerald.py +3 -1
  851. scitex/scholar/url_finder/translators/individual/emerald_insight.py +3 -1
  852. scitex/scholar/url_finder/translators/individual/epicurious.py +3 -1
  853. scitex/scholar/url_finder/translators/individual/eurogamerusgamer.py +3 -1
  854. scitex/scholar/url_finder/translators/individual/fachportal_padagogik.py +3 -1
  855. scitex/scholar/url_finder/translators/individual/frontiers.py +1 -1
  856. scitex/scholar/url_finder/translators/individual/gale_databases.py +3 -1
  857. scitex/scholar/url_finder/translators/individual/gms_german_medical_science.py +6 -2
  858. scitex/scholar/url_finder/translators/individual/ieee_computer_society.py +6 -2
  859. scitex/scholar/url_finder/translators/individual/ieee_xplore.py +41 -35
  860. scitex/scholar/url_finder/translators/individual/inter_research_science_center.py +6 -2
  861. scitex/scholar/url_finder/translators/individual/jisc_historical_texts.py +3 -1
  862. scitex/scholar/url_finder/translators/individual/jstor.py +14 -12
  863. scitex/scholar/url_finder/translators/individual/korean_national_library.py +3 -1
  864. scitex/scholar/url_finder/translators/individual/la_times.py +3 -1
  865. scitex/scholar/url_finder/translators/individual/landesbibliographie_baden_wurttemberg.py +3 -1
  866. scitex/scholar/url_finder/translators/individual/legislative_insight.py +3 -1
  867. scitex/scholar/url_finder/translators/individual/libraries_tasmania.py +3 -1
  868. scitex/scholar/url_finder/translators/individual/library_catalog__koha_.py +3 -1
  869. scitex/scholar/url_finder/translators/individual/lingbuzz.py +2 -2
  870. scitex/scholar/url_finder/translators/individual/max_planck_institute_for_the_history_of_science_virtual_laboratory_library.py +3 -1
  871. scitex/scholar/url_finder/translators/individual/mdpi.py +12 -6
  872. scitex/scholar/url_finder/translators/individual/microbiology_society_journals.py +3 -1
  873. scitex/scholar/url_finder/translators/individual/midas_journals.py +3 -1
  874. scitex/scholar/url_finder/translators/individual/nagoya_university_opac.py +3 -1
  875. scitex/scholar/url_finder/translators/individual/nature_publishing_group.py +32 -19
  876. scitex/scholar/url_finder/translators/individual/ntsb_accident_reports.py +3 -1
  877. scitex/scholar/url_finder/translators/individual/openedition_journals.py +8 -4
  878. scitex/scholar/url_finder/translators/individual/orcid.py +16 -15
  879. scitex/scholar/url_finder/translators/individual/oxford.py +25 -19
  880. scitex/scholar/url_finder/translators/individual/oxford_dictionaries_premium.py +3 -1
  881. scitex/scholar/url_finder/translators/individual/ozon_ru.py +3 -1
  882. scitex/scholar/url_finder/translators/individual/plos.py +9 -12
  883. scitex/scholar/url_finder/translators/individual/polygon.py +3 -1
  884. scitex/scholar/url_finder/translators/individual/primo.py +3 -1
  885. scitex/scholar/url_finder/translators/individual/project_muse.py +3 -1
  886. scitex/scholar/url_finder/translators/individual/pubfactory_journals.py +3 -1
  887. scitex/scholar/url_finder/translators/individual/pubmed.py +71 -65
  888. scitex/scholar/url_finder/translators/individual/pubmed_central.py +8 -6
  889. scitex/scholar/url_finder/translators/individual/rechtspraak_nl.py +3 -1
  890. scitex/scholar/url_finder/translators/individual/sage_journals.py +25 -17
  891. scitex/scholar/url_finder/translators/individual/sciencedirect.py +36 -17
  892. scitex/scholar/url_finder/translators/individual/semantics_visual_library.py +3 -1
  893. scitex/scholar/url_finder/translators/individual/silverchair.py +70 -52
  894. scitex/scholar/url_finder/translators/individual/sora.py +3 -1
  895. scitex/scholar/url_finder/translators/individual/springer.py +15 -11
  896. scitex/scholar/url_finder/translators/individual/ssrn.py +3 -3
  897. scitex/scholar/url_finder/translators/individual/stanford_encyclopedia_of_philosophy.py +3 -1
  898. scitex/scholar/url_finder/translators/individual/superlib.py +3 -1
  899. scitex/scholar/url_finder/translators/individual/treesearch.py +3 -1
  900. scitex/scholar/url_finder/translators/individual/university_of_chicago_press_books.py +3 -1
  901. scitex/scholar/url_finder/translators/individual/vlex.py +3 -1
  902. scitex/scholar/url_finder/translators/individual/web_of_science.py +3 -1
  903. scitex/scholar/url_finder/translators/individual/web_of_science_nextgen.py +3 -1
  904. scitex/scholar/url_finder/translators/individual/wiley.py +31 -25
  905. scitex/scholar/url_finder/translators/individual/wilson_center_digital_archive.py +3 -1
  906. scitex/scholar/utils/bibtex/_parse_bibtex.py +3 -3
  907. scitex/scholar/utils/cleanup/_cleanup_scholar_processes.py +5 -9
  908. scitex/scholar/utils/text/_TextNormalizer.py +249 -176
  909. scitex/scholar/utils/validation/DOIValidator.py +31 -28
  910. scitex/scholar/utils/validation/__init__.py +0 -0
  911. scitex/scholar/utils/validation/validate_library_dois.py +61 -57
  912. scitex/scholar/zotero/__init__.py +1 -1
  913. scitex/security/cli.py +7 -20
  914. scitex/security/github.py +45 -32
  915. scitex/session/__init__.py +8 -9
  916. scitex/session/_decorator.py +49 -42
  917. scitex/session/_lifecycle.py +39 -39
  918. scitex/session/_manager.py +24 -20
  919. scitex/sh/__init__.py +4 -3
  920. scitex/sh/_execute.py +10 -7
  921. scitex/sh/_security.py +3 -3
  922. scitex/sh/_types.py +2 -3
  923. scitex/stats/__init__.py +57 -6
  924. scitex/stats/_schema.py +42 -569
  925. scitex/stats/auto/__init__.py +188 -0
  926. scitex/stats/auto/_context.py +331 -0
  927. scitex/stats/auto/_formatting.py +679 -0
  928. scitex/stats/auto/_rules.py +901 -0
  929. scitex/stats/auto/_selector.py +554 -0
  930. scitex/stats/auto/_styles.py +721 -0
  931. scitex/stats/correct/__init__.py +4 -4
  932. scitex/stats/correct/_correct_bonferroni.py +43 -34
  933. scitex/stats/correct/_correct_fdr.py +14 -40
  934. scitex/stats/correct/_correct_fdr_.py +39 -46
  935. scitex/stats/correct/_correct_holm.py +14 -32
  936. scitex/stats/correct/_correct_sidak.py +36 -21
  937. scitex/stats/descriptive/_circular.py +20 -21
  938. scitex/stats/descriptive/_describe.py +19 -5
  939. scitex/stats/descriptive/_nan.py +5 -7
  940. scitex/stats/descriptive/_real.py +4 -3
  941. scitex/stats/effect_sizes/__init__.py +10 -11
  942. scitex/stats/effect_sizes/_cliffs_delta.py +35 -32
  943. scitex/stats/effect_sizes/_cohens_d.py +30 -31
  944. scitex/stats/effect_sizes/_epsilon_squared.py +19 -22
  945. scitex/stats/effect_sizes/_eta_squared.py +23 -27
  946. scitex/stats/effect_sizes/_prob_superiority.py +18 -21
  947. scitex/stats/posthoc/__init__.py +3 -3
  948. scitex/stats/posthoc/_dunnett.py +75 -55
  949. scitex/stats/posthoc/_games_howell.py +61 -43
  950. scitex/stats/posthoc/_tukey_hsd.py +42 -34
  951. scitex/stats/power/__init__.py +2 -2
  952. scitex/stats/power/_power.py +56 -56
  953. scitex/stats/tests/__init__.py +1 -1
  954. scitex/stats/tests/correlation/__init__.py +1 -1
  955. scitex/stats/tests/correlation/_test_pearson.py +28 -38
  956. scitex/stats/utils/__init__.py +14 -17
  957. scitex/stats/utils/_effect_size.py +85 -78
  958. scitex/stats/utils/_formatters.py +49 -43
  959. scitex/stats/utils/_normalizers.py +7 -14
  960. scitex/stats/utils/_power.py +56 -56
  961. scitex/str/__init__.py +1 -0
  962. scitex/str/_clean_path.py +3 -3
  963. scitex/str/_factor_out_digits.py +86 -58
  964. scitex/str/_format_plot_text.py +180 -111
  965. scitex/str/_latex.py +19 -19
  966. scitex/str/_latex_fallback.py +9 -10
  967. scitex/str/_parse.py +3 -6
  968. scitex/str/_print_debug.py +13 -13
  969. scitex/str/_printc.py +2 -0
  970. scitex/str/_search.py +3 -3
  971. scitex/template/.legacy/_clone_project.py +9 -13
  972. scitex/template/__init__.py +10 -2
  973. scitex/template/_clone_project.py +7 -2
  974. scitex/template/_copy.py +1 -0
  975. scitex/template/_customize.py +3 -6
  976. scitex/template/_git_strategy.py +2 -3
  977. scitex/template/_rename.py +1 -0
  978. scitex/template/clone_pip_project.py +6 -7
  979. scitex/template/clone_research.py +7 -10
  980. scitex/template/clone_singularity.py +6 -7
  981. scitex/template/clone_writer_directory.py +6 -7
  982. scitex/tex/_preview.py +26 -11
  983. scitex/tex/_to_vec.py +10 -7
  984. scitex/torch/__init__.py +11 -1
  985. scitex/types/_ArrayLike.py +2 -0
  986. scitex/types/_is_listed_X.py +3 -3
  987. scitex/units.py +110 -77
  988. scitex/utils/_compress_hdf5.py +3 -3
  989. scitex/utils/_email.py +8 -4
  990. scitex/utils/_notify.py +14 -8
  991. scitex/utils/_search.py +6 -6
  992. scitex/utils/_verify_scitex_format.py +17 -42
  993. scitex/utils/_verify_scitex_format_v01.py +12 -34
  994. scitex/utils/template.py +4 -3
  995. scitex/vis/__init__.py +0 -0
  996. scitex/vis/backend/__init__.py +3 -3
  997. scitex/vis/backend/{export.py → _export.py} +1 -1
  998. scitex/vis/backend/{parser.py → _parser.py} +1 -3
  999. scitex/vis/backend/{render.py → _render.py} +1 -1
  1000. scitex/vis/canvas.py +15 -3
  1001. scitex/vis/editor/__init__.py +0 -0
  1002. scitex/vis/editor/_dearpygui_editor.py +450 -304
  1003. scitex/vis/editor/_defaults.py +114 -123
  1004. scitex/vis/editor/_edit.py +38 -26
  1005. scitex/vis/editor/_flask_editor.py +8 -8
  1006. scitex/vis/editor/_mpl_editor.py +63 -48
  1007. scitex/vis/editor/_qt_editor.py +210 -159
  1008. scitex/vis/editor/_tkinter_editor.py +146 -89
  1009. scitex/vis/editor/flask_editor/__init__.py +10 -10
  1010. scitex/vis/editor/flask_editor/_bbox.py +529 -0
  1011. scitex/vis/editor/flask_editor/{core.py → _core.py} +45 -29
  1012. scitex/vis/editor/flask_editor/_plotter.py +567 -0
  1013. scitex/vis/editor/flask_editor/_renderer.py +393 -0
  1014. scitex/vis/editor/flask_editor/{utils.py → _utils.py} +13 -14
  1015. scitex/vis/editor/flask_editor/templates/__init__.py +5 -5
  1016. scitex/vis/editor/flask_editor/templates/{html.py → _html.py} +234 -16
  1017. scitex/vis/editor/flask_editor/templates/_scripts.py +1261 -0
  1018. scitex/vis/editor/flask_editor/templates/{styles.py → _styles.py} +192 -2
  1019. scitex/vis/io/__init__.py +5 -5
  1020. scitex/vis/io/{canvas.py → _canvas.py} +8 -4
  1021. scitex/vis/io/{data.py → _data.py} +13 -9
  1022. scitex/vis/io/{directory.py → _directory.py} +7 -4
  1023. scitex/vis/io/{export.py → _export.py} +15 -12
  1024. scitex/vis/io/{load.py → _load.py} +1 -1
  1025. scitex/vis/io/{panel.py → _panel.py} +21 -13
  1026. scitex/vis/io/{save.py → _save.py} +0 -0
  1027. scitex/vis/model/__init__.py +7 -7
  1028. scitex/vis/model/{annotations.py → _annotations.py} +2 -4
  1029. scitex/vis/model/{axes.py → _axes.py} +1 -1
  1030. scitex/vis/model/{figure.py → _figure.py} +0 -0
  1031. scitex/vis/model/{guides.py → _guides.py} +1 -1
  1032. scitex/vis/model/{plot.py → _plot.py} +2 -4
  1033. scitex/vis/model/{plot_types.py → _plot_types.py} +0 -0
  1034. scitex/vis/model/{styles.py → _styles.py} +0 -0
  1035. scitex/vis/utils/__init__.py +2 -2
  1036. scitex/vis/utils/{defaults.py → _defaults.py} +1 -2
  1037. scitex/vis/utils/{validate.py → _validate.py} +3 -9
  1038. scitex/web/__init__.py +7 -1
  1039. scitex/web/_scraping.py +54 -38
  1040. scitex/web/_search_pubmed.py +30 -14
  1041. scitex/writer/.legacy/Writer_v01-refactored.py +4 -4
  1042. scitex/writer/.legacy/_compile.py +18 -28
  1043. scitex/writer/Writer.py +8 -21
  1044. scitex/writer/__init__.py +11 -11
  1045. scitex/writer/_clone_writer_project.py +2 -6
  1046. scitex/writer/_compile/__init__.py +1 -0
  1047. scitex/writer/_compile/_parser.py +1 -0
  1048. scitex/writer/_compile/_runner.py +35 -38
  1049. scitex/writer/_compile/_validator.py +1 -0
  1050. scitex/writer/_compile/manuscript.py +1 -0
  1051. scitex/writer/_compile/revision.py +1 -0
  1052. scitex/writer/_compile/supplementary.py +1 -0
  1053. scitex/writer/_compile_async.py +5 -12
  1054. scitex/writer/_project/__init__.py +1 -0
  1055. scitex/writer/_project/_create.py +10 -25
  1056. scitex/writer/_project/_trees.py +4 -9
  1057. scitex/writer/_project/_validate.py +2 -3
  1058. scitex/writer/_validate_tree_structures.py +7 -18
  1059. scitex/writer/dataclasses/__init__.py +8 -10
  1060. scitex/writer/dataclasses/config/_CONSTANTS.py +2 -3
  1061. scitex/writer/dataclasses/config/_WriterConfig.py +4 -9
  1062. scitex/writer/dataclasses/contents/_ManuscriptContents.py +14 -25
  1063. scitex/writer/dataclasses/contents/_RevisionContents.py +21 -16
  1064. scitex/writer/dataclasses/contents/_SupplementaryContents.py +21 -24
  1065. scitex/writer/dataclasses/core/_Document.py +2 -3
  1066. scitex/writer/dataclasses/core/_DocumentSection.py +8 -23
  1067. scitex/writer/dataclasses/results/_CompilationResult.py +2 -3
  1068. scitex/writer/dataclasses/results/_LaTeXIssue.py +3 -6
  1069. scitex/writer/dataclasses/results/_SaveSectionsResponse.py +20 -9
  1070. scitex/writer/dataclasses/results/_SectionReadResponse.py +24 -10
  1071. scitex/writer/dataclasses/tree/_ConfigTree.py +7 -4
  1072. scitex/writer/dataclasses/tree/_ManuscriptTree.py +10 -13
  1073. scitex/writer/dataclasses/tree/_RevisionTree.py +16 -17
  1074. scitex/writer/dataclasses/tree/_ScriptsTree.py +10 -5
  1075. scitex/writer/dataclasses/tree/_SharedTree.py +10 -13
  1076. scitex/writer/dataclasses/tree/_SupplementaryTree.py +15 -14
  1077. scitex/writer/utils/.legacy_git_retry.py +3 -8
  1078. scitex/writer/utils/_parse_latex_logs.py +2 -3
  1079. scitex/writer/utils/_parse_script_args.py +20 -23
  1080. scitex/writer/utils/_watch.py +5 -5
  1081. {scitex-2.5.0.dist-info → scitex-2.7.0.dist-info}/METADATA +4 -10
  1082. {scitex-2.5.0.dist-info → scitex-2.7.0.dist-info}/RECORD +1071 -975
  1083. scitex/db/_sqlite3/_SQLite3Mixins/_ColumnMixin_v01-indentation-issues.py +0 -583
  1084. scitex/plt/_subplots/_export_as_csv_formatters.py +0 -112
  1085. scitex/vis/editor/flask_editor/bbox.py +0 -216
  1086. scitex/vis/editor/flask_editor/plotter.py +0 -130
  1087. scitex/vis/editor/flask_editor/renderer.py +0 -184
  1088. scitex/vis/editor/flask_editor/templates/scripts.py +0 -614
  1089. {scitex-2.5.0.dist-info → scitex-2.7.0.dist-info}/WHEEL +0 -0
  1090. {scitex-2.5.0.dist-info → scitex-2.7.0.dist-info}/entry_points.txt +0 -0
  1091. {scitex-2.5.0.dist-info → scitex-2.7.0.dist-info}/licenses/LICENSE +0 -0
@@ -33,11 +33,19 @@ from datetime import datetime
33
33
  from scitex import logging
34
34
  from scitex.scholar.core import Paper
35
35
  from scitex.scholar.core import normalize_journal_name
36
- from scitex.scholar.search_engines.individual.PubMedSearchEngine import PubMedSearchEngine
37
- from scitex.scholar.search_engines.individual.CrossRefSearchEngine import CrossRefSearchEngine
36
+ from scitex.scholar.search_engines.individual.PubMedSearchEngine import (
37
+ PubMedSearchEngine,
38
+ )
39
+ from scitex.scholar.search_engines.individual.CrossRefSearchEngine import (
40
+ CrossRefSearchEngine,
41
+ )
38
42
  from scitex.scholar.search_engines.individual.ArXivSearchEngine import ArXivSearchEngine
39
- from scitex.scholar.search_engines.individual.SemanticScholarSearchEngine import SemanticScholarSearchEngine
40
- from scitex.scholar.search_engines.individual.OpenAlexSearchEngine import OpenAlexSearchEngine
43
+ from scitex.scholar.search_engines.individual.SemanticScholarSearchEngine import (
44
+ SemanticScholarSearchEngine,
45
+ )
46
+ from scitex.scholar.search_engines.individual.OpenAlexSearchEngine import (
47
+ OpenAlexSearchEngine,
48
+ )
41
49
 
42
50
  logger = logging.getLogger(__name__)
43
51
 
@@ -68,31 +76,31 @@ class ScholarPipelineSearchParallel:
68
76
 
69
77
  # Initialize search engines with email for rate limit benefits
70
78
  self.engines = {
71
- 'PubMed': PubMedSearchEngine(email=self.email),
72
- 'CrossRef': CrossRefSearchEngine(email=self.email),
73
- 'arXiv': ArXivSearchEngine(email=self.email),
74
- 'Semantic_Scholar': SemanticScholarSearchEngine(email=self.email),
75
- 'OpenAlex': OpenAlexSearchEngine(email=self.email),
79
+ "PubMed": PubMedSearchEngine(email=self.email),
80
+ "CrossRef": CrossRefSearchEngine(email=self.email),
81
+ "arXiv": ArXivSearchEngine(email=self.email),
82
+ "Semantic_Scholar": SemanticScholarSearchEngine(email=self.email),
83
+ "OpenAlex": OpenAlexSearchEngine(email=self.email),
76
84
  }
77
85
 
78
86
  # Statistics
79
87
  self.stats = {
80
- 'total_searches': 0,
81
- 'successful_searches': 0,
82
- 'failed_searches': 0,
83
- 'cache_hits': 0,
84
- 'total_time': 0.0,
85
- 'parallel_speedup': 0.0,
86
- 'engine_stats': {
88
+ "total_searches": 0,
89
+ "successful_searches": 0,
90
+ "failed_searches": 0,
91
+ "cache_hits": 0,
92
+ "total_time": 0.0,
93
+ "parallel_speedup": 0.0,
94
+ "engine_stats": {
87
95
  name: {
88
- 'attempts': 0,
89
- 'successes': 0,
90
- 'failures': 0,
91
- 'avg_response_time': 0.0,
92
- 'total_results': 0,
96
+ "attempts": 0,
97
+ "successes": 0,
98
+ "failures": 0,
99
+ "avg_response_time": 0.0,
100
+ "total_results": 0,
93
101
  }
94
102
  for name in self.engines.keys()
95
- }
103
+ },
96
104
  }
97
105
 
98
106
  logger.info(
@@ -130,7 +138,7 @@ class ScholarPipelineSearchParallel:
130
138
  - metadata: Search metadata (engines used, timing, engine_counts, etc.)
131
139
  """
132
140
  start_time = datetime.now()
133
- self.stats['total_searches'] += 1
141
+ self.stats["total_searches"] += 1
134
142
 
135
143
  # Determine search mode
136
144
  search_query = query or title or doi
@@ -144,7 +152,7 @@ class ScholarPipelineSearchParallel:
144
152
 
145
153
  # Prepare search parameters
146
154
  filters = filters or {}
147
- search_fields = search_fields or ['title', 'abstract']
155
+ search_fields = search_fields or ["title", "abstract"]
148
156
  per_engine_limit = max(10, max_results // len(self.engines))
149
157
 
150
158
  # Initialize engine counts dictionary
@@ -178,16 +186,18 @@ class ScholarPipelineSearchParallel:
178
186
  for engine_name, result in zip(engine_names, results):
179
187
  if isinstance(result, Exception):
180
188
  logger.error(f"{self.name}: {engine_name} search failed: {result}")
181
- self.stats['engine_stats'][engine_name]['failures'] += 1
189
+ self.stats["engine_stats"][engine_name]["failures"] += 1
182
190
  continue
183
191
 
184
- logger.info(f"{self.name}: {engine_name} returned {len(result) if result else 0} results (type: {type(result).__name__})")
192
+ logger.info(
193
+ f"{self.name}: {engine_name} returned {len(result) if result else 0} results (type: {type(result).__name__})"
194
+ )
185
195
 
186
196
  if result:
187
197
  all_papers.extend(result)
188
198
  engines_used.append(engine_name)
189
- self.stats['engine_stats'][engine_name]['successes'] += 1
190
- self.stats['engine_stats'][engine_name]['total_results'] += len(result)
199
+ self.stats["engine_stats"][engine_name]["successes"] += 1
200
+ self.stats["engine_stats"][engine_name]["total_results"] += len(result)
191
201
 
192
202
  # Deduplicate by DOI and title
193
203
  unique_papers = self._deduplicate_papers(all_papers)
@@ -202,9 +212,11 @@ class ScholarPipelineSearchParallel:
202
212
  unique_papers = self._apply_threshold_filters(unique_papers, filters)
203
213
 
204
214
  # Sort if requested
205
- sort_by = filters.get('sort_by', 'relevance')
206
- if sort_by and sort_by != 'relevance':
207
- unique_papers = self._sort_papers(unique_papers, sort_by, filters.get('sort_order', 'desc'))
215
+ sort_by = filters.get("sort_by", "relevance")
216
+ if sort_by and sort_by != "relevance":
217
+ unique_papers = self._sort_papers(
218
+ unique_papers, sort_by, filters.get("sort_order", "desc")
219
+ )
208
220
 
209
221
  # Limit to max_results
210
222
  unique_papers = unique_papers[:max_results]
@@ -215,8 +227,8 @@ class ScholarPipelineSearchParallel:
215
227
  # Calculate timing
216
228
  end_time = datetime.now()
217
229
  search_time = (end_time - start_time).total_seconds()
218
- self.stats['total_time'] += search_time
219
- self.stats['successful_searches'] += 1
230
+ self.stats["total_time"] += search_time
231
+ self.stats["successful_searches"] += 1
220
232
 
221
233
  logger.success(
222
234
  f"{self.name}: Parallel search completed in {search_time:.2f}s, "
@@ -225,19 +237,19 @@ class ScholarPipelineSearchParallel:
225
237
  )
226
238
 
227
239
  return {
228
- 'results': response_papers,
229
- 'metadata': {
230
- 'query': search_query,
231
- 'search_fields': search_fields,
232
- 'filters': filters,
233
- 'engines_used': engines_used,
234
- 'total_engines': len(self.engines),
235
- 'successful_engines': len(engines_used),
236
- 'total_results': len(response_papers),
237
- 'search_time': search_time,
238
- 'timestamp': datetime.now().isoformat(),
239
- 'engine_counts': engine_counts, # Per-engine result counts
240
- }
240
+ "results": response_papers,
241
+ "metadata": {
242
+ "query": search_query,
243
+ "search_fields": search_fields,
244
+ "filters": filters,
245
+ "engines_used": engines_used,
246
+ "total_engines": len(self.engines),
247
+ "successful_engines": len(engines_used),
248
+ "total_results": len(response_papers),
249
+ "search_time": search_time,
250
+ "timestamp": datetime.now().isoformat(),
251
+ "engine_counts": engine_counts, # Per-engine result counts
252
+ },
241
253
  }
242
254
 
243
255
  async def _search_engine(
@@ -263,16 +275,20 @@ class ScholarPipelineSearchParallel:
263
275
  on_progress: Optional callback(engine_name, status, count)
264
276
  engine_counts: Shared dictionary to store per-engine counts
265
277
  """
266
- self.stats['engine_stats'][engine_name]['attempts'] += 1
278
+ self.stats["engine_stats"][engine_name]["attempts"] += 1
267
279
  engine_start = datetime.now()
268
280
 
269
281
  # Notify start of search
270
282
  if on_progress:
271
283
  try:
272
- on_progress(engine_name, 'loading', 0)
273
- logger.info(f"{self.name}: Called on_progress for {engine_name}: loading, 0")
284
+ on_progress(engine_name, "loading", 0)
285
+ logger.info(
286
+ f"{self.name}: Called on_progress for {engine_name}: loading, 0"
287
+ )
274
288
  except Exception as e:
275
- logger.error(f"{self.name}: Progress callback error for {engine_name}: {e}")
289
+ logger.error(
290
+ f"{self.name}: Progress callback error for {engine_name}: {e}"
291
+ )
276
292
 
277
293
  try:
278
294
  # Run synchronous search in executor to make it async
@@ -280,9 +296,9 @@ class ScholarPipelineSearchParallel:
280
296
 
281
297
  # Prepare filters for API
282
298
  api_filters = {
283
- 'year_start': filters.get('year_start'),
284
- 'year_end': filters.get('year_end'),
285
- 'open_access': filters.get('open_access'),
299
+ "year_start": filters.get("year_start"),
300
+ "year_end": filters.get("year_end"),
301
+ "open_access": filters.get("open_access"),
286
302
  }
287
303
 
288
304
  # Search with timeout using new search_by_keywords method
@@ -290,74 +306,82 @@ class ScholarPipelineSearchParallel:
290
306
  loop.run_in_executor(
291
307
  None,
292
308
  lambda: engine.search_by_keywords(
293
- query=query,
294
- filters=api_filters,
295
- max_results=max_results
296
- )
309
+ query=query, filters=api_filters, max_results=max_results
310
+ ),
297
311
  ),
298
- timeout=self.timeout_per_engine
312
+ timeout=self.timeout_per_engine,
299
313
  )
300
314
 
301
315
  # Convert result dicts to Paper objects
302
316
  results = []
303
- for result in (results_list or []):
317
+ for result in results_list or []:
304
318
  paper = Paper()
305
319
 
306
320
  # Populate paper metadata from result
307
- if 'id' in result:
308
- if result['id'].get('doi'):
309
- paper.metadata.id.doi = result['id']['doi']
310
- paper.metadata.id.doi_engines = result['id'].get('doi_engines', [])
311
- if result['id'].get('pmid'):
312
- paper.metadata.id.pmid = result['id']['pmid']
313
- if result['id'].get('arxiv'):
314
- paper.metadata.id.arxiv_id = result['id']['arxiv']
315
-
316
- if 'basic' in result:
317
- if result['basic'].get('title'):
318
- paper.metadata.basic.title = result['basic']['title']
319
- if result['basic'].get('authors'):
320
- paper.metadata.basic.authors = result['basic']['authors']
321
- if result['basic'].get('abstract'):
322
- paper.metadata.basic.abstract = result['basic']['abstract']
323
- if result['basic'].get('keywords'):
324
- paper.metadata.basic.keywords = result['basic']['keywords']
325
-
326
- if 'publication' in result:
327
- if result['publication'].get('year'):
328
- paper.metadata.basic.year = result['publication']['year']
329
- if result['publication'].get('journal'):
330
- paper.metadata.publication.journal = result['publication']['journal']
331
-
332
- if 'metrics' in result:
333
- if result['metrics'].get('citation_count'):
334
- paper.metadata.citation_count.total = result['metrics']['citation_count']
335
- if 'is_open_access' in result['metrics']:
336
- paper.metadata.access.is_open_access = result['metrics']['is_open_access']
321
+ if "id" in result:
322
+ if result["id"].get("doi"):
323
+ paper.metadata.id.doi = result["id"]["doi"]
324
+ paper.metadata.id.doi_engines = result["id"].get(
325
+ "doi_engines", []
326
+ )
327
+ if result["id"].get("pmid"):
328
+ paper.metadata.id.pmid = result["id"]["pmid"]
329
+ if result["id"].get("arxiv"):
330
+ paper.metadata.id.arxiv_id = result["id"]["arxiv"]
331
+
332
+ if "basic" in result:
333
+ if result["basic"].get("title"):
334
+ paper.metadata.basic.title = result["basic"]["title"]
335
+ if result["basic"].get("authors"):
336
+ paper.metadata.basic.authors = result["basic"]["authors"]
337
+ if result["basic"].get("abstract"):
338
+ paper.metadata.basic.abstract = result["basic"]["abstract"]
339
+ if result["basic"].get("keywords"):
340
+ paper.metadata.basic.keywords = result["basic"]["keywords"]
341
+
342
+ if "publication" in result:
343
+ if result["publication"].get("year"):
344
+ paper.metadata.basic.year = result["publication"]["year"]
345
+ if result["publication"].get("journal"):
346
+ paper.metadata.publication.journal = result["publication"][
347
+ "journal"
348
+ ]
349
+
350
+ if "metrics" in result:
351
+ if result["metrics"].get("citation_count"):
352
+ paper.metadata.citation_count.total = result["metrics"][
353
+ "citation_count"
354
+ ]
355
+ if "is_open_access" in result["metrics"]:
356
+ paper.metadata.access.is_open_access = result["metrics"][
357
+ "is_open_access"
358
+ ]
337
359
  paper.metadata.access.is_open_access_engines = [engine_name]
338
360
 
339
- if 'urls' in result:
340
- if result['urls'].get('pdf'):
361
+ if "urls" in result:
362
+ if result["urls"].get("pdf"):
341
363
  # pdfs is a list of dicts with url/source keys
342
- paper.metadata.url.pdfs = [{'url': result['urls']['pdf'], 'source': 'search'}]
364
+ paper.metadata.url.pdfs = [
365
+ {"url": result["urls"]["pdf"], "source": "search"}
366
+ ]
343
367
  # If this is an open access paper, also store the PDF URL as oa_url
344
368
  if paper.metadata.access.is_open_access:
345
- paper.metadata.access.oa_url = result['urls']['pdf']
369
+ paper.metadata.access.oa_url = result["urls"]["pdf"]
346
370
  paper.metadata.access.oa_url_engines = [engine_name]
347
- if result['urls'].get('publisher'):
348
- paper.metadata.url.publisher = result['urls']['publisher']
349
- if result['urls'].get('doi_url'):
350
- paper.metadata.url.doi = result['urls']['doi_url']
371
+ if result["urls"].get("publisher"):
372
+ paper.metadata.url.publisher = result["urls"]["publisher"]
373
+ if result["urls"].get("doi_url"):
374
+ paper.metadata.url.doi = result["urls"]["doi_url"]
351
375
 
352
376
  results.append(paper)
353
377
 
354
378
  # Update stats
355
379
  response_time = (datetime.now() - engine_start).total_seconds()
356
- stats = self.stats['engine_stats'][engine_name]
357
- n = stats['attempts']
358
- stats['avg_response_time'] = (
359
- (stats['avg_response_time'] * (n - 1) + response_time) / n
360
- )
380
+ stats = self.stats["engine_stats"][engine_name]
381
+ n = stats["attempts"]
382
+ stats["avg_response_time"] = (
383
+ stats["avg_response_time"] * (n - 1) + response_time
384
+ ) / n
361
385
 
362
386
  # Store engine count
363
387
  if engine_counts is not None:
@@ -366,10 +390,14 @@ class ScholarPipelineSearchParallel:
366
390
  # Notify completion
367
391
  if on_progress:
368
392
  try:
369
- on_progress(engine_name, 'completed', len(results))
370
- logger.info(f"{self.name}: Called on_progress for {engine_name}: completed, {len(results)}")
393
+ on_progress(engine_name, "completed", len(results))
394
+ logger.info(
395
+ f"{self.name}: Called on_progress for {engine_name}: completed, {len(results)}"
396
+ )
371
397
  except Exception as e:
372
- logger.error(f"{self.name}: Progress callback error for {engine_name}: {e}")
398
+ logger.error(
399
+ f"{self.name}: Progress callback error for {engine_name}: {e}"
400
+ )
373
401
 
374
402
  logger.info(
375
403
  f"{self.name}: {engine_name} returned {len(results)} results "
@@ -379,22 +407,27 @@ class ScholarPipelineSearchParallel:
379
407
  return results
380
408
 
381
409
  except asyncio.TimeoutError:
382
- logger.warning(f"{self.name}: {engine_name} timed out after {self.timeout_per_engine}s")
410
+ logger.warning(
411
+ f"{self.name}: {engine_name} timed out after {self.timeout_per_engine}s"
412
+ )
383
413
  # Notify error
384
414
  if on_progress:
385
415
  try:
386
- on_progress(engine_name, 'error', 0)
416
+ on_progress(engine_name, "error", 0)
387
417
  except Exception:
388
418
  pass
389
419
  return []
390
420
  except Exception as e:
391
421
  logger.error(f"{self.name}: {engine_name} search failed: {e}")
392
422
  import traceback
393
- logger.error(f"{self.name}: {engine_name} traceback:\n{traceback.format_exc()}")
423
+
424
+ logger.error(
425
+ f"{self.name}: {engine_name} traceback:\n{traceback.format_exc()}"
426
+ )
394
427
  # Notify error
395
428
  if on_progress:
396
429
  try:
397
- on_progress(engine_name, 'error', 0)
430
+ on_progress(engine_name, "error", 0)
398
431
  except Exception:
399
432
  pass
400
433
  return []
@@ -411,12 +444,16 @@ class ScholarPipelineSearchParallel:
411
444
  enriched = 0
412
445
  for paper in papers:
413
446
  # Skip if already has citations
414
- if hasattr(paper.metadata, 'citation_count') and paper.metadata.citation_count.total and paper.metadata.citation_count.total > 0:
447
+ if (
448
+ hasattr(paper.metadata, "citation_count")
449
+ and paper.metadata.citation_count.total
450
+ and paper.metadata.citation_count.total > 0
451
+ ):
415
452
  continue
416
453
 
417
454
  # Try to enrich via DOI using OpenAlex (fastest)
418
455
  doi = None
419
- if hasattr(paper.metadata, 'id') and paper.metadata.id.doi:
456
+ if hasattr(paper.metadata, "id") and paper.metadata.id.doi:
420
457
  doi = paper.metadata.id.doi
421
458
 
422
459
  if doi:
@@ -426,13 +463,15 @@ class ScholarPipelineSearchParallel:
426
463
  result = await asyncio.wait_for(
427
464
  loop.run_in_executor(
428
465
  None,
429
- lambda: self.engines['OpenAlex'].get_metadata_by_doi(doi)
466
+ lambda: self.engines["OpenAlex"].get_metadata_by_doi(doi),
430
467
  ),
431
- timeout=2.0 # Quick timeout for enrichment
468
+ timeout=2.0, # Quick timeout for enrichment
432
469
  )
433
470
 
434
- if result and result.get('metrics', {}).get('citation_count'):
435
- paper.metadata.citation_count.total = result['metrics']['citation_count']
471
+ if result and result.get("metrics", {}).get("citation_count"):
472
+ paper.metadata.citation_count.total = result["metrics"][
473
+ "citation_count"
474
+ ]
436
475
  enriched += 1
437
476
 
438
477
  except asyncio.TimeoutError:
@@ -461,23 +500,33 @@ class ScholarPipelineSearchParallel:
461
500
 
462
501
  for paper in papers:
463
502
  # Skip if already has impact factor
464
- if hasattr(paper.metadata, 'publication') and paper.metadata.publication.impact_factor:
503
+ if (
504
+ hasattr(paper.metadata, "publication")
505
+ and paper.metadata.publication.impact_factor
506
+ ):
465
507
  continue
466
508
 
467
509
  # Get journal name
468
510
  journal = None
469
- if hasattr(paper.metadata, 'publication') and paper.metadata.publication.journal:
511
+ if (
512
+ hasattr(paper.metadata, "publication")
513
+ and paper.metadata.publication.journal
514
+ ):
470
515
  journal = paper.metadata.publication.journal
471
516
 
472
517
  if journal:
473
518
  try:
474
519
  metrics = engine.get_metrics(journal)
475
- if metrics and metrics.get('impact_factor'):
476
- paper.metadata.publication.impact_factor = metrics['impact_factor']
477
- if not hasattr(paper.metadata.publication, 'impact_factor_engines'):
520
+ if metrics and metrics.get("impact_factor"):
521
+ paper.metadata.publication.impact_factor = metrics[
522
+ "impact_factor"
523
+ ]
524
+ if not hasattr(
525
+ paper.metadata.publication, "impact_factor_engines"
526
+ ):
478
527
  paper.metadata.publication.impact_factor_engines = []
479
528
  paper.metadata.publication.impact_factor_engines.append(
480
- metrics.get('source', 'ImpactFactorEngine')
529
+ metrics.get("source", "ImpactFactorEngine")
481
530
  )
482
531
  enriched += 1
483
532
  except Exception:
@@ -488,7 +537,9 @@ class ScholarPipelineSearchParallel:
488
537
 
489
538
  return papers
490
539
 
491
- def _apply_threshold_filters(self, papers: List[Paper], filters: Dict[str, Any]) -> List[Paper]:
540
+ def _apply_threshold_filters(
541
+ self, papers: List[Paper], filters: Dict[str, Any]
542
+ ) -> List[Paper]:
492
543
  """Apply threshold filters to papers.
493
544
 
494
545
  Args:
@@ -504,56 +555,67 @@ class ScholarPipelineSearchParallel:
504
555
  """
505
556
  filtered_papers = []
506
557
  filter_stats = {
507
- 'min_year': 0,
508
- 'max_year': 0,
509
- 'min_citations': 0,
510
- 'min_impact_factor': 0
558
+ "min_year": 0,
559
+ "max_year": 0,
560
+ "min_citations": 0,
561
+ "min_impact_factor": 0,
511
562
  }
512
563
 
513
564
  for paper in papers:
514
565
  # Check year range
515
- if 'min_year' in filters:
566
+ if "min_year" in filters:
516
567
  try:
517
- min_year = int(filters['min_year'])
518
- year = paper.metadata.basic.year if hasattr(paper.metadata, 'basic') else None
568
+ min_year = int(filters["min_year"])
569
+ year = (
570
+ paper.metadata.basic.year
571
+ if hasattr(paper.metadata, "basic")
572
+ else None
573
+ )
519
574
  if not year or year < min_year:
520
- filter_stats['min_year'] += 1
575
+ filter_stats["min_year"] += 1
521
576
  continue
522
577
  except (ValueError, AttributeError):
523
578
  pass
524
579
 
525
- if 'max_year' in filters:
580
+ if "max_year" in filters:
526
581
  try:
527
- max_year = int(filters['max_year'])
528
- year = paper.metadata.basic.year if hasattr(paper.metadata, 'basic') else None
582
+ max_year = int(filters["max_year"])
583
+ year = (
584
+ paper.metadata.basic.year
585
+ if hasattr(paper.metadata, "basic")
586
+ else None
587
+ )
529
588
  if not year or year > max_year:
530
- filter_stats['max_year'] += 1
589
+ filter_stats["max_year"] += 1
531
590
  continue
532
591
  except (ValueError, AttributeError):
533
592
  pass
534
593
 
535
594
  # Check minimum citations
536
- if 'min_citations' in filters:
595
+ if "min_citations" in filters:
537
596
  try:
538
- min_citations = int(filters['min_citations'])
597
+ min_citations = int(filters["min_citations"])
539
598
  citations = 0
540
- if hasattr(paper.metadata, 'citation_count'):
599
+ if hasattr(paper.metadata, "citation_count"):
541
600
  citations = paper.metadata.citation_count.total or 0
542
601
  if citations < min_citations:
543
- filter_stats['min_citations'] += 1
602
+ filter_stats["min_citations"] += 1
544
603
  continue
545
604
  except (ValueError, AttributeError):
546
605
  pass
547
606
 
548
607
  # Check minimum impact factor
549
- if 'min_impact_factor' in filters:
608
+ if "min_impact_factor" in filters:
550
609
  try:
551
- min_if = float(filters['min_impact_factor'])
610
+ min_if = float(filters["min_impact_factor"])
552
611
  impact_factor = 0.0
553
- if hasattr(paper.metadata, 'publication') and paper.metadata.publication.impact_factor:
612
+ if (
613
+ hasattr(paper.metadata, "publication")
614
+ and paper.metadata.publication.impact_factor
615
+ ):
554
616
  impact_factor = paper.metadata.publication.impact_factor or 0.0
555
617
  if impact_factor < min_if:
556
- filter_stats['min_impact_factor'] += 1
618
+ filter_stats["min_impact_factor"] += 1
557
619
  continue
558
620
  except (ValueError, AttributeError):
559
621
  pass
@@ -564,7 +626,11 @@ class ScholarPipelineSearchParallel:
564
626
  # Log filter statistics
565
627
  total_filtered = sum(filter_stats.values())
566
628
  if total_filtered > 0:
567
- filter_msgs = [f"{count} by {name}" for name, count in filter_stats.items() if count > 0]
629
+ filter_msgs = [
630
+ f"{count} by {name}"
631
+ for name, count in filter_stats.items()
632
+ if count > 0
633
+ ]
568
634
  logger.info(
569
635
  f"{self.name}: Filtered {total_filtered} papers ({', '.join(filter_msgs)}), "
570
636
  f"{len(filtered_papers)} remain"
@@ -572,7 +638,9 @@ class ScholarPipelineSearchParallel:
572
638
 
573
639
  return filtered_papers
574
640
 
575
- def _sort_papers(self, papers: List[Paper], sort_by: str, sort_order: str = 'desc') -> List[Paper]:
641
+ def _sort_papers(
642
+ self, papers: List[Paper], sort_by: str, sort_order: str = "desc"
643
+ ) -> List[Paper]:
576
644
  """Sort papers by specified criteria (supports multi-level sorting).
577
645
 
578
646
  Args:
@@ -588,12 +656,12 @@ class ScholarPipelineSearchParallel:
588
656
  # Parse sort criteria (supports both old single format and new multi-level format)
589
657
  sort_criteria = []
590
658
 
591
- if ',' in sort_by:
659
+ if "," in sort_by:
592
660
  # Multi-level sorting: "citations:desc,year:desc,title:asc"
593
- for criterion in sort_by.split(','):
661
+ for criterion in sort_by.split(","):
594
662
  criterion = criterion.strip()
595
- if ':' in criterion:
596
- field, order = criterion.split(':', 1)
663
+ if ":" in criterion:
664
+ field, order = criterion.split(":", 1)
597
665
  sort_criteria.append((field.strip(), order.strip()))
598
666
  else:
599
667
  sort_criteria.append((criterion, sort_order))
@@ -603,20 +671,23 @@ class ScholarPipelineSearchParallel:
603
671
 
604
672
  def get_sort_value(paper, field):
605
673
  """Get sortable value for a specific field."""
606
- if field == 'citations':
607
- if hasattr(paper.metadata, 'citation_count'):
674
+ if field == "citations":
675
+ if hasattr(paper.metadata, "citation_count"):
608
676
  return paper.metadata.citation_count.total or 0
609
677
  return 0
610
- elif field == 'year':
611
- if hasattr(paper.metadata, 'basic'):
678
+ elif field == "year":
679
+ if hasattr(paper.metadata, "basic"):
612
680
  return paper.metadata.basic.year or 0
613
681
  return 0
614
- elif field == 'title':
615
- if hasattr(paper.metadata, 'basic'):
616
- return (paper.metadata.basic.title or '').lower()
617
- return ''
618
- elif field == 'impact_factor':
619
- if hasattr(paper.metadata, 'publication') and paper.metadata.publication.impact_factor:
682
+ elif field == "title":
683
+ if hasattr(paper.metadata, "basic"):
684
+ return (paper.metadata.basic.title or "").lower()
685
+ return ""
686
+ elif field == "impact_factor":
687
+ if (
688
+ hasattr(paper.metadata, "publication")
689
+ and paper.metadata.publication.impact_factor
690
+ ):
620
691
  return paper.metadata.publication.impact_factor or 0
621
692
  return 0
622
693
  return 0
@@ -627,7 +698,7 @@ class ScholarPipelineSearchParallel:
627
698
  for field, order in sort_criteria:
628
699
  value = get_sort_value(paper, field)
629
700
  # Negate numeric values for descending order (so higher values come first)
630
- if order == 'desc' and isinstance(value, (int, float)):
701
+ if order == "desc" and isinstance(value, (int, float)):
631
702
  value = -value
632
703
  # For strings, we'll handle reverse in the sorted() call
633
704
  key_tuple.append(value)
@@ -635,28 +706,32 @@ class ScholarPipelineSearchParallel:
635
706
 
636
707
  # Sort by the multi-level key
637
708
  # String fields need special handling for desc order
638
- has_string_fields = any(field in ['title'] for field, _ in sort_criteria)
709
+ has_string_fields = any(field in ["title"] for field, _ in sort_criteria)
639
710
 
640
711
  if has_string_fields:
641
712
  # Use multiple sorted() passes for mixed numeric/string fields (stable sort)
642
713
  sorted_papers = papers[:]
643
714
  for field, order in reversed(sort_criteria):
644
- reverse = (order == 'desc')
715
+ reverse = order == "desc"
645
716
  sorted_papers = sorted(
646
717
  sorted_papers,
647
718
  key=lambda p: get_sort_value(p, field),
648
- reverse=reverse
719
+ reverse=reverse,
649
720
  )
650
721
  else:
651
722
  # Pure numeric sorting can use single pass
652
723
  sorted_papers = sorted(papers, key=get_sort_key)
653
724
 
654
725
  if len(sort_criteria) > 1:
655
- criteria_str = ', then by '.join([f"{field} ({order})" for field, order in sort_criteria])
726
+ criteria_str = ", then by ".join(
727
+ [f"{field} ({order})" for field, order in sort_criteria]
728
+ )
656
729
  logger.info(f"{self.name}: Sorted {len(papers)} papers by {criteria_str}")
657
730
  else:
658
731
  field, order = sort_criteria[0]
659
- logger.info(f"{self.name}: Sorted {len(papers)} papers by {field} ({order})")
732
+ logger.info(
733
+ f"{self.name}: Sorted {len(papers)} papers by {field} ({order})"
734
+ )
660
735
 
661
736
  return sorted_papers
662
737
 
@@ -669,12 +744,12 @@ class ScholarPipelineSearchParallel:
669
744
  for paper in papers:
670
745
  # Get DOI
671
746
  doi = None
672
- if hasattr(paper, 'metadata') and hasattr(paper.metadata, 'id'):
747
+ if hasattr(paper, "metadata") and hasattr(paper.metadata, "id"):
673
748
  doi = paper.metadata.id.doi
674
749
 
675
750
  # Get title
676
751
  title = None
677
- if hasattr(paper, 'metadata') and hasattr(paper.metadata, 'basic'):
752
+ if hasattr(paper, "metadata") and hasattr(paper.metadata, "basic"):
678
753
  title = paper.metadata.basic.title
679
754
 
680
755
  # Skip if duplicate
@@ -700,67 +775,69 @@ class ScholarPipelineSearchParallel:
700
775
  def _paper_to_dict(self, paper: Paper) -> Dict[str, Any]:
701
776
  """Convert Paper object to dictionary for API response."""
702
777
  result = {
703
- 'title': '',
704
- 'authors': [],
705
- 'year': None,
706
- 'abstract': '',
707
- 'journal': '',
708
- 'impact_factor': None,
709
- 'doi': '',
710
- 'pmid': '',
711
- 'arxiv_id': '',
712
- 'citation_count': 0,
713
- 'is_open_access': False,
714
- 'pdf_url': '',
715
- 'external_url': '',
716
- 'document_type': 'article',
717
- 'keywords': [],
718
- 'source_engines': [],
778
+ "title": "",
779
+ "authors": [],
780
+ "year": None,
781
+ "abstract": "",
782
+ "journal": "",
783
+ "impact_factor": None,
784
+ "doi": "",
785
+ "pmid": "",
786
+ "arxiv_id": "",
787
+ "citation_count": 0,
788
+ "is_open_access": False,
789
+ "pdf_url": "",
790
+ "external_url": "",
791
+ "document_type": "article",
792
+ "keywords": [],
793
+ "source_engines": [],
719
794
  }
720
795
 
721
- if not hasattr(paper, 'metadata'):
796
+ if not hasattr(paper, "metadata"):
722
797
  return result
723
798
 
724
799
  meta = paper.metadata
725
800
 
726
801
  # Basic info
727
- if hasattr(meta, 'basic'):
728
- result['title'] = meta.basic.title or ''
729
- result['authors'] = meta.basic.authors or []
730
- result['abstract'] = meta.basic.abstract or ''
731
- result['keywords'] = meta.basic.keywords or []
732
- result['year'] = meta.basic.year
802
+ if hasattr(meta, "basic"):
803
+ result["title"] = meta.basic.title or ""
804
+ result["authors"] = meta.basic.authors or []
805
+ result["abstract"] = meta.basic.abstract or ""
806
+ result["keywords"] = meta.basic.keywords or []
807
+ result["year"] = meta.basic.year
733
808
 
734
809
  # IDs
735
- if hasattr(meta, 'id'):
736
- result['doi'] = meta.id.doi or ''
737
- result['pmid'] = meta.id.pmid or ''
738
- result['arxiv_id'] = meta.id.arxiv_id or ''
739
- result['source_engines'] = meta.id.doi_engines or []
810
+ if hasattr(meta, "id"):
811
+ result["doi"] = meta.id.doi or ""
812
+ result["pmid"] = meta.id.pmid or ""
813
+ result["arxiv_id"] = meta.id.arxiv_id or ""
814
+ result["source_engines"] = meta.id.doi_engines or []
740
815
 
741
816
  # Publication info
742
- if hasattr(meta, 'publication'):
743
- journal_raw = meta.publication.journal or ''
744
- result['journal'] = normalize_journal_name(journal_raw) if journal_raw else ''
745
- result['impact_factor'] = meta.publication.impact_factor
817
+ if hasattr(meta, "publication"):
818
+ journal_raw = meta.publication.journal or ""
819
+ result["journal"] = (
820
+ normalize_journal_name(journal_raw) if journal_raw else ""
821
+ )
822
+ result["impact_factor"] = meta.publication.impact_factor
746
823
 
747
824
  # Metrics
748
- if hasattr(meta, 'citation_count'):
749
- result['citation_count'] = meta.citation_count.total or 0
825
+ if hasattr(meta, "citation_count"):
826
+ result["citation_count"] = meta.citation_count.total or 0
750
827
 
751
828
  # Access metadata
752
- if hasattr(meta, 'access'):
753
- result['is_open_access'] = meta.access.is_open_access or False
754
- result['oa_status'] = meta.access.oa_status
755
- result['oa_url'] = meta.access.oa_url
829
+ if hasattr(meta, "access"):
830
+ result["is_open_access"] = meta.access.is_open_access or False
831
+ result["oa_status"] = meta.access.oa_status
832
+ result["oa_url"] = meta.access.oa_url
756
833
  else:
757
- result['is_open_access'] = False
834
+ result["is_open_access"] = False
758
835
 
759
836
  # URLs
760
- if hasattr(meta, 'url'):
837
+ if hasattr(meta, "url"):
761
838
  # Extract first PDF URL from pdfs list
762
- result['pdf_url'] = meta.url.pdfs[0]['url'] if meta.url.pdfs else ''
763
- result['external_url'] = meta.url.publisher or meta.url.doi or ''
839
+ result["pdf_url"] = meta.url.pdfs[0]["url"] if meta.url.pdfs else ""
840
+ result["external_url"] = meta.url.publisher or meta.url.doi or ""
764
841
 
765
842
  return result
766
843
 
@@ -768,13 +845,15 @@ class ScholarPipelineSearchParallel:
768
845
  """Get pipeline statistics."""
769
846
  return {
770
847
  **self.stats,
771
- 'success_rate': (
772
- 100 * self.stats['successful_searches'] / self.stats['total_searches']
773
- if self.stats['total_searches'] > 0 else 0
848
+ "success_rate": (
849
+ 100 * self.stats["successful_searches"] / self.stats["total_searches"]
850
+ if self.stats["total_searches"] > 0
851
+ else 0
774
852
  ),
775
- 'average_time': (
776
- self.stats['total_time'] / self.stats['successful_searches']
777
- if self.stats['successful_searches'] > 0 else 0
853
+ "average_time": (
854
+ self.stats["total_time"] / self.stats["successful_searches"]
855
+ if self.stats["successful_searches"] > 0
856
+ else 0
778
857
  ),
779
858
  }
780
859
 
@@ -784,12 +863,12 @@ class ScholarPipelineSearchParallel:
784
863
  return {}
785
864
 
786
865
  return {
787
- 'name': engine_name,
788
- 'supports_query_search': True,
789
- 'supports_doi_lookup': True,
790
- 'supports_filters': True,
791
- 'max_results': 1000,
792
- 'stats': self.stats['engine_stats'].get(engine_name, {}),
866
+ "name": engine_name,
867
+ "supports_query_search": True,
868
+ "supports_doi_lookup": True,
869
+ "supports_filters": True,
870
+ "max_results": 1000,
871
+ "stats": self.stats["engine_stats"].get(engine_name, {}),
793
872
  }
794
873
 
795
874