scitex 2.0.0__py2.py3-none-any.whl → 2.1.0__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (704)
  1. scitex/__init__.py +53 -15
  2. scitex/__main__.py +72 -26
  3. scitex/__version__.py +1 -1
  4. scitex/_sh.py +145 -23
  5. scitex/ai/__init__.py +30 -16
  6. scitex/ai/_gen_ai/_Anthropic.py +5 -7
  7. scitex/ai/_gen_ai/_BaseGenAI.py +2 -2
  8. scitex/ai/_gen_ai/_DeepSeek.py +10 -2
  9. scitex/ai/_gen_ai/_Google.py +2 -2
  10. scitex/ai/_gen_ai/_Llama.py +2 -2
  11. scitex/ai/_gen_ai/_OpenAI.py +2 -2
  12. scitex/ai/_gen_ai/_PARAMS.py +51 -65
  13. scitex/ai/_gen_ai/_Perplexity.py +2 -2
  14. scitex/ai/_gen_ai/__init__.py +25 -14
  15. scitex/ai/_gen_ai/_format_output_func.py +4 -4
  16. scitex/ai/classification/{classifier_server.py → Classifier.py} +5 -5
  17. scitex/ai/classification/CrossValidationExperiment.py +374 -0
  18. scitex/ai/classification/__init__.py +43 -4
  19. scitex/ai/classification/reporters/_BaseClassificationReporter.py +281 -0
  20. scitex/ai/classification/reporters/_ClassificationReporter.py +773 -0
  21. scitex/ai/classification/reporters/_MultiClassificationReporter.py +406 -0
  22. scitex/ai/classification/reporters/_SingleClassificationReporter.py +1834 -0
  23. scitex/ai/classification/reporters/__init__.py +11 -0
  24. scitex/ai/classification/reporters/reporter_utils/_Plotter.py +1028 -0
  25. scitex/ai/classification/reporters/reporter_utils/__init__.py +80 -0
  26. scitex/ai/classification/reporters/reporter_utils/aggregation.py +457 -0
  27. scitex/ai/classification/reporters/reporter_utils/data_models.py +313 -0
  28. scitex/ai/classification/reporters/reporter_utils/reporting.py +1056 -0
  29. scitex/ai/classification/reporters/reporter_utils/storage.py +221 -0
  30. scitex/ai/classification/reporters/reporter_utils/validation.py +395 -0
  31. scitex/ai/classification/timeseries/_TimeSeriesBlockingSplit.py +568 -0
  32. scitex/ai/classification/timeseries/_TimeSeriesCalendarSplit.py +688 -0
  33. scitex/ai/classification/timeseries/_TimeSeriesMetadata.py +139 -0
  34. scitex/ai/classification/timeseries/_TimeSeriesSlidingWindowSplit.py +1716 -0
  35. scitex/ai/classification/timeseries/_TimeSeriesSlidingWindowSplit_v01-not-using-n_splits.py +1685 -0
  36. scitex/ai/classification/timeseries/_TimeSeriesStrategy.py +84 -0
  37. scitex/ai/classification/timeseries/_TimeSeriesStratifiedSplit.py +610 -0
  38. scitex/ai/classification/timeseries/__init__.py +39 -0
  39. scitex/ai/classification/timeseries/_normalize_timestamp.py +436 -0
  40. scitex/ai/clustering/_umap.py +2 -2
  41. scitex/ai/feature_extraction/vit.py +1 -0
  42. scitex/ai/feature_selection/__init__.py +30 -0
  43. scitex/ai/feature_selection/feature_selection.py +364 -0
  44. scitex/ai/loss/multi_task_loss.py +1 -1
  45. scitex/ai/metrics/__init__.py +51 -4
  46. scitex/ai/metrics/_calc_bacc.py +61 -0
  47. scitex/ai/metrics/_calc_bacc_from_conf_mat.py +38 -0
  48. scitex/ai/metrics/_calc_clf_report.py +78 -0
  49. scitex/ai/metrics/_calc_conf_mat.py +93 -0
  50. scitex/ai/metrics/_calc_feature_importance.py +183 -0
  51. scitex/ai/metrics/_calc_mcc.py +61 -0
  52. scitex/ai/metrics/_calc_pre_rec_auc.py +116 -0
  53. scitex/ai/metrics/_calc_roc_auc.py +110 -0
  54. scitex/ai/metrics/_calc_seizure_prediction_metrics.py +490 -0
  55. scitex/ai/metrics/{silhoute_score_block.py → _calc_silhouette_score.py} +15 -8
  56. scitex/ai/metrics/_normalize_labels.py +83 -0
  57. scitex/ai/plt/__init__.py +47 -8
  58. scitex/ai/plt/{_conf_mat.py → _plot_conf_mat.py} +158 -87
  59. scitex/ai/plt/_plot_feature_importance.py +323 -0
  60. scitex/ai/plt/_plot_learning_curve.py +345 -0
  61. scitex/ai/plt/_plot_optuna_study.py +225 -0
  62. scitex/ai/plt/_plot_pre_rec_curve.py +290 -0
  63. scitex/ai/plt/_plot_roc_curve.py +255 -0
  64. scitex/ai/training/{learning_curve_logger.py → _LearningCurveLogger.py} +197 -213
  65. scitex/ai/training/__init__.py +2 -2
  66. scitex/ai/utils/grid_search.py +3 -3
  67. scitex/benchmark/__init__.py +52 -0
  68. scitex/benchmark/benchmark.py +400 -0
  69. scitex/benchmark/monitor.py +370 -0
  70. scitex/benchmark/profiler.py +297 -0
  71. scitex/browser/__init__.py +48 -0
  72. scitex/browser/automation/CookieHandler.py +216 -0
  73. scitex/browser/automation/__init__.py +7 -0
  74. scitex/browser/collaboration/__init__.py +55 -0
  75. scitex/browser/collaboration/auth_helpers.py +94 -0
  76. scitex/browser/collaboration/collaborative_agent.py +136 -0
  77. scitex/browser/collaboration/credential_manager.py +188 -0
  78. scitex/browser/collaboration/interactive_panel.py +400 -0
  79. scitex/browser/collaboration/persistent_browser.py +170 -0
  80. scitex/browser/collaboration/shared_session.py +383 -0
  81. scitex/browser/collaboration/standard_interactions.py +246 -0
  82. scitex/browser/collaboration/visual_feedback.py +181 -0
  83. scitex/browser/core/BrowserMixin.py +326 -0
  84. scitex/browser/core/ChromeProfileManager.py +446 -0
  85. scitex/browser/core/__init__.py +9 -0
  86. scitex/browser/debugging/__init__.py +18 -0
  87. scitex/browser/debugging/_browser_logger.py +657 -0
  88. scitex/browser/debugging/_highlight_element.py +143 -0
  89. scitex/browser/debugging/_show_grid.py +154 -0
  90. scitex/browser/interaction/__init__.py +24 -0
  91. scitex/browser/interaction/click_center.py +149 -0
  92. scitex/browser/interaction/click_with_fallbacks.py +206 -0
  93. scitex/browser/interaction/close_popups.py +498 -0
  94. scitex/browser/interaction/fill_with_fallbacks.py +209 -0
  95. scitex/browser/pdf/__init__.py +14 -0
  96. scitex/browser/pdf/click_download_for_chrome_pdf_viewer.py +200 -0
  97. scitex/browser/pdf/detect_chrome_pdf_viewer.py +198 -0
  98. scitex/browser/remote/CaptchaHandler.py +434 -0
  99. scitex/browser/remote/ZenRowsAPIClient.py +347 -0
  100. scitex/browser/remote/ZenRowsBrowserManager.py +570 -0
  101. scitex/browser/remote/__init__.py +11 -0
  102. scitex/browser/stealth/HumanBehavior.py +344 -0
  103. scitex/browser/stealth/StealthManager.py +1008 -0
  104. scitex/browser/stealth/__init__.py +9 -0
  105. scitex/browser/template.py +122 -0
  106. scitex/capture/__init__.py +110 -0
  107. scitex/capture/__main__.py +25 -0
  108. scitex/capture/capture.py +848 -0
  109. scitex/capture/cli.py +233 -0
  110. scitex/capture/gif.py +344 -0
  111. scitex/capture/mcp_server.py +961 -0
  112. scitex/capture/session.py +70 -0
  113. scitex/capture/utils.py +705 -0
  114. scitex/cli/__init__.py +17 -0
  115. scitex/cli/cloud.py +447 -0
  116. scitex/cli/main.py +42 -0
  117. scitex/cli/scholar.py +280 -0
  118. scitex/context/_suppress_output.py +5 -3
  119. scitex/db/__init__.py +30 -3
  120. scitex/db/__main__.py +75 -0
  121. scitex/db/_check_health.py +381 -0
  122. scitex/db/_delete_duplicates.py +25 -386
  123. scitex/db/_inspect.py +335 -114
  124. scitex/db/_inspect_optimized.py +301 -0
  125. scitex/db/{_PostgreSQL.py → _postgresql/_PostgreSQL.py} +3 -3
  126. scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_BackupMixin.py +1 -1
  127. scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_BatchMixin.py +1 -1
  128. scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_BlobMixin.py +1 -1
  129. scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_ConnectionMixin.py +1 -1
  130. scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_MaintenanceMixin.py +1 -1
  131. scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_QueryMixin.py +1 -1
  132. scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_SchemaMixin.py +1 -1
  133. scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_TransactionMixin.py +1 -1
  134. scitex/db/_postgresql/__init__.py +6 -0
  135. scitex/db/_sqlite3/_SQLite3.py +210 -0
  136. scitex/db/_sqlite3/_SQLite3Mixins/_ArrayMixin.py +581 -0
  137. scitex/db/_sqlite3/_SQLite3Mixins/_ArrayMixin_v01-need-_hash-col.py +517 -0
  138. scitex/db/{_SQLite3Mixins → _sqlite3/_SQLite3Mixins}/_BatchMixin.py +1 -1
  139. scitex/db/_sqlite3/_SQLite3Mixins/_BlobMixin.py +281 -0
  140. scitex/db/_sqlite3/_SQLite3Mixins/_ColumnMixin.py +548 -0
  141. scitex/db/_sqlite3/_SQLite3Mixins/_ColumnMixin_v01-indentation-issues.py +583 -0
  142. scitex/db/{_SQLite3Mixins → _sqlite3/_SQLite3Mixins}/_ConnectionMixin.py +29 -13
  143. scitex/db/_sqlite3/_SQLite3Mixins/_GitMixin.py +583 -0
  144. scitex/db/{_SQLite3Mixins → _sqlite3/_SQLite3Mixins}/_ImportExportMixin.py +1 -1
  145. scitex/db/{_SQLite3Mixins → _sqlite3/_SQLite3Mixins}/_IndexMixin.py +1 -1
  146. scitex/db/{_SQLite3Mixins → _sqlite3/_SQLite3Mixins}/_MaintenanceMixin.py +2 -1
  147. scitex/db/{_SQLite3Mixins → _sqlite3/_SQLite3Mixins}/_QueryMixin.py +37 -10
  148. scitex/db/{_SQLite3Mixins → _sqlite3/_SQLite3Mixins}/_RowMixin.py +46 -6
  149. scitex/db/{_SQLite3Mixins → _sqlite3/_SQLite3Mixins}/_TableMixin.py +56 -10
  150. scitex/db/{_SQLite3Mixins → _sqlite3/_SQLite3Mixins}/_TransactionMixin.py +1 -1
  151. scitex/db/{_SQLite3Mixins → _sqlite3/_SQLite3Mixins}/__init__.py +14 -2
  152. scitex/db/_sqlite3/__init__.py +7 -0
  153. scitex/db/_sqlite3/_delete_duplicates.py +274 -0
  154. scitex/decorators/__init__.py +2 -0
  155. scitex/decorators/_cache_disk.py +13 -5
  156. scitex/decorators/_cache_disk_async.py +49 -0
  157. scitex/decorators/_deprecated.py +175 -10
  158. scitex/decorators/_timeout.py +1 -1
  159. scitex/dev/_analyze_code_flow.py +2 -2
  160. scitex/dict/_DotDict.py +73 -15
  161. scitex/dict/_DotDict_v01-not-handling-recursive-instantiations.py +442 -0
  162. scitex/dict/_DotDict_v02-not-serializing-Path-object.py +446 -0
  163. scitex/dict/__init__.py +2 -0
  164. scitex/dict/_flatten.py +27 -0
  165. scitex/dsp/_crop.py +2 -2
  166. scitex/dsp/_demo_sig.py +2 -2
  167. scitex/dsp/_detect_ripples.py +2 -2
  168. scitex/dsp/_hilbert.py +2 -2
  169. scitex/dsp/_listen.py +6 -6
  170. scitex/dsp/_modulation_index.py +2 -2
  171. scitex/dsp/_pac.py +1 -1
  172. scitex/dsp/_psd.py +2 -2
  173. scitex/dsp/_resample.py +2 -1
  174. scitex/dsp/_time.py +3 -2
  175. scitex/dsp/_wavelet.py +3 -2
  176. scitex/dsp/add_noise.py +2 -2
  177. scitex/dsp/example.py +1 -0
  178. scitex/dsp/filt.py +10 -9
  179. scitex/dsp/template.py +3 -2
  180. scitex/dsp/utils/_differential_bandpass_filters.py +1 -1
  181. scitex/dsp/utils/pac.py +2 -2
  182. scitex/dt/_normalize_timestamp.py +432 -0
  183. scitex/errors.py +572 -0
  184. scitex/gen/_DimHandler.py +2 -2
  185. scitex/gen/__init__.py +37 -7
  186. scitex/gen/_deprecated_close.py +80 -0
  187. scitex/gen/_deprecated_start.py +26 -0
  188. scitex/gen/_detect_environment.py +152 -0
  189. scitex/gen/_detect_notebook_path.py +169 -0
  190. scitex/gen/_embed.py +6 -2
  191. scitex/gen/_get_notebook_path.py +257 -0
  192. scitex/gen/_less.py +1 -1
  193. scitex/gen/_list_packages.py +2 -2
  194. scitex/gen/_norm.py +44 -9
  195. scitex/gen/_norm_cache.py +269 -0
  196. scitex/gen/_src.py +3 -5
  197. scitex/gen/_title_case.py +3 -3
  198. scitex/io/__init__.py +28 -6
  199. scitex/io/_glob.py +13 -7
  200. scitex/io/_load.py +108 -21
  201. scitex/io/_load_cache.py +303 -0
  202. scitex/io/_load_configs.py +40 -15
  203. scitex/io/{_H5Explorer.py → _load_modules/_H5Explorer.py} +80 -17
  204. scitex/io/_load_modules/_ZarrExplorer.py +114 -0
  205. scitex/io/_load_modules/_bibtex.py +207 -0
  206. scitex/io/_load_modules/_hdf5.py +53 -178
  207. scitex/io/_load_modules/_json.py +5 -3
  208. scitex/io/_load_modules/_pdf.py +871 -16
  209. scitex/io/_load_modules/_sqlite3.py +15 -0
  210. scitex/io/_load_modules/_txt.py +41 -12
  211. scitex/io/_load_modules/_yaml.py +4 -3
  212. scitex/io/_load_modules/_zarr.py +126 -0
  213. scitex/io/_save.py +429 -171
  214. scitex/io/_save_modules/__init__.py +6 -0
  215. scitex/io/_save_modules/_bibtex.py +194 -0
  216. scitex/io/_save_modules/_csv.py +8 -4
  217. scitex/io/_save_modules/_excel.py +174 -15
  218. scitex/io/_save_modules/_hdf5.py +251 -226
  219. scitex/io/_save_modules/_image.py +1 -3
  220. scitex/io/_save_modules/_json.py +49 -4
  221. scitex/io/_save_modules/_listed_dfs_as_csv.py +1 -3
  222. scitex/io/_save_modules/_listed_scalars_as_csv.py +1 -3
  223. scitex/io/_save_modules/_tex.py +277 -0
  224. scitex/io/_save_modules/_yaml.py +42 -3
  225. scitex/io/_save_modules/_zarr.py +160 -0
  226. scitex/io/utils/__init__.py +20 -0
  227. scitex/io/utils/h5_to_zarr.py +616 -0
  228. scitex/linalg/_geometric_median.py +6 -2
  229. scitex/{gen/_tee.py → logging/_Tee.py} +43 -84
  230. scitex/logging/__init__.py +122 -0
  231. scitex/logging/_config.py +158 -0
  232. scitex/logging/_context.py +103 -0
  233. scitex/logging/_formatters.py +128 -0
  234. scitex/logging/_handlers.py +64 -0
  235. scitex/logging/_levels.py +35 -0
  236. scitex/logging/_logger.py +163 -0
  237. scitex/logging/_print_capture.py +95 -0
  238. scitex/ml/__init__.py +69 -0
  239. scitex/{ai/genai/anthropic.py → ml/_gen_ai/_Anthropic.py} +13 -19
  240. scitex/{ai/genai/base_genai.py → ml/_gen_ai/_BaseGenAI.py} +5 -5
  241. scitex/{ai/genai/deepseek.py → ml/_gen_ai/_DeepSeek.py} +11 -16
  242. scitex/{ai/genai/google.py → ml/_gen_ai/_Google.py} +7 -15
  243. scitex/{ai/genai/groq.py → ml/_gen_ai/_Groq.py} +1 -8
  244. scitex/{ai/genai/llama.py → ml/_gen_ai/_Llama.py} +3 -16
  245. scitex/{ai/genai/openai.py → ml/_gen_ai/_OpenAI.py} +3 -3
  246. scitex/{ai/genai/params.py → ml/_gen_ai/_PARAMS.py} +51 -65
  247. scitex/{ai/genai/perplexity.py → ml/_gen_ai/_Perplexity.py} +3 -14
  248. scitex/ml/_gen_ai/__init__.py +43 -0
  249. scitex/{ai/genai/calc_cost.py → ml/_gen_ai/_calc_cost.py} +1 -1
  250. scitex/{ai/genai/format_output_func.py → ml/_gen_ai/_format_output_func.py} +4 -4
  251. scitex/{ai/genai/genai_factory.py → ml/_gen_ai/_genai_factory.py} +8 -8
  252. scitex/ml/activation/__init__.py +8 -0
  253. scitex/ml/activation/_define.py +11 -0
  254. scitex/{ai/classifier_server.py → ml/classification/Classifier.py} +5 -5
  255. scitex/ml/classification/CrossValidationExperiment.py +374 -0
  256. scitex/ml/classification/__init__.py +46 -0
  257. scitex/ml/classification/reporters/_BaseClassificationReporter.py +281 -0
  258. scitex/ml/classification/reporters/_ClassificationReporter.py +773 -0
  259. scitex/ml/classification/reporters/_MultiClassificationReporter.py +406 -0
  260. scitex/ml/classification/reporters/_SingleClassificationReporter.py +1834 -0
  261. scitex/ml/classification/reporters/__init__.py +11 -0
  262. scitex/ml/classification/reporters/reporter_utils/_Plotter.py +1028 -0
  263. scitex/ml/classification/reporters/reporter_utils/__init__.py +80 -0
  264. scitex/ml/classification/reporters/reporter_utils/aggregation.py +457 -0
  265. scitex/ml/classification/reporters/reporter_utils/data_models.py +313 -0
  266. scitex/ml/classification/reporters/reporter_utils/reporting.py +1056 -0
  267. scitex/ml/classification/reporters/reporter_utils/storage.py +221 -0
  268. scitex/ml/classification/reporters/reporter_utils/validation.py +395 -0
  269. scitex/ml/classification/timeseries/_TimeSeriesBlockingSplit.py +568 -0
  270. scitex/ml/classification/timeseries/_TimeSeriesCalendarSplit.py +688 -0
  271. scitex/ml/classification/timeseries/_TimeSeriesMetadata.py +139 -0
  272. scitex/ml/classification/timeseries/_TimeSeriesSlidingWindowSplit.py +1716 -0
  273. scitex/ml/classification/timeseries/_TimeSeriesSlidingWindowSplit_v01-not-using-n_splits.py +1685 -0
  274. scitex/ml/classification/timeseries/_TimeSeriesStrategy.py +84 -0
  275. scitex/ml/classification/timeseries/_TimeSeriesStratifiedSplit.py +610 -0
  276. scitex/ml/classification/timeseries/__init__.py +39 -0
  277. scitex/ml/classification/timeseries/_normalize_timestamp.py +436 -0
  278. scitex/ml/clustering/__init__.py +11 -0
  279. scitex/ml/clustering/_pca.py +115 -0
  280. scitex/ml/clustering/_umap.py +376 -0
  281. scitex/ml/feature_extraction/__init__.py +56 -0
  282. scitex/ml/feature_extraction/vit.py +149 -0
  283. scitex/ml/feature_selection/__init__.py +30 -0
  284. scitex/ml/feature_selection/feature_selection.py +364 -0
  285. scitex/ml/loss/_L1L2Losses.py +34 -0
  286. scitex/ml/loss/__init__.py +12 -0
  287. scitex/ml/loss/multi_task_loss.py +47 -0
  288. scitex/ml/metrics/__init__.py +56 -0
  289. scitex/ml/metrics/_calc_bacc.py +61 -0
  290. scitex/ml/metrics/_calc_bacc_from_conf_mat.py +38 -0
  291. scitex/ml/metrics/_calc_clf_report.py +78 -0
  292. scitex/ml/metrics/_calc_conf_mat.py +93 -0
  293. scitex/ml/metrics/_calc_feature_importance.py +183 -0
  294. scitex/ml/metrics/_calc_mcc.py +61 -0
  295. scitex/ml/metrics/_calc_pre_rec_auc.py +116 -0
  296. scitex/ml/metrics/_calc_roc_auc.py +110 -0
  297. scitex/ml/metrics/_calc_seizure_prediction_metrics.py +490 -0
  298. scitex/ml/metrics/_calc_silhouette_score.py +503 -0
  299. scitex/ml/metrics/_normalize_labels.py +83 -0
  300. scitex/ml/optim/Ranger_Deep_Learning_Optimizer/__init__.py +0 -0
  301. scitex/ml/optim/Ranger_Deep_Learning_Optimizer/ranger/__init__.py +3 -0
  302. scitex/ml/optim/Ranger_Deep_Learning_Optimizer/ranger/ranger.py +207 -0
  303. scitex/ml/optim/Ranger_Deep_Learning_Optimizer/ranger/ranger2020.py +238 -0
  304. scitex/ml/optim/Ranger_Deep_Learning_Optimizer/ranger/ranger913A.py +215 -0
  305. scitex/ml/optim/Ranger_Deep_Learning_Optimizer/ranger/rangerqh.py +184 -0
  306. scitex/ml/optim/Ranger_Deep_Learning_Optimizer/setup.py +24 -0
  307. scitex/ml/optim/__init__.py +13 -0
  308. scitex/ml/optim/_get_set.py +31 -0
  309. scitex/ml/optim/_optimizers.py +71 -0
  310. scitex/ml/plt/__init__.py +60 -0
  311. scitex/ml/plt/_plot_conf_mat.py +663 -0
  312. scitex/ml/plt/_plot_feature_importance.py +323 -0
  313. scitex/ml/plt/_plot_learning_curve.py +345 -0
  314. scitex/ml/plt/_plot_optuna_study.py +225 -0
  315. scitex/ml/plt/_plot_pre_rec_curve.py +290 -0
  316. scitex/ml/plt/_plot_roc_curve.py +255 -0
  317. scitex/ml/sk/__init__.py +11 -0
  318. scitex/ml/sk/_clf.py +58 -0
  319. scitex/ml/sk/_to_sktime.py +100 -0
  320. scitex/ml/sklearn/__init__.py +26 -0
  321. scitex/ml/sklearn/clf.py +58 -0
  322. scitex/ml/sklearn/to_sktime.py +100 -0
  323. scitex/{ai/training/early_stopping.py → ml/training/_EarlyStopping.py} +1 -2
  324. scitex/{ai → ml/training}/_LearningCurveLogger.py +198 -242
  325. scitex/ml/training/__init__.py +7 -0
  326. scitex/ml/utils/__init__.py +22 -0
  327. scitex/ml/utils/_check_params.py +50 -0
  328. scitex/ml/utils/_default_dataset.py +46 -0
  329. scitex/ml/utils/_format_samples_for_sktime.py +26 -0
  330. scitex/ml/utils/_label_encoder.py +134 -0
  331. scitex/ml/utils/_merge_labels.py +22 -0
  332. scitex/ml/utils/_sliding_window_data_augmentation.py +11 -0
  333. scitex/ml/utils/_under_sample.py +51 -0
  334. scitex/ml/utils/_verify_n_gpus.py +16 -0
  335. scitex/ml/utils/grid_search.py +148 -0
  336. scitex/nn/_BNet.py +15 -9
  337. scitex/nn/_Filters.py +2 -2
  338. scitex/nn/_ModulationIndex.py +2 -2
  339. scitex/nn/_PAC.py +1 -1
  340. scitex/nn/_Spectrogram.py +12 -3
  341. scitex/nn/__init__.py +9 -10
  342. scitex/path/__init__.py +18 -0
  343. scitex/path/_clean.py +4 -0
  344. scitex/path/_find.py +9 -4
  345. scitex/path/_symlink.py +348 -0
  346. scitex/path/_version.py +4 -3
  347. scitex/pd/__init__.py +2 -0
  348. scitex/pd/_get_unique.py +99 -0
  349. scitex/plt/__init__.py +114 -5
  350. scitex/plt/_subplots/_AxesWrapper.py +1 -3
  351. scitex/plt/_subplots/_AxisWrapper.py +7 -3
  352. scitex/plt/_subplots/_AxisWrapperMixins/_AdjustmentMixin.py +47 -13
  353. scitex/plt/_subplots/_AxisWrapperMixins/_MatplotlibPlotMixin.py +160 -2
  354. scitex/plt/_subplots/_AxisWrapperMixins/_SeabornMixin.py +26 -4
  355. scitex/plt/_subplots/_AxisWrapperMixins/_UnitAwareMixin.py +322 -0
  356. scitex/plt/_subplots/_AxisWrapperMixins/__init__.py +1 -0
  357. scitex/plt/_subplots/_FigWrapper.py +62 -6
  358. scitex/plt/_subplots/_export_as_csv.py +43 -27
  359. scitex/plt/_subplots/_export_as_csv_formatters/__init__.py +5 -4
  360. scitex/plt/_subplots/_export_as_csv_formatters/_format_annotate.py +81 -0
  361. scitex/plt/_subplots/_export_as_csv_formatters/_format_bar.py +1 -3
  362. scitex/plt/_subplots/_export_as_csv_formatters/_format_barh.py +20 -5
  363. scitex/plt/_subplots/_export_as_csv_formatters/_format_boxplot.py +1 -3
  364. scitex/plt/_subplots/_export_as_csv_formatters/_format_contour.py +1 -3
  365. scitex/plt/_subplots/_export_as_csv_formatters/_format_errorbar.py +35 -18
  366. scitex/plt/_subplots/_export_as_csv_formatters/_format_eventplot.py +1 -3
  367. scitex/plt/_subplots/_export_as_csv_formatters/_format_fill.py +1 -3
  368. scitex/plt/_subplots/_export_as_csv_formatters/_format_fill_between.py +1 -3
  369. scitex/plt/_subplots/_export_as_csv_formatters/_format_hist.py +1 -3
  370. scitex/plt/_subplots/_export_as_csv_formatters/_format_imshow.py +1 -3
  371. scitex/plt/_subplots/_export_as_csv_formatters/_format_imshow2d.py +1 -3
  372. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot.py +15 -3
  373. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_box.py +1 -3
  374. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_conf_mat.py +1 -3
  375. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_ecdf.py +1 -3
  376. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_fillv.py +1 -3
  377. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_heatmap.py +1 -3
  378. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_image.py +1 -3
  379. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_joyplot.py +1 -3
  380. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_kde.py +1 -3
  381. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_line.py +1 -3
  382. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_mean_ci.py +1 -3
  383. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_mean_std.py +1 -3
  384. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_median_iqr.py +1 -3
  385. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_raster.py +1 -3
  386. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_rectangle.py +1 -3
  387. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_scatter.py +35 -0
  388. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_scatter_hist.py +1 -3
  389. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_shaded_line.py +1 -3
  390. scitex/plt/_subplots/_export_as_csv_formatters/_format_plot_violin.py +1 -3
  391. scitex/plt/_subplots/_export_as_csv_formatters/_format_scatter.py +6 -4
  392. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_barplot.py +1 -3
  393. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_boxplot.py +1 -3
  394. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_heatmap.py +1 -3
  395. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_histplot.py +1 -3
  396. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_jointplot.py +1 -3
  397. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_kdeplot.py +1 -3
  398. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_lineplot.py +1 -3
  399. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_pairplot.py +1 -3
  400. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_scatterplot.py +1 -3
  401. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_stripplot.py +1 -3
  402. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_swarmplot.py +1 -3
  403. scitex/plt/_subplots/_export_as_csv_formatters/_format_sns_violinplot.py +1 -3
  404. scitex/plt/_subplots/_export_as_csv_formatters/_format_text.py +60 -0
  405. scitex/plt/_subplots/_export_as_csv_formatters/_format_violin.py +1 -3
  406. scitex/plt/_subplots/_export_as_csv_formatters/_format_violinplot.py +1 -3
  407. scitex/plt/_subplots/_export_as_csv_formatters/test_formatters.py +1 -3
  408. scitex/plt/_subplots/_export_as_csv_formatters.py +56 -59
  409. scitex/plt/ax/_style/_hide_spines.py +1 -3
  410. scitex/plt/ax/_style/_rotate_labels.py +180 -76
  411. scitex/plt/ax/_style/_rotate_labels_v01.py +248 -0
  412. scitex/plt/ax/_style/_set_meta.py +11 -4
  413. scitex/plt/ax/_style/_set_supxyt.py +3 -3
  414. scitex/plt/ax/_style/_set_xyt.py +3 -3
  415. scitex/plt/ax/_style/_share_axes.py +2 -2
  416. scitex/plt/color/__init__.py +4 -4
  417. scitex/plt/color/{_get_colors_from_cmap.py → _get_colors_from_conf_matap.py} +7 -7
  418. scitex/plt/utils/_configure_mpl.py +99 -86
  419. scitex/plt/utils/_histogram_utils.py +1 -3
  420. scitex/plt/utils/_is_valid_axis.py +1 -3
  421. scitex/plt/utils/_scitex_config.py +1 -0
  422. scitex/repro/__init__.py +75 -0
  423. scitex/{reproduce → repro}/_gen_ID.py +1 -1
  424. scitex/{reproduce → repro}/_gen_timestamp.py +1 -1
  425. scitex/repro_rng/_RandomStateManager.py +590 -0
  426. scitex/repro_rng/_RandomStateManager_v01-no-verbose-options.py +414 -0
  427. scitex/repro_rng/__init__.py +39 -0
  428. scitex/reproduce/__init__.py +25 -13
  429. scitex/reproduce/_hash_array.py +22 -0
  430. scitex/resource/_get_processor_usages.py +4 -4
  431. scitex/resource/_get_specs.py +2 -2
  432. scitex/resource/_log_processor_usages.py +2 -2
  433. scitex/rng/_RandomStateManager.py +590 -0
  434. scitex/rng/_RandomStateManager_v01-no-verbose-options.py +414 -0
  435. scitex/rng/__init__.py +39 -0
  436. scitex/scholar/__init__.py +309 -19
  437. scitex/scholar/__main__.py +319 -0
  438. scitex/scholar/auth/ScholarAuthManager.py +308 -0
  439. scitex/scholar/auth/__init__.py +12 -0
  440. scitex/scholar/auth/core/AuthenticationGateway.py +473 -0
  441. scitex/scholar/auth/core/BrowserAuthenticator.py +386 -0
  442. scitex/scholar/auth/core/StrategyResolver.py +309 -0
  443. scitex/scholar/auth/core/__init__.py +16 -0
  444. scitex/scholar/auth/gateway/_OpenURLLinkFinder.py +120 -0
  445. scitex/scholar/auth/gateway/_OpenURLResolver.py +209 -0
  446. scitex/scholar/auth/gateway/__init__.py +38 -0
  447. scitex/scholar/auth/gateway/_resolve_functions.py +101 -0
  448. scitex/scholar/auth/providers/BaseAuthenticator.py +166 -0
  449. scitex/scholar/auth/providers/EZProxyAuthenticator.py +484 -0
  450. scitex/scholar/auth/providers/OpenAthensAuthenticator.py +619 -0
  451. scitex/scholar/auth/providers/ShibbolethAuthenticator.py +686 -0
  452. scitex/scholar/auth/providers/__init__.py +18 -0
  453. scitex/scholar/auth/session/AuthCacheManager.py +189 -0
  454. scitex/scholar/auth/session/SessionManager.py +159 -0
  455. scitex/scholar/auth/session/__init__.py +11 -0
  456. scitex/scholar/auth/sso/BaseSSOAutomator.py +373 -0
  457. scitex/scholar/auth/sso/OpenAthensSSOAutomator.py +378 -0
  458. scitex/scholar/auth/sso/SSOAutomator.py +180 -0
  459. scitex/scholar/auth/sso/UniversityOfMelbourneSSOAutomator.py +380 -0
  460. scitex/scholar/auth/sso/__init__.py +15 -0
  461. scitex/scholar/browser/ScholarBrowserManager.py +705 -0
  462. scitex/scholar/browser/__init__.py +38 -0
  463. scitex/scholar/browser/utils/__init__.py +13 -0
  464. scitex/scholar/browser/utils/click_and_wait.py +205 -0
  465. scitex/scholar/browser/utils/close_unwanted_pages.py +140 -0
  466. scitex/scholar/browser/utils/wait_redirects.py +732 -0
  467. scitex/scholar/config/PublisherRules.py +132 -0
  468. scitex/scholar/config/ScholarConfig.py +126 -0
  469. scitex/scholar/config/__init__.py +17 -0
  470. scitex/scholar/core/Paper.py +627 -0
  471. scitex/scholar/core/Papers.py +722 -0
  472. scitex/scholar/core/Scholar.py +1975 -0
  473. scitex/scholar/core/__init__.py +9 -0
  474. scitex/scholar/impact_factor/ImpactFactorEngine.py +204 -0
  475. scitex/scholar/impact_factor/__init__.py +20 -0
  476. scitex/scholar/impact_factor/estimation/ImpactFactorEstimationEngine.py +0 -0
  477. scitex/scholar/impact_factor/estimation/__init__.py +40 -0
  478. scitex/scholar/impact_factor/estimation/build_database.py +0 -0
  479. scitex/scholar/impact_factor/estimation/core/__init__.py +28 -0
  480. scitex/scholar/impact_factor/estimation/core/cache_manager.py +523 -0
  481. scitex/scholar/impact_factor/estimation/core/calculator.py +355 -0
  482. scitex/scholar/impact_factor/estimation/core/journal_matcher.py +428 -0
  483. scitex/scholar/integration/__init__.py +59 -0
  484. scitex/scholar/integration/base.py +502 -0
  485. scitex/scholar/integration/mendeley/__init__.py +22 -0
  486. scitex/scholar/integration/mendeley/exporter.py +166 -0
  487. scitex/scholar/integration/mendeley/importer.py +236 -0
  488. scitex/scholar/integration/mendeley/linker.py +79 -0
  489. scitex/scholar/integration/mendeley/mapper.py +212 -0
  490. scitex/scholar/integration/zotero/__init__.py +27 -0
  491. scitex/scholar/integration/zotero/__main__.py +264 -0
  492. scitex/scholar/integration/zotero/exporter.py +351 -0
  493. scitex/scholar/integration/zotero/importer.py +372 -0
  494. scitex/scholar/integration/zotero/linker.py +415 -0
  495. scitex/scholar/integration/zotero/mapper.py +286 -0
  496. scitex/scholar/metadata_engines/ScholarEngine.py +588 -0
  497. scitex/scholar/metadata_engines/__init__.py +21 -0
  498. scitex/scholar/metadata_engines/individual/ArXivEngine.py +397 -0
  499. scitex/scholar/metadata_engines/individual/CrossRefEngine.py +274 -0
  500. scitex/scholar/metadata_engines/individual/CrossRefLocalEngine.py +263 -0
  501. scitex/scholar/metadata_engines/individual/OpenAlexEngine.py +350 -0
  502. scitex/scholar/metadata_engines/individual/PubMedEngine.py +329 -0
  503. scitex/scholar/metadata_engines/individual/SemanticScholarEngine.py +438 -0
  504. scitex/scholar/metadata_engines/individual/URLDOIEngine.py +410 -0
  505. scitex/scholar/metadata_engines/individual/_BaseDOIEngine.py +487 -0
  506. scitex/scholar/metadata_engines/individual/__init__.py +7 -0
  507. scitex/scholar/metadata_engines/utils/_PubMedConverter.py +469 -0
  508. scitex/scholar/metadata_engines/utils/_URLDOIExtractor.py +283 -0
  509. scitex/scholar/metadata_engines/utils/__init__.py +30 -0
  510. scitex/scholar/metadata_engines/utils/_metadata2bibtex.py +103 -0
  511. scitex/scholar/metadata_engines/utils/_standardize_metadata.py +376 -0
  512. scitex/scholar/pdf_download/ScholarPDFDownloader.py +579 -0
  513. scitex/scholar/pdf_download/__init__.py +5 -0
  514. scitex/scholar/pdf_download/strategies/__init__.py +38 -0
  515. scitex/scholar/pdf_download/strategies/chrome_pdf_viewer.py +376 -0
  516. scitex/scholar/pdf_download/strategies/direct_download.py +131 -0
  517. scitex/scholar/pdf_download/strategies/manual_download_fallback.py +167 -0
  518. scitex/scholar/pdf_download/strategies/manual_download_utils.py +996 -0
  519. scitex/scholar/pdf_download/strategies/response_body.py +207 -0
  520. scitex/scholar/pipelines/ScholarPipelineBibTeX.py +364 -0
  521. scitex/scholar/pipelines/ScholarPipelineParallel.py +478 -0
  522. scitex/scholar/pipelines/ScholarPipelineSingle.py +767 -0
  523. scitex/scholar/pipelines/__init__.py +49 -0
  524. scitex/scholar/storage/BibTeXHandler.py +1018 -0
  525. scitex/scholar/storage/PaperIO.py +468 -0
  526. scitex/scholar/storage/ScholarLibrary.py +182 -0
  527. scitex/scholar/storage/_DeduplicationManager.py +548 -0
  528. scitex/scholar/storage/_LibraryCacheManager.py +724 -0
  529. scitex/scholar/storage/_LibraryManager.py +1835 -0
  530. scitex/scholar/storage/__init__.py +28 -0
  531. scitex/scholar/url_finder/ScholarURLFinder.py +379 -0
  532. scitex/scholar/url_finder/__init__.py +7 -0
  533. scitex/scholar/url_finder/strategies/__init__.py +33 -0
  534. scitex/scholar/url_finder/strategies/find_pdf_urls_by_direct_links.py +261 -0
  535. scitex/scholar/url_finder/strategies/find_pdf_urls_by_dropdown.py +67 -0
  536. scitex/scholar/url_finder/strategies/find_pdf_urls_by_href.py +204 -0
  537. scitex/scholar/url_finder/strategies/find_pdf_urls_by_navigation.py +256 -0
  538. scitex/scholar/url_finder/strategies/find_pdf_urls_by_publisher_patterns.py +165 -0
  539. scitex/scholar/url_finder/strategies/find_pdf_urls_by_zotero_translators.py +163 -0
  540. scitex/scholar/url_finder/strategies/find_supplementary_urls_by_href.py +70 -0
  541. scitex/scholar/utils/__init__.py +22 -0
  542. scitex/scholar/utils/bibtex/__init__.py +9 -0
  543. scitex/scholar/utils/bibtex/_parse_bibtex.py +71 -0
  544. scitex/scholar/utils/cleanup/__init__.py +8 -0
  545. scitex/scholar/utils/cleanup/_cleanup_scholar_processes.py +96 -0
  546. scitex/scholar/utils/cleanup/cleanup_old_extractions.py +117 -0
  547. scitex/scholar/utils/text/_TextNormalizer.py +407 -0
  548. scitex/scholar/utils/text/__init__.py +9 -0
  549. scitex/scholar/zotero/__init__.py +38 -0
  550. scitex/session/__init__.py +51 -0
  551. scitex/session/_lifecycle.py +736 -0
  552. scitex/session/_manager.py +102 -0
  553. scitex/session/template.py +122 -0
  554. scitex/stats/__init__.py +30 -26
  555. scitex/stats/correct/__init__.py +21 -0
  556. scitex/stats/correct/_correct_bonferroni.py +551 -0
  557. scitex/stats/correct/_correct_fdr.py +634 -0
  558. scitex/stats/correct/_correct_holm.py +548 -0
  559. scitex/stats/correct/_correct_sidak.py +499 -0
  560. scitex/stats/descriptive/__init__.py +85 -0
  561. scitex/stats/descriptive/_circular.py +540 -0
  562. scitex/stats/descriptive/_describe.py +219 -0
  563. scitex/stats/descriptive/_nan.py +518 -0
  564. scitex/stats/descriptive/_real.py +189 -0
  565. scitex/stats/effect_sizes/__init__.py +41 -0
  566. scitex/stats/effect_sizes/_cliffs_delta.py +325 -0
  567. scitex/stats/effect_sizes/_cohens_d.py +342 -0
  568. scitex/stats/effect_sizes/_epsilon_squared.py +315 -0
  569. scitex/stats/effect_sizes/_eta_squared.py +302 -0
  570. scitex/stats/effect_sizes/_prob_superiority.py +296 -0
  571. scitex/stats/posthoc/__init__.py +19 -0
  572. scitex/stats/posthoc/_dunnett.py +463 -0
  573. scitex/stats/posthoc/_games_howell.py +383 -0
  574. scitex/stats/posthoc/_tukey_hsd.py +367 -0
  575. scitex/stats/power/__init__.py +19 -0
  576. scitex/stats/power/_power.py +433 -0
  577. scitex/stats/template.py +119 -0
  578. scitex/stats/utils/__init__.py +62 -0
  579. scitex/stats/utils/_effect_size.py +985 -0
  580. scitex/stats/utils/_formatters.py +270 -0
  581. scitex/stats/utils/_normalizers.py +927 -0
  582. scitex/stats/utils/_power.py +433 -0
  583. scitex/stats_v01/_EffectSizeCalculator.py +488 -0
  584. scitex/stats_v01/_StatisticalValidator.py +411 -0
  585. scitex/stats_v01/__init__.py +60 -0
  586. scitex/stats_v01/_additional_tests.py +415 -0
  587. scitex/{stats → stats_v01}/_p2stars.py +19 -5
  588. scitex/stats_v01/_two_sample_tests.py +141 -0
  589. scitex/stats_v01/desc/__init__.py +83 -0
  590. scitex/stats_v01/desc/_circular.py +540 -0
  591. scitex/stats_v01/desc/_describe.py +219 -0
  592. scitex/stats_v01/desc/_nan.py +518 -0
  593. scitex/{stats/desc/_nan.py → stats_v01/desc/_nan_v01-20250920_145731.py} +23 -12
  594. scitex/stats_v01/desc/_real.py +189 -0
  595. scitex/stats_v01/tests/__corr_test_optimized.py +221 -0
  596. scitex/stats_v01/tests/_corr_test_optimized.py +179 -0
  597. scitex/str/__init__.py +1 -3
  598. scitex/str/_clean_path.py +6 -2
  599. scitex/str/_latex_fallback.py +267 -160
  600. scitex/str/_parse.py +44 -36
  601. scitex/str/_printc.py +1 -3
  602. scitex/template/__init__.py +87 -0
  603. scitex/template/_create_project.py +267 -0
  604. scitex/template/create_pip_project.py +80 -0
  605. scitex/template/create_research.py +80 -0
  606. scitex/template/create_singularity.py +80 -0
  607. scitex/units.py +291 -0
  608. scitex/utils/_compress_hdf5.py +14 -3
  609. scitex/utils/_email.py +21 -2
  610. scitex/utils/_grid.py +6 -4
  611. scitex/utils/_notify.py +13 -10
  612. scitex/utils/_verify_scitex_format.py +589 -0
  613. scitex/utils/_verify_scitex_format_v01.py +370 -0
  614. scitex/utils/template.py +122 -0
  615. scitex/web/_search_pubmed.py +62 -16
  616. scitex-2.1.0.dist-info/LICENSE +21 -0
  617. scitex-2.1.0.dist-info/METADATA +677 -0
  618. scitex-2.1.0.dist-info/RECORD +919 -0
  619. {scitex-2.0.0.dist-info → scitex-2.1.0.dist-info}/WHEEL +1 -1
  620. scitex-2.1.0.dist-info/entry_points.txt +3 -0
  621. scitex/ai/__Classifiers.py +0 -101
  622. scitex/ai/classification/classification_reporter.py +0 -1137
  623. scitex/ai/classification/classifiers.py +0 -101
  624. scitex/ai/classification_reporter.py +0 -1161
  625. scitex/ai/genai/__init__.py +0 -277
  626. scitex/ai/genai/anthropic_provider.py +0 -320
  627. scitex/ai/genai/anthropic_refactored.py +0 -109
  628. scitex/ai/genai/auth_manager.py +0 -200
  629. scitex/ai/genai/base_provider.py +0 -291
  630. scitex/ai/genai/chat_history.py +0 -307
  631. scitex/ai/genai/cost_tracker.py +0 -276
  632. scitex/ai/genai/deepseek_provider.py +0 -251
  633. scitex/ai/genai/google_provider.py +0 -228
  634. scitex/ai/genai/groq_provider.py +0 -248
  635. scitex/ai/genai/image_processor.py +0 -250
  636. scitex/ai/genai/llama_provider.py +0 -214
  637. scitex/ai/genai/mock_provider.py +0 -127
  638. scitex/ai/genai/model_registry.py +0 -304
  639. scitex/ai/genai/openai_provider.py +0 -293
  640. scitex/ai/genai/perplexity_provider.py +0 -205
  641. scitex/ai/genai/provider_base.py +0 -302
  642. scitex/ai/genai/provider_factory.py +0 -370
  643. scitex/ai/genai/response_handler.py +0 -235
  644. scitex/ai/layer/_Pass.py +0 -21
  645. scitex/ai/layer/__init__.py +0 -10
  646. scitex/ai/layer/_switch.py +0 -8
  647. scitex/ai/metrics/_bACC.py +0 -51
  648. scitex/ai/plt/_learning_curve.py +0 -194
  649. scitex/ai/plt/_optuna_study.py +0 -111
  650. scitex/ai/plt/aucs/__init__.py +0 -2
  651. scitex/ai/plt/aucs/example.py +0 -60
  652. scitex/ai/plt/aucs/pre_rec_auc.py +0 -223
  653. scitex/ai/plt/aucs/roc_auc.py +0 -246
  654. scitex/ai/sampling/undersample.py +0 -29
  655. scitex/db/_SQLite3.py +0 -2136
  656. scitex/db/_SQLite3Mixins/_BlobMixin.py +0 -229
  657. scitex/gen/_close.py +0 -222
  658. scitex/gen/_start.py +0 -451
  659. scitex/general/__init__.py +0 -5
  660. scitex/io/_load_modules/_db.py +0 -24
  661. scitex/life/__init__.py +0 -10
  662. scitex/life/_monitor_rain.py +0 -49
  663. scitex/reproduce/_fix_seeds.py +0 -45
  664. scitex/res/__init__.py +0 -5
  665. scitex/scholar/_local_search.py +0 -454
  666. scitex/scholar/_paper.py +0 -244
  667. scitex/scholar/_pdf_downloader.py +0 -325
  668. scitex/scholar/_search.py +0 -393
  669. scitex/scholar/_vector_search.py +0 -370
  670. scitex/scholar/_web_sources.py +0 -457
  671. scitex/stats/desc/__init__.py +0 -40
  672. scitex-2.0.0.dist-info/METADATA +0 -307
  673. scitex-2.0.0.dist-info/RECORD +0 -572
  674. scitex-2.0.0.dist-info/licenses/LICENSE +0 -7
  675. /scitex/ai/{act → activation}/__init__.py +0 -0
  676. /scitex/ai/{act → activation}/_define.py +0 -0
  677. /scitex/ai/{early_stopping.py → training/_EarlyStopping.py} +0 -0
  678. /scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_ImportExportMixin.py +0 -0
  679. /scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_IndexMixin.py +0 -0
  680. /scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_RowMixin.py +0 -0
  681. /scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/_TableMixin.py +0 -0
  682. /scitex/db/{_PostgreSQLMixins → _postgresql/_PostgreSQLMixins}/__init__.py +0 -0
  683. /scitex/{stats → stats_v01}/_calc_partial_corr.py +0 -0
  684. /scitex/{stats → stats_v01}/_corr_test_multi.py +0 -0
  685. /scitex/{stats → stats_v01}/_corr_test_wrapper.py +0 -0
  686. /scitex/{stats → stats_v01}/_describe_wrapper.py +0 -0
  687. /scitex/{stats → stats_v01}/_multiple_corrections.py +0 -0
  688. /scitex/{stats → stats_v01}/_nan_stats.py +0 -0
  689. /scitex/{stats → stats_v01}/_p2stars_wrapper.py +0 -0
  690. /scitex/{stats → stats_v01}/_statistical_tests.py +0 -0
  691. /scitex/{stats/desc/_describe.py → stats_v01/desc/_describe_v01-20250920_145731.py} +0 -0
  692. /scitex/{stats/desc/_real.py → stats_v01/desc/_real_v01-20250920_145731.py} +0 -0
  693. /scitex/{stats → stats_v01}/multiple/__init__.py +0 -0
  694. /scitex/{stats → stats_v01}/multiple/_bonferroni_correction.py +0 -0
  695. /scitex/{stats → stats_v01}/multiple/_fdr_correction.py +0 -0
  696. /scitex/{stats → stats_v01}/multiple/_multicompair.py +0 -0
  697. /scitex/{stats → stats_v01}/tests/__corr_test.py +0 -0
  698. /scitex/{stats → stats_v01}/tests/__corr_test_multi.py +0 -0
  699. /scitex/{stats → stats_v01}/tests/__corr_test_single.py +0 -0
  700. /scitex/{stats → stats_v01}/tests/__init__.py +0 -0
  701. /scitex/{stats → stats_v01}/tests/_brunner_munzel_test.py +0 -0
  702. /scitex/{stats → stats_v01}/tests/_nocorrelation_test.py +0 -0
  703. /scitex/{stats → stats_v01}/tests/_smirnov_grubbs.py +0 -0
  704. {scitex-2.0.0.dist-info → scitex-2.1.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,1975 @@
1
+ #!/usr/bin/env python3
2
+ # -*- coding: utf-8 -*-
3
+ # Timestamp: "2025-10-13 08:11:40 (ywatanabe)"
4
+ # File: /home/ywatanabe/proj/scitex_repo/src/scitex/scholar/core/Scholar.py
5
+ # ----------------------------------------
6
+ from __future__ import annotations
7
+ import os
8
+ __FILE__ = (
9
+ "./src/scitex/scholar/core/Scholar.py"
10
+ )
11
+ __DIR__ = os.path.dirname(__FILE__)
12
+ # ----------------------------------------
13
+
14
+ __FILE__ = __file__
15
+
16
+ """
17
+ Unified Scholar class for scientific literature management.
18
+
19
+ This is the main entry point for all scholar functionality, providing:
20
+ - Simple, intuitive API
21
+ - Smart defaults
22
+ - Method chaining
23
+ - Progressive disclosure of advanced features
24
+ """
25
+
26
+ import json
27
+ from datetime import datetime
28
+ from pathlib import Path
29
+ from typing import Any
30
+ from typing import Dict
31
+ from typing import List
32
+ from typing import Optional
33
+ from typing import Union
34
+ from copy import deepcopy
35
+ from scitex import logging
36
+ import shutil
37
+
38
+ # PDF extraction is now handled by scitex.io
39
+ from scitex.errors import ScholarError
40
+ from scitex.scholar.config import ScholarConfig
41
+
42
+ # Updated imports for current architecture
43
+ from scitex.scholar.auth import ScholarAuthManager
44
+ from scitex.browser.debugging import browser_logger
45
+ from scitex.scholar.browser import ScholarBrowserManager
46
+ from scitex.scholar.storage import LibraryManager
47
+ from scitex.scholar.storage import ScholarLibrary
48
+ from scitex.scholar.metadata_engines.ScholarEngine import ScholarEngine
49
+ from scitex.scholar.pdf_download.ScholarPDFDownloader import (
50
+ ScholarPDFDownloader,
51
+ )
52
+ from scitex.scholar.auth.core.AuthenticationGateway import (
53
+ AuthenticationGateway,
54
+ )
55
+ from scitex.scholar.url_finder.ScholarURLFinder import ScholarURLFinder
56
+
57
+ import asyncio
58
+ import nest_asyncio
59
+ from scitex.scholar.impact_factor.ImpactFactorEngine import ImpactFactorEngine
60
+
61
+ from .Papers import Papers
62
+
63
+ logger = logging.getLogger(__name__)
64
+
65
+
66
+ class Scholar:
67
+ """
68
+ Main interface for SciTeX Scholar - scientific literature management made simple.
69
+
70
+ By default, papers are automatically enriched with:
71
+ - Journal impact factors from impact_factor package (2024 JCR data)
72
+ - Citation counts from Semantic Scholar (via DOI/title matching)
73
+
74
+ Example usage:
75
+ # Basic search with automatic enrichment
76
+ scholar = Scholar()
77
+ papers = scholar.search("deep learning neuroscience")
78
+ # Papers now have impact_factor and citation_count populated
79
+ papers.save("my_pac.bib")
80
+
81
+ # Disable automatic enrichment if needed
82
+ config = ScholarConfig(enable_auto_enrich=False)
83
+ scholar = Scholar(config=config)
84
+
85
+ # Search specific source
86
+ papers = scholar.search("transformer models", sources='arxiv')
87
+
88
+ # Advanced workflow
89
+ papers = scholar.search("transformer models", year_min=2020) \\
90
+ .filter(min_citations=50) \\
91
+ .sort_by("impact_factor") \\
92
+ .save("transformers.bib")
93
+
94
+ # Local library
95
+ scholar._index_local_pdfs("./my_papers")
96
+ local_papers = scholar.search_local("attention mechanism")
97
+ """
98
+
99
+ @property
100
+ def name(self):
101
+ """Class name for logging."""
102
+ return self.__class__.__name__
103
+
104
+ def __init__(
105
+ self,
106
+ config: Optional[Union[ScholarConfig, str, Path]] = None,
107
+ project: Optional[str] = None,
108
+ project_description: Optional[str] = None,
109
+ browser_mode: Optional[str] = None,
110
+ ):
111
+ """
112
+ Initialize Scholar with configuration.
113
+
114
+ Args:
115
+ config: Can be:
116
+ - ScholarConfig instance
117
+ - Path to YAML config file (str or Path)
118
+ - None (uses ScholarConfig.load() to find config)
119
+ project: Default project name for operations
120
+ project_description: Optional description for the project
121
+ browser_mode: Browser mode ('stealth', 'interactive', 'manual')
122
+ """
123
+
124
+ self.config = self._init_config(config)
125
+
126
+ # Store browser mode for later use
127
+ self.browser_mode = browser_mode or "stealth"
128
+
129
+ # Set project and workspace
130
+ self.project = self.config.resolve("project", project, "default")
131
+ self.workspace_dir = self.config.path_manager.get_workspace_dir()
132
+
133
+ # Auto-create project directory if it doesn't exist
134
+ if project:
135
+ self._ensure_project_exists(project, project_description)
136
+
137
+ # Initialize service components (lazy loading for better performance)
138
+ # Use mangled names for private properties
139
+ self._Scholar__scholar_engine = (
140
+ None # Replaces DOIResolver and LibraryEnricher
141
+ )
142
+ self._Scholar__auth_manager = None
143
+ self._Scholar__browser_manager = None
144
+ self._Scholar__library_manager = None
145
+ self._Scholar__library = (
146
+ None # ScholarLibrary for high-level operations
147
+ )
148
+
149
+ # Show user-friendly initialization message with library location
150
+ library_path = self.config.get_library_project_dir()
151
+ if project:
152
+ project_path = library_path / project
153
+ logger.info(
154
+ f"Scholar initialized with project '{project}' at {project_path}"
155
+ )
156
+ else:
157
+ logger.info(
158
+ f"{self.name}: Scholar initialized (library: {library_path})"
159
+ )
160
+
161
+ # ----------------------------------------
162
+ # Enrichers
163
+ # ----------------------------------------
164
+ async def enrich_papers_async(self, papers: Papers) -> Papers:
165
+ """Async version of enrich_papers for use in async contexts.
166
+
167
+ Args:
168
+ papers: Papers collection to enrich.
169
+
170
+ Returns:
171
+ Enriched Papers collection
172
+ """
173
+ enriched_list = []
174
+
175
+ for paper in papers:
176
+ try:
177
+ # Use ScholarEngine to search and enrich
178
+ results = await self._scholar_engine.search_async(
179
+ title=paper.metadata.basic.title,
180
+ year=paper.metadata.basic.year,
181
+ authors=(
182
+ paper.metadata.basic.authors[0]
183
+ if paper.metadata.basic.authors
184
+ else None
185
+ ),
186
+ )
187
+
188
+ # Create a copy to avoid modifying original
189
+ enriched_paper = self._merge_enrichment_data(paper, results)
190
+ enriched_list.append(enriched_paper)
191
+ title = paper.metadata.basic.title or "No title"
192
+ logger.info(f"{self.name}: Enriched: {title[:50]}...")
193
+
194
+ except Exception as e:
195
+ title = paper.metadata.basic.title or "No title"
196
+ logger.warning(
197
+ f"{self.name}: Failed to enrich paper '{title[:50]}...': {e}"
198
+ )
199
+ enriched_list.append(
200
+ paper
201
+ ) # Keep original if enrichment fails
202
+
203
+ enriched_papers = Papers(enriched_list, project=self.project)
204
+
205
+ # Add impact factors as post-processing step
206
+ if self.config.resolve("enrich_impact_factors", None, True):
207
+ enriched_papers = self._enrich_impact_factors(enriched_papers)
208
+
209
+ return enriched_papers
210
+
211
+ def enrich_papers(
212
+ self, papers: Optional[Papers] = None
213
+ ) -> Union[Papers, Dict[str, int]]:
214
+ """Enrich papers with metadata from multiple sources.
215
+
216
+ Args:
217
+ papers: Papers collection to enrich. If None, enriches all papers in current project.
218
+
219
+ Returns:
220
+ - If papers provided: Returns enriched Papers collection
221
+ - If no papers: Returns dict with enrichment statistics for project
222
+ """
223
+
224
+ # If no papers provided, enrich entire project
225
+ if papers is None:
226
+ return self._enrich_current_project()
227
+
228
+ # Enrich the provided papers collection
229
+ enriched_list = []
230
+
231
+ nest_asyncio.apply() # Allow nested event loops
232
+
233
+ for paper in papers:
234
+ try:
235
+ # Use ScholarEngine to search and enrich
236
+ results = asyncio.run(
237
+ self._scholar_engine.search_async(
238
+ title=paper.metadata.basic.title,
239
+ year=paper.metadata.basic.year,
240
+ authors=(
241
+ paper.metadata.basic.authors[0]
242
+ if paper.metadata.basic.authors
243
+ else None
244
+ ),
245
+ )
246
+ )
247
+
248
+ # Create a copy to avoid modifying original
249
+ enriched_paper = self._merge_enrichment_data(paper, results)
250
+ enriched_list.append(enriched_paper)
251
+ title = paper.metadata.basic.title or "No title"
252
+ logger.info(f"{self.name}: Enriched: {title[:50]}...")
253
+
254
+ except Exception as e:
255
+ title = paper.metadata.basic.title or "No title"
256
+ logger.warning(
257
+ f"{self.name}: Failed to enrich paper '{title[:50]}...': {e}"
258
+ )
259
+ enriched_list.append(
260
+ paper
261
+ ) # Keep original if enrichment fails
262
+
263
+ enriched_papers = Papers(enriched_list, project=self.project)
264
+
265
+ # Add impact factors as post-processing step
266
+ if self.config.resolve("enrich_impact_factors", None, True):
267
+ enriched_papers = self._enrich_impact_factors(enriched_papers)
268
+
269
+ return enriched_papers
270
+
271
+ def _enrich_impact_factors(self, papers: "Papers") -> "Papers":
272
+ """Add journal impact factors to papers.
273
+
274
+ Args:
275
+ papers: Papers collection to enrich with impact factors
276
+
277
+ Returns:
278
+ Papers collection with impact factors added where available
279
+ """
280
+ try:
281
+ # Try JCR database first (fast)
282
+ jcr_engine = ImpactFactorEngine()
283
+ papers = jcr_engine.enrich_papers(papers)
284
+ return papers
285
+ except Exception as e:
286
+ logger.debug(
287
+ f"{self.name}: JCR engine unavailable: {e}, falling back to calculation method"
288
+ )
289
+
290
+ return papers
291
+
292
+ def _merge_enrichment_data(self, paper: "Paper", results: Dict) -> "Paper":
293
+ """Merge enrichment results into paper object.
294
+
295
+ Creates a new Paper object with merged data to avoid modifying the original.
296
+ """
297
+ # Import here to avoid circular dependency
298
+
299
+ enriched = deepcopy(paper)
300
+
301
+ # Results from ScholarEngine is already combined metadata, not individual engine results
302
+ if not results:
303
+ return enriched
304
+
305
+ # Extract from the combined metadata structure
306
+ # ID section
307
+ if "id" in results:
308
+ if results["id"].get("doi") and not enriched.metadata.id.doi:
309
+ enriched.metadata.set_doi(results["id"]["doi"])
310
+ if results["id"].get("pmid") and not enriched.metadata.id.pmid:
311
+ enriched.metadata.id.pmid = results["id"]["pmid"]
312
+ if (
313
+ results["id"].get("arxiv_id")
314
+ and not enriched.metadata.id.arxiv_id
315
+ ):
316
+ enriched.metadata.id.arxiv_id = results["id"]["arxiv_id"]
317
+ # Note: corpus_id, semantic_id, ieee_id are in results but not in Paper dataclass
318
+
319
+ # Basic metadata section
320
+ if "basic" in results:
321
+ # Always update abstract if found (key enrichment goal)
322
+ if results["basic"].get("abstract"):
323
+ enriched.metadata.basic.abstract = results["basic"]["abstract"]
324
+
325
+ # Update title if more complete
326
+ if results["basic"].get("title"):
327
+ new_title = results["basic"]["title"]
328
+ current_title = enriched.metadata.basic.title or ""
329
+ if not current_title or len(new_title) > len(current_title):
330
+ enriched.metadata.basic.title = new_title
331
+
332
+ # Update authors if found
333
+ if (
334
+ results["basic"].get("authors")
335
+ and not enriched.metadata.basic.authors
336
+ ):
337
+ enriched.metadata.basic.authors = results["basic"]["authors"]
338
+
339
+ # Update year if found
340
+ if (
341
+ results["basic"].get("year")
342
+ and not enriched.metadata.basic.year
343
+ ):
344
+ enriched.metadata.basic.year = results["basic"]["year"]
345
+
346
+ # Update keywords if found
347
+ if (
348
+ results["basic"].get("keywords")
349
+ and not enriched.metadata.basic.keywords
350
+ ):
351
+ enriched.metadata.basic.keywords = results["basic"]["keywords"]
352
+
353
+ # Publication metadata
354
+ if "publication" in results:
355
+ if (
356
+ results["publication"].get("journal")
357
+ and not enriched.metadata.publication.journal
358
+ ):
359
+ enriched.metadata.publication.journal = results["publication"][
360
+ "journal"
361
+ ]
362
+ if (
363
+ results["publication"].get("publisher")
364
+ and not enriched.metadata.publication.publisher
365
+ ):
366
+ enriched.metadata.publication.publisher = results[
367
+ "publication"
368
+ ]["publisher"]
369
+ if (
370
+ results["publication"].get("volume")
371
+ and not enriched.metadata.publication.volume
372
+ ):
373
+ enriched.metadata.publication.volume = results["publication"][
374
+ "volume"
375
+ ]
376
+ if (
377
+ results["publication"].get("issue")
378
+ and not enriched.metadata.publication.issue
379
+ ):
380
+ enriched.metadata.publication.issue = results["publication"][
381
+ "issue"
382
+ ]
383
+ if (
384
+ results["publication"].get("pages")
385
+ and not enriched.metadata.publication.pages
386
+ ):
387
+ enriched.metadata.publication.pages = results["publication"][
388
+ "pages"
389
+ ]
390
+
391
+ # Citation metadata
392
+ if "citation_count" in results:
393
+ # Try both "count" and "total" fields
394
+ count = results["citation_count"].get("count") or results[
395
+ "citation_count"
396
+ ].get("total")
397
+ if count:
398
+ # Always take the maximum citation count
399
+ current_count = enriched.metadata.citation_count.total or 0
400
+ if not current_count or count > current_count:
401
+ enriched.metadata.citation_count.total = count
402
+ # Note: influential_citation_count is in results but not in Paper dataclass
403
+
404
+ # URL metadata
405
+ if "url" in results:
406
+ if results["url"].get("pdf"):
407
+ # Check if this PDF is not already in the list
408
+ pdf_url = results["url"]["pdf"]
409
+ if not any(
410
+ p.get("url") == pdf_url for p in enriched.metadata.url.pdfs
411
+ ):
412
+ enriched.metadata.url.pdfs.append(
413
+ {"url": pdf_url, "source": "enrichment"}
414
+ )
415
+ if (
416
+ results["url"].get("url")
417
+ and not enriched.metadata.url.publisher
418
+ ):
419
+ enriched.metadata.url.publisher = results["url"]["url"]
420
+
421
+ # Note: Metrics section (journal_impact_factor, h_index) not stored in Paper dataclass
422
+
423
+ return enriched
424
+
425
+ def _enrich_current_project(self) -> Dict[str, int]:
426
+ """Enrich all papers in the current project.
427
+
428
+ Returns:
429
+ Dictionary with enrichment statistics
430
+ """
431
+ if not self.project:
432
+ raise ValueError(
433
+ "No project specified. Use Scholar(project='name') or provide papers to enrich()."
434
+ )
435
+
436
+ # Load papers from project library
437
+ papers = self.load_project(self.project)
438
+ logger.info(
439
+ f"{self.name}: Enriching {len(papers)} papers in project '{self.project}'"
440
+ )
441
+
442
+ # Enrich the papers
443
+ enriched_papers = self.enrich_papers(papers)
444
+
445
+ # Count successes
446
+ enriched_count = sum(
447
+ 1
448
+ for i, p in enumerate(enriched_papers)
449
+ if p.abstract
450
+ and not papers[i].abstract # Check if abstract was added
451
+ )
452
+
453
+ # Save enriched papers back to library
454
+ saved_ids = self.save_papers_to_library(enriched_papers)
455
+
456
+ return {
457
+ "enriched": enriched_count,
458
+ "failed": len(papers) - enriched_count,
459
+ "total": len(papers),
460
+ "saved": len(saved_ids),
461
+ }
462
+
463
+ # ----------------------------------------
464
+ # URL Finding (Orchestration)
465
+ # ----------------------------------------
466
+ async def _find_urls_for_doi_async(
467
+ self, doi: str, context
468
+ ) -> Dict[str, Any]:
469
+ """Find all URLs for a DOI (orchestration layer).
470
+
471
+ Workflow:
472
+ DOI → Publisher URL → PDF URLs → OpenURL (fallback)
473
+
474
+ Args:
475
+ doi: DOI string
476
+ context: Authenticated browser context
477
+
478
+ Returns:
479
+ Dictionary with URL information: {
480
+ "url_doi": "https://doi.org/...",
481
+ "url_publisher": "https://publisher.com/...",
482
+ "urls_pdf": [{"url": "...", "source": "zotero_translator"}],
483
+ "url_openurl_resolved": "..." (if fallback used)
484
+ }
485
+ """
486
+ from scitex.scholar.auth.gateway import (
487
+ normalize_doi_as_http,
488
+ resolve_publisher_url_by_navigating_to_doi_page,
489
+ OpenURLResolver,
490
+ )
491
+
492
+ # Initialize result
493
+ urls = {"url_doi": normalize_doi_as_http(doi)}
494
+
495
+ # Step 1: Resolve publisher URL
496
+ page = await context.new_page()
497
+ try:
498
+ url_publisher = (
499
+ await resolve_publisher_url_by_navigating_to_doi_page(
500
+ doi, page
501
+ )
502
+ )
503
+ urls["url_publisher"] = url_publisher
504
+ finally:
505
+ await page.close()
506
+
507
+ # Step 2: Find PDF URLs from publisher URL
508
+ url_finder = ScholarURLFinder(context, config=self.config)
509
+ urls_pdf = []
510
+
511
+ if url_publisher:
512
+ urls_pdf = await url_finder.find_pdf_urls(url_publisher)
513
+
514
+ # Step 3: Try OpenURL fallback if no PDFs found
515
+ if not urls_pdf:
516
+ openurl_resolver = OpenURLResolver(config=self.config)
517
+ page = await context.new_page()
518
+ try:
519
+ url_openurl_resolved = await openurl_resolver.resolve_doi(
520
+ doi, page
521
+ )
522
+ urls["url_openurl_resolved"] = url_openurl_resolved
523
+
524
+ if url_openurl_resolved and url_openurl_resolved != "skipped":
525
+ urls_pdf = await url_finder.find_pdf_urls(
526
+ url_openurl_resolved
527
+ )
528
+ finally:
529
+ await page.close()
530
+
531
+ # Deduplicate and store
532
+ urls["urls_pdf"] = (
533
+ self._deduplicate_pdf_urls(urls_pdf) if urls_pdf else []
534
+ )
535
+
536
+ return urls
537
+
538
+ def _deduplicate_pdf_urls(self, urls_pdf: List[Dict]) -> List[Dict]:
539
+ """Remove duplicate PDF URLs.
540
+
541
+ Args:
542
+ urls_pdf: List of PDF URL dicts
543
+
544
+ Returns:
545
+ Deduplicated list of PDF URL dicts
546
+ """
547
+ seen = set()
548
+ unique = []
549
+ for pdf in urls_pdf:
550
+ url = pdf.get("url") if isinstance(pdf, dict) else pdf
551
+ if url not in seen:
552
+ seen.add(url)
553
+ unique.append(pdf)
554
+ return unique
555
+
556
+ # ----------------------------------------
557
+ # PDF Downloaders
558
+ # ----------------------------------------
559
+ async def download_pdfs_from_dois_async(
560
+ self,
561
+ dois: List[str],
562
+ output_dir: Optional[Path] = None,
563
+ max_concurrent: int = 1,
564
+ ) -> Dict[str, int]:
565
+ """Download PDFs for given DOIs using ScholarPDFDownloader.
566
+
567
+ Args:
568
+ dois: List of DOI strings
569
+ output_dir: Output directory (not used - downloads to library MASTER)
570
+ max_concurrent: Maximum concurrent downloads (default: 1 for sequential)
571
+
572
+ Returns:
573
+ Dictionary with download statistics
574
+ """
575
+ if not dois:
576
+ return {"downloaded": 0, "failed": 0, "errors": 0}
577
+
578
+ # Get authenticated browser context
579
+ browser, context = (
580
+ await self._browser_manager.get_authenticated_browser_and_context_async()
581
+ )
582
+
583
+ try:
584
+ # Initialize PDF downloader with browser context
585
+ pdf_downloader = ScholarPDFDownloader(
586
+ context=context,
587
+ config=self.config,
588
+ )
589
+
590
+ # Use download_from_dois from ScholarPDFDownloader
591
+ # This handles parallel downloads with semaphore control
592
+ logger.info(
593
+ f"{self.name}: Starting PDF download for {len(dois)} DOIs (max_concurrent={max_concurrent})"
594
+ )
595
+
596
+ results = await pdf_downloader.download_from_dois(
597
+ dois=dois,
598
+ output_dir=str(output_dir) if output_dir else "/tmp/",
599
+ max_concurrent=max_concurrent,
600
+ )
601
+
602
+ # Process results and organize in library
603
+ stats = {"downloaded": 0, "failed": 0, "errors": 0}
604
+ library_dir = self.config.get_library_project_dir()
605
+ master_dir = library_dir / "MASTER"
606
+ master_dir.mkdir(parents=True, exist_ok=True)
607
+
608
+ for doi, downloaded_paths in zip(dois, results):
609
+ try:
610
+ if downloaded_paths and len(downloaded_paths) > 0:
611
+ # PDF was downloaded successfully
612
+ # Take the first downloaded PDF (if multiple)
613
+ temp_pdf_path = downloaded_paths[0]
614
+
615
+ # Generate paper ID and create storage
616
+ paper_id = self.config.path_manager._generate_paper_id(
617
+ doi=doi
618
+ )
619
+ storage_path = master_dir / paper_id
620
+ storage_path.mkdir(parents=True, exist_ok=True)
621
+
622
+ # Move PDF to MASTER library
623
+ pdf_filename = f"DOI_{doi.replace('/', '_').replace(':', '_')}.pdf"
624
+ master_pdf_path = storage_path / pdf_filename
625
+ shutil.move(str(temp_pdf_path), str(master_pdf_path))
626
+
627
+ # Create/update metadata
628
+ metadata_file = storage_path / "metadata.json"
629
+ if metadata_file.exists():
630
+ with open(metadata_file, "r") as f:
631
+ metadata = json.load(f)
632
+ else:
633
+ metadata = {
634
+ "doi": doi,
635
+ "scitex_id": paper_id,
636
+ "created_at": datetime.now().isoformat(),
637
+ "created_by": "SciTeX Scholar",
638
+ }
639
+
640
+ # Update metadata with PDF info
641
+ metadata["pdf_path"] = str(
642
+ master_pdf_path.relative_to(library_dir)
643
+ )
644
+ metadata["pdf_downloaded_at"] = (
645
+ datetime.now().isoformat()
646
+ )
647
+ metadata["pdf_size_bytes"] = (
648
+ master_pdf_path.stat().st_size
649
+ )
650
+ metadata["updated_at"] = datetime.now().isoformat()
651
+
652
+ with open(metadata_file, "w") as f:
653
+ json.dump(
654
+ metadata, f, indent=2, ensure_ascii=False
655
+ )
656
+
657
+ # Update symlink using LibraryManager
658
+ if self.project not in ["master", "MASTER"]:
659
+ self._library_manager.update_symlink(
660
+ master_storage_path=storage_path,
661
+ project=self.project,
662
+ )
663
+
664
+ logger.success(
665
+ f"{self.name}: Downloaded and organized PDF for {doi}: {master_pdf_path}"
666
+ )
667
+ stats["downloaded"] += 1
668
+ else:
669
+ logger.warning(
670
+ f"{self.name}: No PDF downloaded for DOI: {doi}"
671
+ )
672
+ stats["failed"] += 1
673
+
674
+ except Exception as e:
675
+ logger.error(
676
+ f"{self.name}: Failed to organize PDF for {doi}: {e}"
677
+ )
678
+ stats["errors"] += 1
679
+ stats["failed"] += 1
680
+
681
+ return stats
682
+
683
+ finally:
684
+ # Always close browser
685
+ await self._browser_manager.close()
686
+
687
    async def _download_pdfs_sequential(
        self, dois: List[str], output_dir: Optional[Path] = None
    ) -> Dict[str, int]:
        """Sequential PDF download with authentication gateway.

        For each DOI: prepare publisher authentication, resolve candidate PDF
        URLs, download the first working candidate to a temp file, then file
        it into the MASTER library (copy + metadata.json update + project
        symlink).

        Args:
            dois: DOI strings to process, one at a time.
            output_dir: Not referenced by this implementation — downloads
                always land in the configured library.
                NOTE(review): confirm whether this parameter should be
                honored or removed.

        Returns:
            Counters: ``{"downloaded": int, "failed": int, "errors": int}``.
            A DOI whose processing raises is counted in both "errors" and
            "failed".
        """
        results = {"downloaded": 0, "failed": 0, "errors": 0}

        # Get authenticated browser context (the browser handle itself is
        # unused below; only the context is passed on)
        browser, context = (
            await self._browser_manager.get_authenticated_browser_and_context_async()
        )

        # Initialize authentication gateway (NEW)
        auth_gateway = AuthenticationGateway(
            auth_manager=self._auth_manager,
            browser_manager=self._browser_manager,
            config=self.config,
        )

        # Use simple downloader for sequential downloads
        pdf_downloader = ScholarPDFDownloader(
            context=context,
            config=self.config,
        )

        # Library layout: <library>/MASTER holds canonical paper storage,
        # <library>/<project> holds symlinks into MASTER.
        library_dir = self.config.get_library_project_dir()
        master_dir = library_dir / "MASTER"
        project_dir = library_dir / self.project
        master_dir.mkdir(parents=True, exist_ok=True)
        project_dir.mkdir(parents=True, exist_ok=True)

        for doi in dois:
            try:
                logger.info(f"{self.name}: Processing DOI: {doi}")

                # NEW: Prepare authentication context BEFORE URL finding.
                # Called for its side effect (establishes publisher-specific
                # cookies if needed); the returned value is intentionally
                # unused.
                _url_context = await auth_gateway.prepare_context_async(
                    doi=doi, context=context
                )

                # Step 1: Find URLs for the DOI (orchestration)
                urls = await self._find_urls_for_doi_async(doi, context)

                # Step 2: Get PDF URLs
                pdf_urls = urls.get("urls_pdf", [])

                if not pdf_urls:
                    logger.warning(
                        f"{self.name}: No PDF URLs found for DOI: {doi}"
                    )
                    results["failed"] += 1
                    continue

                # Step 3: Try each candidate URL until one download succeeds
                downloaded_path = None
                for pdf_entry in pdf_urls:
                    # Entries may be {"url": ...} dicts or plain strings
                    pdf_url = (
                        pdf_entry.get("url")
                        if isinstance(pdf_entry, dict)
                        else pdf_entry
                    )

                    if not pdf_url:
                        continue

                    # Download to temp location first.
                    # NOTE(review): hard-coded /tmp — consider tempfile for
                    # portability.
                    temp_output = (
                        Path("/tmp")
                        / f"{doi.replace('/', '_').replace(':', '_')}.pdf"
                    )

                    # Download PDF using simple downloader
                    result = await pdf_downloader.download_from_url(
                        pdf_url=pdf_url, output_path=temp_output
                    )

                    if result and result.exists():
                        downloaded_path = result
                        break

                if downloaded_path:
                    # Step 4: Store PDF in MASTER library with proper organization

                    # Generate unique ID from DOI using PathManager
                    paper_id = self.config.path_manager._generate_paper_id(
                        doi=doi
                    )

                    # Create MASTER storage directory
                    storage_path = master_dir / paper_id
                    storage_path.mkdir(parents=True, exist_ok=True)

                    # Try to get paper metadata to generate a readable
                    # Author-Year-Journal name.
                    # NOTE(review): readable_name is computed below but never
                    # used afterwards — the stored filename is always the
                    # DOI-based pdf_filename. Either use it or drop the
                    # enrichment block.
                    readable_name = None
                    temp_paper = None
                    try:
                        # Try to load paper from DOI to get metadata
                        from scitex.scholar.core.Paper import Paper
                        from scitex.scholar.core.Papers import Papers

                        temp_paper = Paper()
                        temp_paper.metadata.id.doi = doi
                        # Try to enrich to get author/year/journal using async method
                        temp_papers = Papers([temp_paper])
                        enriched = await self.enrich_papers_async(temp_papers)
                        if enriched and len(enriched) > 0:
                            temp_paper = enriched[0]

                        # First author's last name; single-token names used
                        # as-is
                        first_author = "Unknown"
                        authors = temp_paper.metadata.basic.authors
                        if authors and len(authors) > 0:
                            author_parts = authors[0].split()
                            if len(author_parts) > 1:
                                first_author = author_parts[-1]  # Last name
                            else:
                                first_author = author_parts[0]

                        year = temp_paper.metadata.basic.year
                        year_str = str(year) if year else "Unknown"

                        journal_clean = "Unknown"
                        journal = temp_paper.metadata.publication.journal
                        if journal:
                            # Clean journal name - keep alphanumerics, drop
                            # spaces and special chars
                            journal_clean = "".join(
                                c for c in journal if c.isalnum() or c in " "
                            ).replace(" ", "")
                            if not journal_clean:
                                journal_clean = "Unknown"

                        # Format: Author-Year-Journal
                        readable_name = (
                            f"{first_author}-{year_str}-{journal_clean}"
                        )
                    except:
                        # NOTE(review): bare except silently swallows all
                        # enrichment failures (even KeyboardInterrupt); the
                        # DOI-based fallback below is used instead.
                        pass

                    # Fallback to DOI if metadata extraction failed
                    if not readable_name:
                        readable_name = (
                            f"DOI_{doi.replace('/', '_').replace(':', '_')}"
                        )

                    # Copy PDF to MASTER storage with ORIGINAL (DOI-derived)
                    # filename to track how it was downloaded
                    pdf_filename = (
                        f"DOI_{doi.replace('/', '_').replace(':', '_')}.pdf"
                    )
                    master_pdf_path = storage_path / pdf_filename
                    shutil.copy2(downloaded_path, master_pdf_path)

                    # Load existing metadata or create minimal new metadata
                    metadata_file = storage_path / "metadata.json"
                    if metadata_file.exists():
                        # Load existing rich metadata - DO NOT OVERWRITE IT
                        with open(metadata_file, "r") as f:
                            metadata = json.load(f)
                        logger.debug(
                            f"{self.name}: Loaded existing metadata for {paper_id}"
                        )
                    else:
                        # Create new minimal metadata only if none exists
                        metadata = {
                            "doi": doi,
                            "scitex_id": paper_id,
                            "created_at": datetime.now().isoformat(),
                            "created_by": "SciTeX Scholar",
                        }

                        # Merge enriched paper metadata for new papers only,
                        # keeping the doi/scitex_id written above
                        if temp_paper:
                            # Use Pydantic to_dict() for Paper
                            paper_dict = temp_paper.to_dict()
                            for key, value in paper_dict.items():
                                if value is not None and key not in [
                                    "doi",
                                    "scitex_id",
                                ]:
                                    metadata[key] = value

                    # Record PDF location (relative to the library root) and
                    # bookkeeping timestamps
                    metadata["pdf_path"] = str(
                        master_pdf_path.relative_to(library_dir)
                    )
                    metadata["pdf_downloaded_at"] = datetime.now().isoformat()
                    metadata["pdf_size_bytes"] = master_pdf_path.stat().st_size
                    metadata["updated_at"] = datetime.now().isoformat()

                    # Save updated metadata
                    with open(metadata_file, "w") as f:
                        json.dump(metadata, f, indent=2, ensure_ascii=False)

                    # Expose the paper in the current project via symlink
                    # (MASTER itself needs no link)
                    if self.project not in ["master", "MASTER"]:
                        self._library_manager.update_symlink(
                            master_storage_path=storage_path,
                            project=self.project,
                        )

                    # Clean up temp file
                    downloaded_path.unlink()

                    logger.success(
                        f"{self.name}: Downloaded PDF for {doi}: MASTER/{paper_id}/{pdf_filename}"
                    )
                    results["downloaded"] += 1
                else:
                    logger.warning(
                        f"{self.name}: Failed to download any PDF for DOI: {doi}"
                    )
                    results["failed"] += 1

            except Exception as e:
                # Per-DOI failures are logged and counted; the loop continues
                logger.error(f"{self.name}: Failed to process {doi}: {e}")
                results["errors"] += 1
                results["failed"] += 1

        # NOTE(review): unlike the parallel variant (which closes in a
        # finally block), the browser stays open if setup above raises.
        await self._browser_manager.close()
        logger.info(f"{self.name}: PDF download complete: {results}")
        return results
910
+
911
+ def download_pdfs_from_dois(
912
+ self, dois: List[str], output_dir: Optional[Path] = None
913
+ ) -> Dict[str, int]:
914
+ """Download PDFs for given DOIs.
915
+
916
+ Args:
917
+ dois: List of DOI strings
918
+ output_dir: Output directory (uses config default if None)
919
+
920
+ Returns:
921
+ Dictionary with download statistics
922
+ """
923
+ import asyncio
924
+
925
+ return asyncio.run(
926
+ self.download_pdfs_from_dois_async(dois, output_dir)
927
+ )
928
+
929
+ def download_pdfs_from_bibtex(
930
+ self,
931
+ bibtex_input: Union[str, Path, Papers],
932
+ output_dir: Optional[Path] = None,
933
+ ) -> Dict[str, int]:
934
+ """Download PDFs from BibTeX file or Papers collection.
935
+
936
+ Args:
937
+ bibtex_input: BibTeX file path, content string, or Papers collection
938
+ output_dir: Output directory (uses config default if None)
939
+
940
+ Returns:
941
+ Dictionary with download statistics
942
+ """
943
+ # Load papers if bibtex_input is not already Papers
944
+ if isinstance(bibtex_input, Papers):
945
+ papers = bibtex_input
946
+ else:
947
+ papers = self.load_bibtex(bibtex_input)
948
+
949
+ # Extract DOIs from papers
950
+ dois = [
951
+ paper.metadata.id.doi for paper in papers if paper.metadata.id.doi
952
+ ]
953
+
954
+ if not dois:
955
+ logger.warning(
956
+ f"{self.name}: No papers with DOIs found in BibTeX input"
957
+ )
958
+ return {"downloaded": 0, "failed": 0, "errors": 0}
959
+
960
+ logger.info(
961
+ f"{self.name}: Found {len(dois)} papers with DOIs out of {len(papers)} total papers"
962
+ )
963
+
964
+ # Download PDFs using DOI method
965
+ return self.download_pdfs_from_dois(dois, output_dir)
966
+
967
+ # ----------------------------------------
968
+ # Loaders
969
+ # ----------------------------------------
970
+ def load_project(self, project: Optional[str] = None) -> Papers:
971
+ """Load papers from a project using library manager service.
972
+
973
+ Args:
974
+ project: Project name (uses self.project if None)
975
+
976
+ Returns:
977
+ Papers collection from the project
978
+ """
979
+ project_name = project or self.project
980
+ if not project_name:
981
+ raise ValueError("No project specified")
982
+
983
+ # Load papers from library by reading symlinks in project directory
984
+ from ..core.Papers import Papers
985
+ from ..core.Paper import Paper
986
+ import json
987
+
988
+ logger.info(
989
+ f"{self.name}: Loading papers from project: {project_name}"
990
+ )
991
+
992
+ library_dir = self.config.get_library_project_dir()
993
+ project_dir = library_dir / project_name
994
+
995
+ if not project_dir.exists():
996
+ logger.warning(
997
+ f"{self.name}: Project directory does not exist: {project_dir}"
998
+ )
999
+ return Papers([], project=project_name)
1000
+
1001
+ papers = []
1002
+ for item in project_dir.iterdir():
1003
+ # Skip info directory and metadata files
1004
+ if item.name in ["info", "project_metadata.json", "README.md"]:
1005
+ continue
1006
+
1007
+ # Follow symlink to MASTER directory
1008
+ if item.is_symlink():
1009
+ master_path = item.resolve()
1010
+ if master_path.exists():
1011
+ # Load metadata.json from MASTER directory
1012
+ metadata_file = master_path / "metadata.json"
1013
+ if metadata_file.exists():
1014
+ try:
1015
+ with open(metadata_file, "r") as f:
1016
+ metadata = json.load(f)
1017
+
1018
+ # Create Paper object using from_dict class method
1019
+ paper = Paper.from_dict(metadata)
1020
+
1021
+ papers.append(paper)
1022
+ except Exception as e:
1023
+ logger.warning(
1024
+ f"{self.name}: Failed to load metadata from {metadata_file}: {e}"
1025
+ )
1026
+
1027
+ logger.info(
1028
+ f"{self.name}: Loaded {len(papers)} papers from project: {project_name}"
1029
+ )
1030
+ return Papers(papers, project=project_name)
1031
+
1032
+ def load_bibtex(self, bibtex_input: Union[str, Path]) -> Papers:
1033
+ """Load Papers collection from BibTeX file or content.
1034
+
1035
+ Args:
1036
+ bibtex_input: BibTeX file path or content string
1037
+
1038
+ Returns:
1039
+ Papers collection
1040
+ """
1041
+ # Use the internal library to load papers
1042
+ papers = self._library.papers_from_bibtex(bibtex_input)
1043
+
1044
+ # Convert to Papers collection
1045
+ from .Papers import Papers
1046
+
1047
+ papers_collection = Papers(
1048
+ papers, config=self.config, project=self.project
1049
+ )
1050
+ papers_collection.library = (
1051
+ self._library
1052
+ ) # Attach library for save operations
1053
+
1054
+ return papers_collection
1055
+
1056
+ # ----------------------------------------
1057
+ # Searchers
1058
+ # ----------------------------------------
1059
+ def search_library(
1060
+ self, query: str, project: Optional[str] = None
1061
+ ) -> Papers:
1062
+ """
1063
+ Search papers in local library.
1064
+
1065
+ For new literature search (not in library), use AI2 Scholar QA:
1066
+ https://scholarqa.allen.ai/chat/ then process with:
1067
+ papers = scholar.load_bibtex('file.bib') followed by scholar.enrich(papers)
1068
+
1069
+ Args:
1070
+ query: Search query
1071
+ project: Project filter (uses self.project if None)
1072
+
1073
+ Returns:
1074
+ Papers collection matching the query
1075
+ """
1076
+ # For now, return empty Papers until search is implemented
1077
+ from ..core.Papers import Papers
1078
+
1079
+ logger.info(f"{self.name}: Searching library for: {query}")
1080
+ return Papers([], project=project or self.project)
1081
+
1082
+ def search_across_projects(
1083
+ self, query: str, projects: Optional[List[str]] = None
1084
+ ) -> Papers:
1085
+ """Search for papers across multiple projects or the entire library.
1086
+
1087
+ Args:
1088
+ query: Search query
1089
+ projects: List of project names to search (None for all)
1090
+
1091
+ Returns:
1092
+ Papers collection with search results
1093
+ """
1094
+ if projects is None:
1095
+ # Search all projects
1096
+ all_projects = [p["name"] for p in self.list_projects()]
1097
+ else:
1098
+ all_projects = projects
1099
+
1100
+ all_papers = []
1101
+ for project in all_projects:
1102
+ try:
1103
+ project_papers = Papers.from_project(project, self.config)
1104
+ # Simple text search implementation
1105
+ matching_papers = [
1106
+ p
1107
+ for p in project_papers._papers
1108
+ if query.lower() in (p.title or "").lower()
1109
+ or query.lower() in (p.abstract or "").lower()
1110
+ or any(
1111
+ query.lower() in (author or "").lower()
1112
+ for author in (p.authors or [])
1113
+ )
1114
+ ]
1115
+ all_papers.extend(matching_papers)
1116
+ except Exception as e:
1117
+ logger.debug(
1118
+ f"{self.name}: Failed to search project {project}: {e}"
1119
+ )
1120
+
1121
+ return Papers(all_papers, config=self.config, project="search_results")
1122
+
1123
+ # ----------------------------------------
1124
+ # Savers
1125
+ # ----------------------------------------
1126
+ def save_papers_to_library(self, papers: Papers) -> List[str]:
1127
+ """Save papers collection to library.
1128
+
1129
+ Args:
1130
+ papers: Papers collection to save
1131
+
1132
+ Returns:
1133
+ List of paper IDs saved
1134
+ """
1135
+ saved_ids = []
1136
+ for paper in papers:
1137
+ try:
1138
+ paper_id = self._library.save_paper(paper)
1139
+ saved_ids.append(paper_id)
1140
+ except Exception as e:
1141
+ logger.warning(f"{self.name}: Failed to save paper: {e}")
1142
+
1143
+ logger.info(
1144
+ f"{self.name}: Saved {len(saved_ids)}/{len(papers)} papers to library"
1145
+ )
1146
+ return saved_ids
1147
+
1148
+ def save_papers_as_bibtex(
1149
+ self, papers: Papers, output_path: Optional[Union[str, Path]] = None
1150
+ ) -> str:
1151
+ """Save papers to BibTeX format with enrichment metadata.
1152
+
1153
+ Args:
1154
+ papers: Papers collection to save
1155
+ output_path: Optional path to save the BibTeX file
1156
+
1157
+ Returns:
1158
+ BibTeX content as string with enrichment metadata included
1159
+ """
1160
+ from ..storage.BibTeXHandler import BibTeXHandler
1161
+
1162
+ bibtex_handler = BibTeXHandler(
1163
+ project=self.project, config=self.config
1164
+ )
1165
+ return bibtex_handler.papers_to_bibtex(papers, output_path)
1166
+
1167
+ # ----------------------------------------
1168
+ # Project Handlers
1169
+ # ----------------------------------------
1170
+ def _ensure_project_exists(
1171
+ self, project: str, description: Optional[str] = None
1172
+ ) -> Path:
1173
+ """Ensure project directory exists, create if needed (PRIVATE).
1174
+
1175
+ Args:
1176
+ project: Project name
1177
+ description: Optional project description
1178
+
1179
+ Returns:
1180
+ Path to the project directory
1181
+ """
1182
+ project_dir = self.config.get_library_project_dir() / project
1183
+ info_dir = project_dir / "info"
1184
+
1185
+ # Create project and info directories
1186
+ if not project_dir.exists():
1187
+ project_dir.mkdir(parents=True, exist_ok=True)
1188
+ logger.info(
1189
+ f"{self.name}: Auto-created project directory: {project}"
1190
+ )
1191
+
1192
+ # Ensure info directory exists
1193
+ info_dir.mkdir(parents=True, exist_ok=True)
1194
+
1195
+ # Create/move metadata file to info directory
1196
+ old_metadata_file = (
1197
+ project_dir / "project_metadata.json"
1198
+ ) # Old location
1199
+ metadata_file = info_dir / "project_metadata.json" # New location
1200
+
1201
+ # Move existing metadata file if it exists in old location
1202
+ if old_metadata_file.exists() and not metadata_file.exists():
1203
+ shutil.move(str(old_metadata_file), str(metadata_file))
1204
+ logger.info(
1205
+ f"{self.name}: Moved project metadata to info directory"
1206
+ )
1207
+
1208
+ # Create metadata file if it doesn't exist
1209
+ if not metadata_file.exists():
1210
+ metadata = {
1211
+ "name": project,
1212
+ "description": description or f"Papers for {project} project",
1213
+ "created": datetime.now().isoformat(),
1214
+ "created_by": "SciTeX Scholar",
1215
+ "auto_created": True,
1216
+ }
1217
+
1218
+ with open(metadata_file, "w") as f:
1219
+ json.dump(metadata, f, indent=2)
1220
+
1221
+ logger.info(
1222
+ f"{self.name}: Created project metadata in info directory: {project}"
1223
+ )
1224
+
1225
+ return project_dir
1226
+
1227
+ def _create_project_metadata(
1228
+ self, project: str, description: Optional[str] = None
1229
+ ) -> Path:
1230
+ """Create project directory and metadata (PRIVATE).
1231
+
1232
+ DEPRECATED: Use _ensure_project_exists instead.
1233
+
1234
+ Args:
1235
+ project: Project name
1236
+ description: Optional project description
1237
+
1238
+ Returns:
1239
+ Path to the created project directory
1240
+ """
1241
+ # Just use the new method that puts metadata in info directory
1242
+ return self._ensure_project_exists(project, description)
1243
+
1244
+ def list_projects(self) -> List[Dict[str, Any]]:
1245
+ """List all projects in the Scholar library.
1246
+
1247
+ Returns:
1248
+ List of project information dictionaries
1249
+ """
1250
+ library_dir = self.config.get_library_project_dir()
1251
+ projects = []
1252
+
1253
+ for item in library_dir.iterdir():
1254
+ if item.is_dir() and item.name != "MASTER":
1255
+ project_info = {
1256
+ "name": item.name,
1257
+ "path": str(item),
1258
+ "papers_count": len(list(item.glob("*"))),
1259
+ "created": None,
1260
+ "description": None,
1261
+ }
1262
+
1263
+ # Load metadata if exists
1264
+ metadata_file = item / "project_metadata.json"
1265
+ if metadata_file.exists():
1266
+ try:
1267
+ with open(metadata_file, "r") as f:
1268
+ metadata = json.load(f)
1269
+ project_info.update(metadata)
1270
+ except Exception as e:
1271
+ logger.debug(
1272
+ f"Failed to load metadata for {item.name}: {e}"
1273
+ )
1274
+
1275
+ projects.append(project_info)
1276
+
1277
+ return sorted(projects, key=lambda x: x["name"])
1278
+
1279
+ # ----------------------------------------
1280
+ # Library Handlers
1281
+ # ----------------------------------------
1282
+ def get_library_statistics(self) -> Dict[str, Any]:
1283
+ """Get comprehensive statistics for the entire Scholar library.
1284
+
1285
+ Returns:
1286
+ Dictionary with library-wide statistics
1287
+ """
1288
+ master_dir = self.config.get_library_master_dir()
1289
+ projects = self.list_projects()
1290
+
1291
+ stats = {
1292
+ "total_projects": len(projects),
1293
+ "total_papers": (
1294
+ len(list(master_dir.glob("*"))) if master_dir.exists() else 0
1295
+ ),
1296
+ "projects": projects,
1297
+ "library_path": str(self.config.get_library_project_dir()),
1298
+ "master_path": str(master_dir),
1299
+ }
1300
+
1301
+ # Calculate storage usage
1302
+ if master_dir.exists():
1303
+ total_size = sum(
1304
+ f.stat().st_size for f in master_dir.rglob("*") if f.is_file()
1305
+ )
1306
+ stats["storage_mb"] = total_size / (1024 * 1024)
1307
+ else:
1308
+ stats["storage_mb"] = 0
1309
+
1310
+ return stats
1311
+
1312
+ def backup_library(self, backup_path: Union[str, Path]) -> Dict[str, Any]:
1313
+ """Create a backup of the Scholar library.
1314
+
1315
+ Args:
1316
+ backup_path: Path for the backup
1317
+
1318
+ Returns:
1319
+ Dictionary with backup information
1320
+ """
1321
+ backup_path = Path(backup_path)
1322
+ library_path = self.config.get_library_project_dir()
1323
+
1324
+ if not library_path.exists():
1325
+ raise ScholarError("Library directory does not exist")
1326
+
1327
+ # Create timestamped backup
1328
+ timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
1329
+ backup_dir = backup_path / f"scholar_library_backup_{timestamp}"
1330
+
1331
+ logger.info(f"{self.name}: Creating library backup at {backup_dir}")
1332
+ shutil.copytree(library_path, backup_dir)
1333
+
1334
+ # Create backup metadata
1335
+ backup_info = {
1336
+ "timestamp": timestamp,
1337
+ "source": str(library_path),
1338
+ "backup": str(backup_dir),
1339
+ "size_mb": sum(
1340
+ f.stat().st_size for f in backup_dir.rglob("*") if f.is_file()
1341
+ )
1342
+ / (1024 * 1024),
1343
+ }
1344
+
1345
+ metadata_file = backup_dir / "backup_metadata.json"
1346
+ with open(metadata_file, "w") as f:
1347
+ json.dump(backup_info, f, indent=2)
1348
+
1349
+ logger.info(
1350
+ f"{self.name}: Library backup completed: {backup_info['size_mb']:.2f} MB"
1351
+ )
1352
+ return backup_info
1353
+
1354
+ # =========================================================================
1355
+ # PIPELINE METHODS (Phase 2)
1356
+ # =========================================================================
1357
+
1358
    async def process_paper_async(
        self,
        title: Optional[str] = None,
        doi: Optional[str] = None,
        project: Optional[str] = None,
    ) -> "Paper":
        """
        Complete sequential pipeline for processing a single paper.

        Accepts either title OR doi. Uses storage-first approach:
        each stage checks storage before processing.

        Workflow:
            Stage 0: Resolve DOI from title (if needed)
            Stage 1: Load or create Paper from storage
            Stage 2: Find PDF URLs → save to storage
            Stage 3: Download PDF → save to storage
            Stage 4: Update project symlinks

        Args:
            title: Paper title (will resolve DOI using engine)
            doi: DOI of the paper (preferred if available)
            project: Project name (uses self.project if None)

        Returns:
            Fully processed Paper object

        Raises:
            ValueError: If neither title nor doi is given, or if a DOI
                cannot be resolved from the title.

        Examples:
            # With DOI (direct)
            paper = await scholar.process_paper_async(doi="10.1038/s41598-017-02626-y")

            # With title (resolves DOI first)
            paper = await scholar.process_paper_async(
                title="Attention Is All You Need"
            )
        """
        from scitex.scholar.core.Paper import Paper

        # Validate input: at least one identifier is required.
        if not title and not doi:
            raise ValueError("Must provide either title or doi")

        project = project or self.project

        logger.info(f"{'='*60}")
        logger.info(f"Processing paper")
        if title:
            logger.info(f"Title: {title[:50]}...")
        if doi:
            logger.info(f"DOI: {doi}")
        logger.info(f"{'='*60}")

        # Stage 0: Resolve DOI from title (if needed)
        if not doi and title:
            logger.info(f"Stage 0: Resolving DOI from title...")

            # Use ScholarEngine to search and get DOI
            results = await self._scholar_engine.search_async(title=title)

            if results and results.get("id", {}).get("doi"):
                doi = results["id"]["doi"]
                logger.success(f"Resolved DOI: {doi}")
            else:
                logger.error(f"Could not resolve DOI from title: {title}")
                raise ValueError(f"Could not resolve DOI from title: {title}")

        # The DOI determines the stable paper ID and MASTER storage location.
        paper_id = self.config.path_manager._generate_paper_id(doi=doi)
        storage_path = self.config.get_library_master_dir() / paper_id

        logger.info(f"Paper ID: {paper_id}")
        logger.info(f"Storage: {storage_path}")

        # Stage 1: Load or create Paper from storage
        logger.info(f"\nStage 1: Loading/creating metadata...")
        if self._library_manager.has_metadata(paper_id):
            # Load existing from storage
            paper = self._library_manager.load_paper_from_id(paper_id)
            logger.info(f"Loaded existing metadata from storage")
        else:
            # Create new Paper
            paper = Paper()
            paper.metadata.set_doi(doi)
            paper.container.scitex_id = paper_id

            # If we have title, save it
            if title:
                paper.metadata.basic.title = title

            # Create storage and save
            self._library_manager.save_paper_incremental(paper_id, paper)
            logger.success(f"Created new paper entry in storage")

        # Stage 2: Check/find URLs (skipped if storage already has them)
        logger.info(f"\nStage 2: Checking/finding PDF URLs...")
        if not self._library_manager.has_urls(paper_id):
            logger.info(f"Finding PDF URLs for DOI: {doi}")
            browser, context = (
                await self._browser_manager.get_authenticated_browser_and_context_async()
            )
            try:
                url_finder = ScholarURLFinder(context, config=self.config)
                urls = await url_finder.find_pdf_urls(doi)

                paper.metadata.url.pdfs = urls
                self._library_manager.save_paper_incremental(paper_id, paper)
                logger.success(f"Found {len(urls)} PDF URLs, saved to storage")
            finally:
                # Browser is always released, even on failure.
                await self._browser_manager.close()
        else:
            # NOTE(review): assumes the loaded paper object carries the
            # stored URLs whenever has_urls() is true — confirm that
            # load_paper_from_id() populates metadata.url.pdfs.
            logger.info(
                f"PDF URLs already in storage ({len(paper.metadata.url.pdfs)} URLs)"
            )

        # Stage 3: Check/download PDF (first URL only; no retry over the
        # remaining candidates)
        logger.info(f"\nStage 3: Checking/downloading PDF...")
        if not self._library_manager.has_pdf(paper_id):
            logger.info(f"Downloading PDF...")
            if paper.metadata.url.pdfs:
                browser, context = (
                    await self._browser_manager.get_authenticated_browser_and_context_async()
                )
                try:
                    downloader = ScholarPDFDownloader(
                        context, config=self.config
                    )

                    # URL entries may be {"url": ...} dicts or plain strings
                    pdf_url = (
                        paper.metadata.url.pdfs[0]["url"]
                        if isinstance(paper.metadata.url.pdfs[0], dict)
                        else paper.metadata.url.pdfs[0]
                    )
                    temp_path = storage_path / "main.pdf"

                    result = await downloader.download_from_url(
                        pdf_url, temp_path, doi=doi
                    )
                    if result and result.exists():
                        paper.metadata.path.pdfs.append(str(result))
                        self._library_manager.save_paper_incremental(
                            paper_id, paper
                        )
                        logger.success(
                            f"{self.name}: Downloaded PDF, saved to storage"
                        )
                    else:
                        logger.warning(f"{self.name}: Failed to download PDF")
                finally:
                    await self._browser_manager.close()
            else:
                logger.warning(
                    f"{self.name}: No PDF URLs available for download"
                )
        else:
            logger.info(f"{self.name}: PDF already in storage")

        # Stage 4: Update project symlinks (MASTER itself needs no link)
        if project and project not in ["master", "MASTER"]:
            logger.info(
                f"{self.name}: \nStage 4: Updating project symlinks..."
            )
            self._library_manager.update_symlink(
                master_storage_path=storage_path,
                project=project,
            )
            logger.success(
                f"{self.name}: Updated symlink in project: {project}"
            )

        logger.info(f"\n{'='*60}")
        logger.success(f"{self.name}: Paper processing complete")
        logger.info(f"{'='*60}\n")

        return paper
1532
+
1533
+ def process_paper(
1534
+ self,
1535
+ title: Optional[str] = None,
1536
+ doi: Optional[str] = None,
1537
+ project: Optional[str] = None,
1538
+ ) -> "Paper":
1539
+ """
1540
+ Synchronous wrapper for process_paper_async.
1541
+
1542
+ See process_paper_async() for full documentation.
1543
+ """
1544
+ return asyncio.run(
1545
+ self.process_paper_async(title=title, doi=doi, project=project)
1546
+ )
1547
+
1548
+ # =========================================================================
1549
+ # PIPELINE METHODS (Phase 3) - Parallel Papers Processing
1550
+ # =========================================================================
1551
+
1552
    async def process_papers_async(
        self,
        papers: Union["Papers", List[str]],
        project: Optional[str] = None,
        max_concurrent: int = 3,
    ) -> "Papers":
        """
        Process multiple papers with controlled parallelism.

        Each paper goes through complete sequential pipeline.
        Semaphore controls how many papers process concurrently.

        Architecture:
            - Parallel papers (max_concurrent at a time)
            - Sequential stages per paper
            - Storage checks before each stage

        Args:
            papers: Papers collection or list of DOIs
            project: Project name (uses self.project if None)
            max_concurrent: Maximum concurrent papers (default: 3)
                Set to 1 for purely sequential processing

        Returns:
            Papers collection with processed papers (failed papers are
            omitted from the result)

        Examples:
            # Process Papers collection (parallel)
            papers = scholar.load_bibtex("papers.bib")
            processed = await scholar.process_papers_async(papers, max_concurrent=3)

            # Process DOI list (sequential)
            dois = ["10.1038/...", "10.1016/...", "10.1109/..."]
            processed = await scholar.process_papers_async(dois, max_concurrent=1)
        """
        from scitex.scholar.core.Papers import Papers

        project = project or self.project

        # Convert a plain list of DOI strings to a Papers collection so the
        # rest of the method only deals with one input shape.
        if isinstance(papers, list):
            papers_list = []
            for doi in papers:
                from scitex.scholar.core.Paper import Paper

                p = Paper()
                p.metadata.set_doi(doi)
                papers_list.append(p)
            papers = Papers(papers_list, project=project, config=self.config)

        total = len(papers)
        logger.info(f"{self.name}: \n{'='*60}")
        logger.info(
            f"{self.name}: Processing {total} papers (max_concurrent={max_concurrent})"
        )
        logger.info(f"{self.name}: Project: {project}")
        logger.info(f"{self.name}: {'='*60}\n")

        # Semaphore bounds how many papers run the pipeline at once.
        semaphore = asyncio.Semaphore(max_concurrent)

        async def process_with_semaphore(paper, index):
            """Process one paper with semaphore control."""
            async with semaphore:
                logger.info(
                    f"{self.name}: \n[{index}/{total}] Starting paper..."
                )
                try:
                    result = await self.process_paper_async(
                        title=paper.metadata.basic.title,
                        doi=paper.metadata.id.doi,
                        project=project,
                    )
                    logger.success(f"{self.name}: [{index}/{total}] Completed")
                    return result
                except Exception as e:
                    # Per-paper failures return None so one bad paper does
                    # not abort the batch.
                    logger.error(f"{self.name}: [{index}/{total}] Failed: {e}")
                    return None

        # Create tasks for all papers (1-based index for log messages)
        tasks = [
            process_with_semaphore(paper, i + 1)
            for i, paper in enumerate(papers)
        ]

        # return_exceptions=True keeps gather from cancelling siblings when
        # one task raises outside the per-paper try/except.
        results = await asyncio.gather(*tasks, return_exceptions=True)

        # Keep only successfully processed papers; count raised exceptions.
        processed_papers = []
        errors = 0
        for i, result in enumerate(results):
            if isinstance(result, Exception):
                logger.error(
                    f"{self.name}: Paper {i+1} raised exception: {result}"
                )
                errors += 1
            elif result is not None:
                processed_papers.append(result)

        # Summary
        logger.info(f"{self.name}: \n{'='*60}")
        logger.info(f"{self.name}: Batch Processing Complete")
        logger.info(f"{self.name}: Total: {total}")
        logger.info(f"{self.name}: Successful: {len(processed_papers)}")
        logger.info(f"{self.name}: Failed: {total - len(processed_papers)}")
        logger.info(f"{self.name}: Errors: {errors}")
        logger.info(f"{self.name}: {'='*60}\n")

        return Papers(processed_papers, project=project, config=self.config)
1663
+
1664
+ def process_papers(
1665
+ self,
1666
+ papers: Union["Papers", List[str]],
1667
+ project: Optional[str] = None,
1668
+ max_concurrent: int = 3,
1669
+ ) -> "Papers":
1670
+ """
1671
+ Synchronous wrapper for process_papers_async.
1672
+
1673
+ See process_papers_async() for full documentation.
1674
+ """
1675
+ return asyncio.run(
1676
+ self.process_papers_async(
1677
+ papers=papers,
1678
+ project=project,
1679
+ max_concurrent=max_concurrent,
1680
+ )
1681
+ )
1682
+
1683
+ # =========================================================================
1684
+ # INTERNAL SERVICES (PRIVATE - users should not access these directly)
1685
+ # =========================================================================
1686
+ def _init_config(self, config):
1687
+ # Handle different config input types
1688
+ if config is None:
1689
+ return ScholarConfig.load() # Auto-detect config
1690
+ elif isinstance(config, (str, Path)):
1691
+ return ScholarConfig.from_yaml(config)
1692
+ elif isinstance(config, ScholarConfig):
1693
+ return config
1694
+ else:
1695
+ raise TypeError(f"Invalid config type: {type(config)}")
1696
+
1697
+ @property
1698
+ def _scholar_engine(self) -> ScholarEngine:
1699
+ """Get Scholar engine for search and enrichment (PRIVATE)."""
1700
+ if (
1701
+ not hasattr(self, "__scholar_engine")
1702
+ or self.__scholar_engine is None
1703
+ ):
1704
+ self.__scholar_engine = ScholarEngine(config=self.config)
1705
+ return self.__scholar_engine
1706
+
1707
+ @property
1708
+ def _auth_manager(self) -> ScholarAuthManager:
1709
+ """Get authentication manager service (PRIVATE)."""
1710
+ if not hasattr(self, "__auth_manager") or self.__auth_manager is None:
1711
+ self.__auth_manager = ScholarAuthManager()
1712
+ return self.__auth_manager
1713
+
1714
+ @property
1715
+ def _browser_manager(self) -> ScholarBrowserManager:
1716
+ """Get browser manager service (PRIVATE)."""
1717
+ if (
1718
+ not hasattr(self, "__browser_manager")
1719
+ or self.__browser_manager is None
1720
+ ):
1721
+ self.__browser_manager = ScholarBrowserManager(
1722
+ auth_manager=self._auth_manager,
1723
+ chrome_profile_name="system",
1724
+ browser_mode=self.browser_mode,
1725
+ )
1726
+ return self.__browser_manager
1727
+
1728
+ @property
1729
+ def _library_manager(self) -> LibraryManager:
1730
+ """Get library manager service - low-level operations (PRIVATE)."""
1731
+ if (
1732
+ not hasattr(self, "__library_manager")
1733
+ or self.__library_manager is None
1734
+ ):
1735
+ self.__library_manager = LibraryManager(
1736
+ project=self.project, config=self.config
1737
+ )
1738
+ return self.__library_manager
1739
+
1740
+ @property
1741
+ def _library(self) -> ScholarLibrary:
1742
+ """Get Scholar library service - high-level operations (PRIVATE)."""
1743
+ if not hasattr(self, "__library") or self.__library is None:
1744
+ self.__library = ScholarLibrary(
1745
+ project=self.project, config=self.config
1746
+ )
1747
+ return self.__library
1748
+
1749
+
1750
# Export all classes and functions
# Only the Scholar facade is part of this module's public API; the manager
# and engine services it wraps stay private.
__all__ = ["Scholar"]
1752
+
1753
if __name__ == "__main__":
    from scitex.scholar.core.Paper import Paper
    from scitex.scholar.core.Papers import Papers

    def main():
        """Demonstrate Scholar class usage - Clean API Demo."""
        print("\n" + "=" * 60)
        print("🎓 Scholar Module Demo - Clean API")
        print("=" * 60 + "\n")

        # ----------------------------------------
        # 1. Initialize Scholar
        # ----------------------------------------
        print("1️⃣ Initialize Scholar")
        print("-" * 60)
        scholar = Scholar(
            project="demo_project",
            project_description="Demo project for testing Scholar API",
        )
        # NOTE: dropped needless ``f`` prefixes on placeholder-free
        # literals throughout; output is unchanged.
        print("✓ Scholar initialized")
        print(f" Project: {scholar.project}")
        print(f" Workspace: {scholar.get_workspace_dir()}")
        print()

        # Demonstrate project management
        print("2. Project Management:")
        try:
            # Create a new project
            project_dir = scholar._create_project_metadata(
                "neural_networks_2024",
                description="Collection of neural network papers from 2024",
            )
            print(" ✅ Created project: neural_networks_2024")
            print(f" 📂 Project directory: {project_dir}")

            # List all projects
            projects = scholar.list_projects()
            print(f" 📋 Total projects in library: {len(projects)}")
            for project in projects[:3]:  # Show first 3
                print(
                    f" - {project['name']}: {project.get('description', 'No description')}"
                )
            if len(projects) > 3:
                print(f" ... and {len(projects) - 3} more")

        except Exception as e:
            print(f" ⚠️ Project management demo skipped: {e}")
        print()

        # Demonstrate library statistics
        print("3. Library Statistics:")
        try:
            stats = scholar.get_library_statistics()
            print(f" 📊 Total projects: {stats['total_projects']}")
            print(f" 📚 Total papers: {stats['total_papers']}")
            print(f" 💾 Storage usage: {stats['storage_mb']:.2f} MB")
            print(f" 📁 Library path: {stats['library_path']}")

        except Exception as e:
            print(f" ⚠️ Library statistics demo skipped: {e}")
        print()

        # Demonstrate paper and project operations
        print("4. Working with Papers:")

        # Create some sample papers with Pydantic structure
        p1 = Paper()
        p1.metadata.basic.title = (
            "Vision Transformer: An Image Is Worth 16x16 Words"
        )
        p1.metadata.basic.authors = ["Dosovitskiy, Alexey", "Beyer, Lucas"]
        p1.metadata.basic.year = 2021
        p1.metadata.basic.keywords = [
            "vision transformer",
            "computer vision",
            "attention",
        ]
        p1.metadata.publication.journal = "ICLR"
        p1.metadata.set_doi("10.48550/arXiv.2010.11929")
        p1.container.projects = ["neural_networks_2024"]

        p2 = Paper()
        p2.metadata.basic.title = "Scaling Laws for Neural Language Models"
        p2.metadata.basic.authors = ["Kaplan, Jared", "McCandlish, Sam"]
        p2.metadata.basic.year = 2020
        p2.metadata.basic.keywords = ["scaling laws", "language models", "GPT"]
        p2.metadata.publication.journal = "arXiv preprint"
        p2.metadata.set_doi("10.48550/arXiv.2001.08361")
        p2.container.projects = ["neural_networks_2024"]

        sample_papers = [p1, p2]

        # Create Papers collection
        papers = Papers(
            sample_papers,
            project="neural_networks_2024",
            config=scholar.config,
        )
        print(f" 📝 Created collection with {len(papers)} papers")

        # Use Scholar to work with the collection
        # Switch project by creating new instance (cleaner pattern)
        scholar = Scholar(project="neural_networks_2024")
        print(f" 🎯 Set Scholar project to: {scholar.project}")
        print()

        # Demonstrate DOI resolution workflow
        print("5. Scholar Workflow Integration:")
        try:
            # Create a sample BibTeX content for demonstration
            sample_bibtex = """
            @article{sample2024,
                title = {Sample Paper for Demo},
                author = {Demo, Author},
                year = {2024},
                journal = {Demo Journal}
            }
            """

            # Demonstrate BibTeX loading
            papers_from_bibtex = scholar.load_bibtex(sample_bibtex.strip())
            print(f" 📄 Loaded {len(papers_from_bibtex)} papers from BibTeX")

            # Demonstrate project loading
            if scholar.project:
                try:
                    project_papers = scholar.load_project()
                    print(
                        f" 📂 Loaded {len(project_papers)} papers from current project"
                    )
                # BUG FIX: was a bare ``except:`` which would also swallow
                # KeyboardInterrupt/SystemExit; narrowed to Exception.
                except Exception:
                    print(
                        " 📂 Current project is empty or doesn't exist yet"
                    )

        except Exception as e:
            print(f" ⚠️ Workflow demo partially skipped: {e}")
        print()

        # Demonstrate search capabilities
        print("6. Search Capabilities:")
        try:
            # Search across projects
            search_results = scholar.search_across_projects("transformer")
            print(
                f" 🔍 Search for 'transformer': {len(search_results)} results across all projects"
            )

            # Search in current library (existing papers)
            library_search = scholar.search_library("vision")
            print(
                f" 🔍 Library search for 'vision': {len(library_search)} results"
            )

        except Exception as e:
            print(f" ⚠️ Search demo skipped: {e}")
        print()

        # Demonstrate configuration access
        print("7. Configuration Management:")
        print(f" ⚙️ Scholar directory: {scholar.config.paths.scholar_dir}")
        print(
            f" ⚙️ Library directory: {scholar.config.get_library_project_dir()}"
        )
        print(
            f" ⚙️ Debug mode: {scholar.config.resolve('debug_mode', default=False)}"
        )
        print()

        # Demonstrate service access (internal components)
        print("8. Service Components (Internal):")
        print(
            f" 🔧 Scholar Engine: {type(scholar._scholar_engine).__name__}"
        )
        print(f" 🔧 Auth Manager: {type(scholar._auth_manager).__name__}")
        print(
            f" 🔧 Browser Manager: {type(scholar._browser_manager).__name__}"
        )
        print(
            f" 🔧 Library Manager: {type(scholar._library_manager).__name__}"
        )
        print()

        # Demonstrate backup capabilities
        print("9. Backup and Maintenance:")
        try:
            # BUG FIX: removed unused ``import os``.
            import tempfile

            # Create a temporary backup location
            backup_dir = Path(tempfile.mkdtemp()) / "scholar_backup"
            backup_info = scholar.backup_library(backup_dir)
            print(" 💾 Library backup created:")
            print(f" 📁 Location: {backup_info['backup']}")
            print(f" 📊 Size: {backup_info['size_mb']:.2f} MB")
            print(f" 🕐 Timestamp: {backup_info['timestamp']}")

            # Clean up
            import shutil

            shutil.rmtree(backup_dir, ignore_errors=True)

        except Exception as e:
            print(f" ⚠️ Backup demo skipped: {e}")
        print()

        print("Scholar global management demo completed! ✨")
        print()
        print("💡 Key Scholar Capabilities:")
        print(" • Global library management and statistics")
        print(" • Project creation and organization")
        print(" • Cross-project search and analysis")
        print(" • Integration with Paper and Papers classes")
        print(" • DOI resolution and metadata enrichment")
        print(" • PDF download and browser automation")
        print(" • Backup and maintenance operations")
        print()

    main()
1972
+
1973
+ # python -m scitex.scholar.core.Scholar
1974
+
1975
+ # EOF