SinaTools 0.1.23__tar.gz → 0.1.25__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (189)
  1. {SinaTools-0.1.23 → SinaTools-0.1.25}/PKG-INFO +1 -1
  2. {SinaTools-0.1.23 → SinaTools-0.1.25}/SinaTools.egg-info/PKG-INFO +1 -1
  3. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/DataDownload/downloader.py +45 -41
  4. SinaTools-0.1.25/sinatools/VERSION +1 -0
  5. SinaTools-0.1.23/sinatools/VERSION +0 -1
  6. {SinaTools-0.1.23 → SinaTools-0.1.25}/AUTHORS.rst +0 -0
  7. {SinaTools-0.1.23 → SinaTools-0.1.25}/CONTRIBUTING.rst +0 -0
  8. {SinaTools-0.1.23 → SinaTools-0.1.25}/LICENSE +0 -0
  9. {SinaTools-0.1.23 → SinaTools-0.1.25}/MANIFEST.in +0 -0
  10. {SinaTools-0.1.23 → SinaTools-0.1.25}/README.rst +0 -0
  11. {SinaTools-0.1.23 → SinaTools-0.1.25}/SinaTools.egg-info/SOURCES.txt +0 -0
  12. {SinaTools-0.1.23 → SinaTools-0.1.25}/SinaTools.egg-info/dependency_links.txt +0 -0
  13. {SinaTools-0.1.23 → SinaTools-0.1.25}/SinaTools.egg-info/entry_points.txt +0 -0
  14. {SinaTools-0.1.23 → SinaTools-0.1.25}/SinaTools.egg-info/not-zip-safe +0 -0
  15. {SinaTools-0.1.23 → SinaTools-0.1.25}/SinaTools.egg-info/requires.txt +0 -0
  16. {SinaTools-0.1.23 → SinaTools-0.1.25}/SinaTools.egg-info/top_level.txt +0 -0
  17. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/Makefile +0 -0
  18. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/_images/download.png +0 -0
  19. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/_static/download.png +0 -0
  20. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/_static/file.png +0 -0
  21. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/_static/minus.png +0 -0
  22. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/_static/plus.png +0 -0
  23. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/html/_images/SinaLogo.jpg +0 -0
  24. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/html/_images/download.png +0 -0
  25. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/html/_static/SinaLogo.jpg +0 -0
  26. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/html/_static/download.png +0 -0
  27. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/html/_static/file.png +0 -0
  28. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/html/_static/minus.png +0 -0
  29. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/build/html/_static/plus.png +0 -0
  30. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/make.bat +0 -0
  31. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/License.rst +0 -0
  32. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/Overview.rst +0 -0
  33. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/_static/SinaLogo.jpg +0 -0
  34. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/_static/download.png +0 -0
  35. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/about.rst +0 -0
  36. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/DataDownload/downloader.rst +0 -0
  37. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/DataDownload.rst +0 -0
  38. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/arabiner/bin/infer.rst +0 -0
  39. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/arabiner.rst +0 -0
  40. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/morphology/morph_analyzer.rst +0 -0
  41. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/morphology.rst +0 -0
  42. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/salma/views.rst +0 -0
  43. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/salma.rst +0 -0
  44. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/utils/corpus_tokenizer.rst +0 -0
  45. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/utils/implication.rst +0 -0
  46. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/utils/jaccard.rst +0 -0
  47. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/utils/parser.rst +0 -0
  48. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/utils/sentence_tokenizer.rst +0 -0
  49. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/utils/text_transliteration.rst +0 -0
  50. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api/utils.rst +0 -0
  51. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/api.rst +0 -0
  52. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/authors.rst +0 -0
  53. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/DataDownload/download_files.rst +0 -0
  54. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/DataDownload/get_appdatadir.rst +0 -0
  55. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/DataDownload.rst +0 -0
  56. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/arabiner/infer.rst +0 -0
  57. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/arabiner.rst +0 -0
  58. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/morphology/ALMA_multi_word.rst +0 -0
  59. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/morphology/morph_analyzer.rst +0 -0
  60. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/morphology.rst +0 -0
  61. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/salma/salma_tools.rst +0 -0
  62. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/salma.rst +0 -0
  63. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/utils/arStrip.rst +0 -0
  64. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/utils/corpus_tokenizer.rst +0 -0
  65. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/utils/implication.rst +0 -0
  66. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/utils/jaccard.rst +0 -0
  67. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/utils/latin_remove.rst +0 -0
  68. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/utils/remove_punc.rst +0 -0
  69. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/utils/sentence_tokenizer.rst +0 -0
  70. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/utils/text_transliteration.rst +0 -0
  71. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools/utils.rst +0 -0
  72. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/cli_tools.rst +0 -0
  73. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/conf.py +0 -0
  74. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/index.rst +0 -0
  75. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/installation.rst +0 -0
  76. {SinaTools-0.1.23 → SinaTools-0.1.25}/docs/source/readme.rst +0 -0
  77. {SinaTools-0.1.23 → SinaTools-0.1.25}/setup.cfg +0 -0
  78. {SinaTools-0.1.23 → SinaTools-0.1.25}/setup.py +0 -0
  79. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/DataDownload/download_files.py +0 -0
  80. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/morphology/ALMA_multi_word.py +0 -0
  81. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/morphology/morph_analyzer.py +0 -0
  82. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/ner/corpus_entity_extractor.py +0 -0
  83. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/ner/entity_extractor.py +0 -0
  84. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/utils/__init__.py +0 -0
  85. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/utils/arStrip.py +0 -0
  86. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/utils/corpus_tokenizer.py +0 -0
  87. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/utils/implication.py +0 -0
  88. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/utils/jaccard.py +0 -0
  89. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/utils/remove_latin.py +0 -0
  90. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/utils/remove_punctuation.py +0 -0
  91. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/utils/sentence_tokenizer.py +0 -0
  92. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/utils/text_dublication_detector.py +0 -0
  93. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/CLI/utils/text_transliteration.py +0 -0
  94. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/DataDownload/__init__.py +0 -0
  95. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/__init__.py +0 -0
  96. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/__init__.py +0 -0
  97. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/__init__.py +0 -0
  98. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/create_classification_data.py +0 -0
  99. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/create_pretraining_data.py +0 -0
  100. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/extract_features.py +0 -0
  101. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/lamb_optimizer.py +0 -0
  102. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/modeling.py +0 -0
  103. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/optimization.py +0 -0
  104. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/run_classifier.py +0 -0
  105. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/run_pretraining.py +0 -0
  106. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/run_squad.py +0 -0
  107. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/arabert/tokenization.py +0 -0
  108. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/__init__.py +0 -0
  109. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/build_openwebtext_pretraining_dataset.py +0 -0
  110. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/build_pretraining_dataset.py +0 -0
  111. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/build_pretraining_dataset_single_file.py +0 -0
  112. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/configure_finetuning.py +0 -0
  113. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/configure_pretraining.py +0 -0
  114. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/finetune/__init__.py +0 -0
  115. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/finetune/feature_spec.py +0 -0
  116. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/finetune/preprocessing.py +0 -0
  117. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/finetune/scorer.py +0 -0
  118. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/finetune/task.py +0 -0
  119. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/finetune/task_builder.py +0 -0
  120. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/flops_computation.py +0 -0
  121. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/model/__init__.py +0 -0
  122. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/model/modeling.py +0 -0
  123. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/model/optimization.py +0 -0
  124. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/model/tokenization.py +0 -0
  125. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/pretrain/__init__.py +0 -0
  126. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/pretrain/pretrain_data.py +0 -0
  127. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/pretrain/pretrain_helpers.py +0 -0
  128. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/run_finetuning.py +0 -0
  129. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/run_pretraining.py +0 -0
  130. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/util/__init__.py +0 -0
  131. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/util/training_utils.py +0 -0
  132. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/araelectra/util/utils.py +0 -0
  133. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/__init__.py +0 -0
  134. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/create_pretraining_data.py +0 -0
  135. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/gpt2/__init__.py +0 -0
  136. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/gpt2/lamb_optimizer.py +0 -0
  137. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/gpt2/optimization.py +0 -0
  138. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/gpt2/run_pretraining.py +0 -0
  139. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/grover/__init__.py +0 -0
  140. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/grover/dataloader.py +0 -0
  141. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/grover/modeling.py +0 -0
  142. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/grover/modeling_gpt2.py +0 -0
  143. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/grover/optimization_adafactor.py +0 -0
  144. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/grover/train_tpu.py +0 -0
  145. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/grover/utils.py +0 -0
  146. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/aragpt2/train_bpe_tokenizer.py +0 -0
  147. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/arabert/preprocess.py +0 -0
  148. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/environment.yml +0 -0
  149. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/install_env.py +0 -0
  150. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/morphology/ALMA_multi_word.py +0 -0
  151. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/morphology/__init__.py +0 -0
  152. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/morphology/morph_analyzer.py +0 -0
  153. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/__init__.py +0 -0
  154. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/data/__init__.py +0 -0
  155. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/data/datasets.py +0 -0
  156. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/data/transforms.py +0 -0
  157. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/data_format.py +0 -0
  158. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/datasets.py +0 -0
  159. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/entity_extractor.py +0 -0
  160. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/helpers.py +0 -0
  161. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/metrics.py +0 -0
  162. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/nn/BaseModel.py +0 -0
  163. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/nn/BertNestedTagger.py +0 -0
  164. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/nn/BertSeqTagger.py +0 -0
  165. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/nn/__init__.py +0 -0
  166. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/trainers/BaseTrainer.py +0 -0
  167. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/trainers/BertNestedTrainer.py +0 -0
  168. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/trainers/BertTrainer.py +0 -0
  169. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/trainers/__init__.py +0 -0
  170. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/ner/transforms.py +0 -0
  171. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/semantic_relatedness/__init__.py +0 -0
  172. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/semantic_relatedness/compute_relatedness.py +0 -0
  173. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/sinatools.py +0 -0
  174. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/synonyms/__init__.py +0 -0
  175. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/synonyms/synonyms_generator.py +0 -0
  176. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/utils/__init__.py +0 -0
  177. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/utils/charsets.py +0 -0
  178. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/utils/implication.py +0 -0
  179. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/utils/jaccard.py +0 -0
  180. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/utils/parser.py +0 -0
  181. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/utils/readfile.py +0 -0
  182. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/utils/text_dublication_detector.py +0 -0
  183. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/utils/text_transliteration.py +0 -0
  184. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/utils/tokenizer.py +0 -0
  185. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/utils/tokenizers_words.py +0 -0
  186. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/wsd/__init__.py +0 -0
  187. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/wsd/disambiguator.py +0 -0
  188. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/wsd/settings.py +0 -0
  189. {SinaTools-0.1.23 → SinaTools-0.1.25}/sinatools/wsd/wsd.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: SinaTools
3
- Version: 0.1.23
3
+ Version: 0.1.25
4
4
  Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
5
5
  Home-page: https://github.com/SinaLab/sinatools
6
6
  License: MIT license
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: SinaTools
3
- Version: 0.1.23
3
+ Version: 0.1.25
4
4
  Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
5
5
  Home-page: https://github.com/SinaLab/sinatools
6
6
  License: MIT license
@@ -7,16 +7,16 @@ from tqdm import tqdm
7
7
  import tarfile
8
8
  urls = {
9
9
  'morph': 'https://sina.birzeit.edu/lemmas_dic.pickle',
10
- 'ner': 'https://portal.sina.birzeit.edu/Wj27012000.tar.gz',
11
- 'wsd_model': 'https://portal.sina.birzeit.edu/bert-base-arabertv02_22_May_2021_00h_allglosses_unused01.zip',
12
- 'wsd_tokenizer': 'https://portal.sina.birzeit.edu/bert-base-arabertv02.zip',
13
- 'glosses_dic': 'https://portal.sina.birzeit.edu/glosses_dic.pickle',
14
- 'five_grams': 'https://portal.sina.birzeit.edu/five_grams.pickle',
15
- 'four_grams':'https://portal.sina.birzeit.edu/four_grams.pickle',
16
- 'three_grams':'https://portal.sina.birzeit.edu/three_grams.pickle',
17
- 'two_grams':'https://portal.sina.birzeit.edu/two_grams.pickle',
18
- 'synonyms_level2':'https://portal.sina.birzeit.edu/synonyms_level2.pkl',
19
- 'synonyms_level3':'https://portal.sina.birzeit.edu/synonyms_level3.pkl'
10
+ 'ner': 'https://sina.birzeit.edu/Wj27012000.tar.gz',
11
+ 'wsd_model': 'https://sina.birzeit.edu/bert-base-arabertv02_22_May_2021_00h_allglosses_unused01.zip',
12
+ 'wsd_tokenizer': 'https://sina.birzeit.edu/bert-base-arabertv02.zip',
13
+ 'glosses_dic': 'https://sina.birzeit.edu/glosses_dic.pickle',
14
+ 'five_grams': 'https://sina.birzeit.edu/five_grams.pickle',
15
+ 'four_grams':'https://sina.birzeit.edu/four_grams.pickle',
16
+ 'three_grams':'https://sina.birzeit.edu/three_grams.pickle',
17
+ 'two_grams':'https://sina.birzeit.edu/two_grams.pickle',
18
+ 'synonyms_level2':'https://sina.birzeit.edu/synonyms_level2.pkl',
19
+ 'synonyms_level3':'https://sina.birzeit.edu/synonyms_level3.pkl'
20
20
  }
21
21
 
22
22
  def get_appdatadir():
@@ -95,37 +95,41 @@ def download_file(url, dest_path=get_appdatadir()):
95
95
  print(filename)
96
96
  headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.3029.110 Safari/537.3'}
97
97
 
98
- # try:
99
- with requests.get(url, headers=headers, stream=True) as r:
100
- r.raise_for_status()
101
- with open(file_path, 'wb') as f:
102
- total_size = int(r.headers.get('content-length', 0))
103
- block_size = 8192
104
- progress_bar = tqdm(total=total_size, unit='iB', unit_scale=True)
105
- for chunk in r.iter_content(chunk_size=block_size):
106
- if chunk:
107
- f.write(chunk)
108
- progress_bar.update(len(chunk))
109
- progress_bar.close()
110
- # Check the file type and extract accordingly
111
- file_extension = os.path.splitext(file_path)[1]
112
- extracted_folder_name = os.path.splitext(file_path)[0]
113
-
114
- if file_extension == '.zip':
115
- extract_zip(file_path, extracted_folder_name)
116
- elif file_extension == '.gz':
117
- extract_tar(file_path, extracted_folder_name)
118
- elif file_extension =='.pickle':
119
- print(f'Done: {file_extension}')
120
- else:
121
- print(f'Unsupported file type for extraction: {file_extension}')
122
- return file_path
123
-
124
- # except requests.exceptions.HTTPError as e:
125
- # if e.response.status_code == 403:
126
- # print(f'Error 403: Forbidden. The requested file URL {url} could not be downloaded due to insufficient permissions. Please check the URL and try again.')
127
- # else:
128
- # print('An error occurred while downloading the file:', e)
98
+ try:
99
+ with requests.get(url, headers=headers, stream=True) as r:
100
+ r.raise_for_status()
101
+ with open(file_path, 'wb') as f:
102
+ total_size = int(r.headers.get('content-length', 0))
103
+ block_size = 8192
104
+ progress_bar = tqdm(total=total_size, unit='iB', unit_scale=True)
105
+ for chunk in r.iter_content(chunk_size=block_size):
106
+ if chunk:
107
+ f.write(chunk)
108
+ progress_bar.update(len(chunk))
109
+ progress_bar.close()
110
+
111
+ # Check the file type and extract accordingly
112
+ file_extension = os.path.splitext(file_path)[1]
113
+ extracted_folder_name = os.path.splitext(file_path)[0]
114
+
115
+ if file_extension == '.zip':
116
+ extract_zip(file_path, extracted_folder_name)
117
+ elif file_extension == '.gz':
118
+
119
+ extract_tar(file_path, extracted_folder_name)
120
+ elif file_extension =='.pickle':
121
+ print(f'Done: {file_extension}')
122
+
123
+ else:
124
+ print(f'Unsupported file type for extraction: {file_extension}')
125
+
126
+ return file_path
127
+
128
+ except requests.exceptions.HTTPError as e:
129
+ if e.response.status_code == 403:
130
+ print(f'Error 403: Forbidden. The requested file URL {url} could not be downloaded due to insufficient permissions. Please check the URL and try again.')
131
+ else:
132
+ print('An error occurred while downloading the file:', e)
129
133
 
130
134
  def extract_zip(file_path, extracted_folder_name):
131
135
  """
@@ -0,0 +1 @@
1
+ 0.1.25
@@ -1 +0,0 @@
1
- 0.1.23
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes