SinaTools 0.1.21__tar.gz → 0.1.23__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (189) hide show
  1. {SinaTools-0.1.21 → SinaTools-0.1.23}/PKG-INFO +1 -1
  2. {SinaTools-0.1.21 → SinaTools-0.1.23}/SinaTools.egg-info/PKG-INFO +1 -1
  3. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/DataDownload/download_files.py +2 -2
  4. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/DataDownload/downloader.py +37 -40
  5. SinaTools-0.1.23/sinatools/VERSION +1 -0
  6. SinaTools-0.1.21/sinatools/VERSION +0 -1
  7. {SinaTools-0.1.21 → SinaTools-0.1.23}/AUTHORS.rst +0 -0
  8. {SinaTools-0.1.21 → SinaTools-0.1.23}/CONTRIBUTING.rst +0 -0
  9. {SinaTools-0.1.21 → SinaTools-0.1.23}/LICENSE +0 -0
  10. {SinaTools-0.1.21 → SinaTools-0.1.23}/MANIFEST.in +0 -0
  11. {SinaTools-0.1.21 → SinaTools-0.1.23}/README.rst +0 -0
  12. {SinaTools-0.1.21 → SinaTools-0.1.23}/SinaTools.egg-info/SOURCES.txt +0 -0
  13. {SinaTools-0.1.21 → SinaTools-0.1.23}/SinaTools.egg-info/dependency_links.txt +0 -0
  14. {SinaTools-0.1.21 → SinaTools-0.1.23}/SinaTools.egg-info/entry_points.txt +0 -0
  15. {SinaTools-0.1.21 → SinaTools-0.1.23}/SinaTools.egg-info/not-zip-safe +0 -0
  16. {SinaTools-0.1.21 → SinaTools-0.1.23}/SinaTools.egg-info/requires.txt +0 -0
  17. {SinaTools-0.1.21 → SinaTools-0.1.23}/SinaTools.egg-info/top_level.txt +0 -0
  18. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/Makefile +0 -0
  19. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/_images/download.png +0 -0
  20. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/_static/download.png +0 -0
  21. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/_static/file.png +0 -0
  22. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/_static/minus.png +0 -0
  23. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/_static/plus.png +0 -0
  24. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/html/_images/SinaLogo.jpg +0 -0
  25. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/html/_images/download.png +0 -0
  26. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/html/_static/SinaLogo.jpg +0 -0
  27. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/html/_static/download.png +0 -0
  28. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/html/_static/file.png +0 -0
  29. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/html/_static/minus.png +0 -0
  30. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/build/html/_static/plus.png +0 -0
  31. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/make.bat +0 -0
  32. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/License.rst +0 -0
  33. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/Overview.rst +0 -0
  34. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/_static/SinaLogo.jpg +0 -0
  35. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/_static/download.png +0 -0
  36. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/about.rst +0 -0
  37. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/DataDownload/downloader.rst +0 -0
  38. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/DataDownload.rst +0 -0
  39. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/arabiner/bin/infer.rst +0 -0
  40. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/arabiner.rst +0 -0
  41. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/morphology/morph_analyzer.rst +0 -0
  42. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/morphology.rst +0 -0
  43. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/salma/views.rst +0 -0
  44. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/salma.rst +0 -0
  45. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/utils/corpus_tokenizer.rst +0 -0
  46. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/utils/implication.rst +0 -0
  47. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/utils/jaccard.rst +0 -0
  48. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/utils/parser.rst +0 -0
  49. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/utils/sentence_tokenizer.rst +0 -0
  50. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/utils/text_transliteration.rst +0 -0
  51. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api/utils.rst +0 -0
  52. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/api.rst +0 -0
  53. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/authors.rst +0 -0
  54. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/DataDownload/download_files.rst +0 -0
  55. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/DataDownload/get_appdatadir.rst +0 -0
  56. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/DataDownload.rst +0 -0
  57. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/arabiner/infer.rst +0 -0
  58. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/arabiner.rst +0 -0
  59. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/morphology/ALMA_multi_word.rst +0 -0
  60. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/morphology/morph_analyzer.rst +0 -0
  61. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/morphology.rst +0 -0
  62. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/salma/salma_tools.rst +0 -0
  63. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/salma.rst +0 -0
  64. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/utils/arStrip.rst +0 -0
  65. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/utils/corpus_tokenizer.rst +0 -0
  66. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/utils/implication.rst +0 -0
  67. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/utils/jaccard.rst +0 -0
  68. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/utils/latin_remove.rst +0 -0
  69. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/utils/remove_punc.rst +0 -0
  70. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/utils/sentence_tokenizer.rst +0 -0
  71. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/utils/text_transliteration.rst +0 -0
  72. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools/utils.rst +0 -0
  73. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/cli_tools.rst +0 -0
  74. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/conf.py +0 -0
  75. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/index.rst +0 -0
  76. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/installation.rst +0 -0
  77. {SinaTools-0.1.21 → SinaTools-0.1.23}/docs/source/readme.rst +0 -0
  78. {SinaTools-0.1.21 → SinaTools-0.1.23}/setup.cfg +0 -0
  79. {SinaTools-0.1.21 → SinaTools-0.1.23}/setup.py +0 -0
  80. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/morphology/ALMA_multi_word.py +0 -0
  81. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/morphology/morph_analyzer.py +0 -0
  82. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/ner/corpus_entity_extractor.py +0 -0
  83. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/ner/entity_extractor.py +0 -0
  84. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/utils/__init__.py +0 -0
  85. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/utils/arStrip.py +0 -0
  86. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/utils/corpus_tokenizer.py +0 -0
  87. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/utils/implication.py +0 -0
  88. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/utils/jaccard.py +0 -0
  89. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/utils/remove_latin.py +0 -0
  90. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/utils/remove_punctuation.py +0 -0
  91. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/utils/sentence_tokenizer.py +0 -0
  92. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/utils/text_dublication_detector.py +0 -0
  93. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/CLI/utils/text_transliteration.py +0 -0
  94. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/DataDownload/__init__.py +0 -0
  95. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/__init__.py +0 -0
  96. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/__init__.py +0 -0
  97. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/__init__.py +0 -0
  98. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/create_classification_data.py +0 -0
  99. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/create_pretraining_data.py +0 -0
  100. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/extract_features.py +0 -0
  101. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/lamb_optimizer.py +0 -0
  102. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/modeling.py +0 -0
  103. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/optimization.py +0 -0
  104. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/run_classifier.py +0 -0
  105. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/run_pretraining.py +0 -0
  106. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/run_squad.py +0 -0
  107. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/arabert/tokenization.py +0 -0
  108. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/__init__.py +0 -0
  109. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/build_openwebtext_pretraining_dataset.py +0 -0
  110. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/build_pretraining_dataset.py +0 -0
  111. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/build_pretraining_dataset_single_file.py +0 -0
  112. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/configure_finetuning.py +0 -0
  113. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/configure_pretraining.py +0 -0
  114. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/finetune/__init__.py +0 -0
  115. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/finetune/feature_spec.py +0 -0
  116. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/finetune/preprocessing.py +0 -0
  117. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/finetune/scorer.py +0 -0
  118. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/finetune/task.py +0 -0
  119. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/finetune/task_builder.py +0 -0
  120. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/flops_computation.py +0 -0
  121. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/model/__init__.py +0 -0
  122. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/model/modeling.py +0 -0
  123. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/model/optimization.py +0 -0
  124. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/model/tokenization.py +0 -0
  125. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/pretrain/__init__.py +0 -0
  126. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/pretrain/pretrain_data.py +0 -0
  127. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/pretrain/pretrain_helpers.py +0 -0
  128. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/run_finetuning.py +0 -0
  129. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/run_pretraining.py +0 -0
  130. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/util/__init__.py +0 -0
  131. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/util/training_utils.py +0 -0
  132. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/araelectra/util/utils.py +0 -0
  133. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/__init__.py +0 -0
  134. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/create_pretraining_data.py +0 -0
  135. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/gpt2/__init__.py +0 -0
  136. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/gpt2/lamb_optimizer.py +0 -0
  137. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/gpt2/optimization.py +0 -0
  138. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/gpt2/run_pretraining.py +0 -0
  139. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/grover/__init__.py +0 -0
  140. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/grover/dataloader.py +0 -0
  141. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/grover/modeling.py +0 -0
  142. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/grover/modeling_gpt2.py +0 -0
  143. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/grover/optimization_adafactor.py +0 -0
  144. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/grover/train_tpu.py +0 -0
  145. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/grover/utils.py +0 -0
  146. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/aragpt2/train_bpe_tokenizer.py +0 -0
  147. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/arabert/preprocess.py +0 -0
  148. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/environment.yml +0 -0
  149. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/install_env.py +0 -0
  150. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/morphology/ALMA_multi_word.py +0 -0
  151. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/morphology/__init__.py +0 -0
  152. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/morphology/morph_analyzer.py +0 -0
  153. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/__init__.py +0 -0
  154. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/data/__init__.py +0 -0
  155. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/data/datasets.py +0 -0
  156. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/data/transforms.py +0 -0
  157. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/data_format.py +0 -0
  158. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/datasets.py +0 -0
  159. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/entity_extractor.py +0 -0
  160. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/helpers.py +0 -0
  161. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/metrics.py +0 -0
  162. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/nn/BaseModel.py +0 -0
  163. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/nn/BertNestedTagger.py +0 -0
  164. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/nn/BertSeqTagger.py +0 -0
  165. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/nn/__init__.py +0 -0
  166. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/trainers/BaseTrainer.py +0 -0
  167. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/trainers/BertNestedTrainer.py +0 -0
  168. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/trainers/BertTrainer.py +0 -0
  169. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/trainers/__init__.py +0 -0
  170. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/ner/transforms.py +0 -0
  171. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/semantic_relatedness/__init__.py +0 -0
  172. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/semantic_relatedness/compute_relatedness.py +0 -0
  173. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/sinatools.py +0 -0
  174. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/synonyms/__init__.py +0 -0
  175. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/synonyms/synonyms_generator.py +0 -0
  176. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/utils/__init__.py +0 -0
  177. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/utils/charsets.py +0 -0
  178. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/utils/implication.py +0 -0
  179. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/utils/jaccard.py +0 -0
  180. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/utils/parser.py +0 -0
  181. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/utils/readfile.py +0 -0
  182. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/utils/text_dublication_detector.py +0 -0
  183. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/utils/text_transliteration.py +0 -0
  184. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/utils/tokenizer.py +0 -0
  185. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/utils/tokenizers_words.py +0 -0
  186. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/wsd/__init__.py +0 -0
  187. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/wsd/disambiguator.py +0 -0
  188. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/wsd/settings.py +0 -0
  189. {SinaTools-0.1.21 → SinaTools-0.1.23}/sinatools/wsd/wsd.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: SinaTools
3
- Version: 0.1.21
3
+ Version: 0.1.23
4
4
  Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
5
5
  Home-page: https://github.com/SinaLab/sinatools
6
6
  License: MIT license
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: SinaTools
3
- Version: 0.1.21
3
+ Version: 0.1.23
4
4
  Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
5
5
  Home-page: https://github.com/SinaLab/sinatools
6
6
  License: MIT license
@@ -2,7 +2,7 @@
2
2
  About:
3
3
  ------
4
4
 
5
- The download_files tool is a command-line interface for downloading various NLP resources from pre-specified URLs. It is a part of the sinatools package and provides options to choose which files to download and to specify a download directory. The tool automatically handles file extraction for zip and tar.gz files.
5
+ The download_files is a command-line interface for downloading various NLP resources from pre-specified URLs. It is a part of the sinatools package and provides options to choose which files to download and to specify a download directory. The tool automatically handles file extraction for zip and tar.gz files.
6
6
 
7
7
  Usage:
8
8
  ------
@@ -18,7 +18,7 @@ Below is the usage information that can be generated by running download_files -
18
18
 
19
19
  Options:
20
20
  -f, --files FILES
21
- Names of the files to download. Available files are: ner, morph, salma_model, salma_tokenizer, glosses_dic, lemma_dic, five_grams, four_grams, three_grams, two_grams.
21
+ Names of the files to download. Available files are: ner, morph, wsd_model, wsd_tokenizer, glosses_dic, five_grams, four_grams, three_grams, two_grams, synonyms_level2, synonyms_level3.
22
22
  If no file is specified, all files will be downloaded.
23
23
 
24
24
  Examples:
@@ -6,16 +6,17 @@ import zipfile
6
6
  from tqdm import tqdm
7
7
  import tarfile
8
8
  urls = {
9
- 'morph': 'https://portal.sina.birzeit.edu/ALMA27012000.pickle',
9
+ 'morph': 'https://sina.birzeit.edu/lemmas_dic.pickle',
10
10
  'ner': 'https://portal.sina.birzeit.edu/Wj27012000.tar.gz',
11
- 'salma_model': 'https://portal.sina.birzeit.edu/bert-base-arabertv02_22_May_2021_00h_allglosses_unused01.zip',
12
- 'salma_tokenizer': 'https://portal.sina.birzeit.edu/bert-base-arabertv02.zip',
11
+ 'wsd_model': 'https://portal.sina.birzeit.edu/bert-base-arabertv02_22_May_2021_00h_allglosses_unused01.zip',
12
+ 'wsd_tokenizer': 'https://portal.sina.birzeit.edu/bert-base-arabertv02.zip',
13
13
  'glosses_dic': 'https://portal.sina.birzeit.edu/glosses_dic.pickle',
14
- 'lemma_dic': 'https://portal.sina.birzeit.edu/lemmas_dic.pickle',
15
14
  'five_grams': 'https://portal.sina.birzeit.edu/five_grams.pickle',
16
15
  'four_grams':'https://portal.sina.birzeit.edu/four_grams.pickle',
17
16
  'three_grams':'https://portal.sina.birzeit.edu/three_grams.pickle',
18
- 'two_grams':'https://portal.sina.birzeit.edu/two_grams.pickle'
17
+ 'two_grams':'https://portal.sina.birzeit.edu/two_grams.pickle',
18
+ 'synonyms_level2':'https://portal.sina.birzeit.edu/synonyms_level2.pkl',
19
+ 'synonyms_level3':'https://portal.sina.birzeit.edu/synonyms_level3.pkl'
19
20
  }
20
21
 
21
22
  def get_appdatadir():
@@ -94,41 +95,37 @@ def download_file(url, dest_path=get_appdatadir()):
94
95
  print(filename)
95
96
  headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.3029.110 Safari/537.3'}
96
97
 
97
- try:
98
- with requests.get(url, headers=headers, stream=True) as r:
99
- r.raise_for_status()
100
- with open(file_path, 'wb') as f:
101
- total_size = int(r.headers.get('content-length', 0))
102
- block_size = 8192
103
- progress_bar = tqdm(total=total_size, unit='iB', unit_scale=True)
104
- for chunk in r.iter_content(chunk_size=block_size):
105
- if chunk:
106
- f.write(chunk)
107
- progress_bar.update(len(chunk))
108
- progress_bar.close()
109
-
110
- # Check the file type and extract accordingly
111
- file_extension = os.path.splitext(file_path)[1]
112
- extracted_folder_name = os.path.splitext(file_path)[0]
113
-
114
- if file_extension == '.zip':
115
- extract_zip(file_path, extracted_folder_name)
116
- elif file_extension == '.gz':
117
-
118
- extract_tar(file_path, extracted_folder_name)
119
- elif file_extension =='.pickle':
120
- print(f'Done: {file_extension}')
121
-
122
- else:
123
- print(f'Unsupported file type for extraction: {file_extension}')
124
-
125
- return file_path
126
-
127
- except requests.exceptions.HTTPError as e:
128
- if e.response.status_code == 403:
129
- print(f'Error 403: Forbidden. The requested file URL {url} could not be downloaded due to insufficient permissions. Please check the URL and try again.')
130
- else:
131
- print('An error occurred while downloading the file:', e)
98
+ # try:
99
+ with requests.get(url, headers=headers, stream=True) as r:
100
+ r.raise_for_status()
101
+ with open(file_path, 'wb') as f:
102
+ total_size = int(r.headers.get('content-length', 0))
103
+ block_size = 8192
104
+ progress_bar = tqdm(total=total_size, unit='iB', unit_scale=True)
105
+ for chunk in r.iter_content(chunk_size=block_size):
106
+ if chunk:
107
+ f.write(chunk)
108
+ progress_bar.update(len(chunk))
109
+ progress_bar.close()
110
+ # Check the file type and extract accordingly
111
+ file_extension = os.path.splitext(file_path)[1]
112
+ extracted_folder_name = os.path.splitext(file_path)[0]
113
+
114
+ if file_extension == '.zip':
115
+ extract_zip(file_path, extracted_folder_name)
116
+ elif file_extension == '.gz':
117
+ extract_tar(file_path, extracted_folder_name)
118
+ elif file_extension =='.pickle':
119
+ print(f'Done: {file_extension}')
120
+ else:
121
+ print(f'Unsupported file type for extraction: {file_extension}')
122
+ return file_path
123
+
124
+ # except requests.exceptions.HTTPError as e:
125
+ # if e.response.status_code == 403:
126
+ # print(f'Error 403: Forbidden. The requested file URL {url} could not be downloaded due to insufficient permissions. Please check the URL and try again.')
127
+ # else:
128
+ # print('An error occurred while downloading the file:', e)
132
129
 
133
130
  def extract_zip(file_path, extracted_folder_name):
134
131
  """
@@ -0,0 +1 @@
1
+ 0.1.23
@@ -1 +0,0 @@
1
- 0.1.21
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes