SinaTools 0.1.32__tar.gz → 0.1.34__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (191)
  1. {SinaTools-0.1.32 → SinaTools-0.1.34}/PKG-INFO +1 -1
  2. {SinaTools-0.1.32 → SinaTools-0.1.34}/SinaTools.egg-info/PKG-INFO +1 -1
  3. {SinaTools-0.1.32 → SinaTools-0.1.34}/SinaTools.egg-info/entry_points.txt +1 -0
  4. {SinaTools-0.1.32 → SinaTools-0.1.34}/setup.py +3 -1
  5. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/DataDownload/download_files.py +5 -2
  6. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/DataDownload/downloader.py +34 -3
  7. SinaTools-0.1.34/sinatools/VERSION +1 -0
  8. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/morphology/morph_analyzer.py +1 -1
  9. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/relations/relation_extractor.py +2 -2
  10. SinaTools-0.1.32/sinatools/VERSION +0 -1
  11. {SinaTools-0.1.32 → SinaTools-0.1.34}/AUTHORS.rst +0 -0
  12. {SinaTools-0.1.32 → SinaTools-0.1.34}/CONTRIBUTING.rst +0 -0
  13. {SinaTools-0.1.32 → SinaTools-0.1.34}/LICENSE +0 -0
  14. {SinaTools-0.1.32 → SinaTools-0.1.34}/MANIFEST.in +0 -0
  15. {SinaTools-0.1.32 → SinaTools-0.1.34}/README.rst +0 -0
  16. {SinaTools-0.1.32 → SinaTools-0.1.34}/SinaTools.egg-info/SOURCES.txt +0 -0
  17. {SinaTools-0.1.32 → SinaTools-0.1.34}/SinaTools.egg-info/dependency_links.txt +0 -0
  18. {SinaTools-0.1.32 → SinaTools-0.1.34}/SinaTools.egg-info/not-zip-safe +0 -0
  19. {SinaTools-0.1.32 → SinaTools-0.1.34}/SinaTools.egg-info/requires.txt +0 -0
  20. {SinaTools-0.1.32 → SinaTools-0.1.34}/SinaTools.egg-info/top_level.txt +0 -0
  21. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/Makefile +0 -0
  22. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/_images/download.png +0 -0
  23. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/_static/download.png +0 -0
  24. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/_static/file.png +0 -0
  25. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/_static/minus.png +0 -0
  26. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/_static/plus.png +0 -0
  27. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/html/_images/SinaLogo.jpg +0 -0
  28. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/html/_images/download.png +0 -0
  29. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/html/_static/SinaLogo.jpg +0 -0
  30. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/html/_static/download.png +0 -0
  31. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/html/_static/file.png +0 -0
  32. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/html/_static/minus.png +0 -0
  33. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/build/html/_static/plus.png +0 -0
  34. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/make.bat +0 -0
  35. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/License.rst +0 -0
  36. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/Overview.rst +0 -0
  37. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/_static/SinaLogo.jpg +0 -0
  38. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/_static/download.png +0 -0
  39. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/about.rst +0 -0
  40. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/DataDownload/downloader.rst +0 -0
  41. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/DataDownload.rst +0 -0
  42. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/arabiner/bin/infer.rst +0 -0
  43. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/arabiner.rst +0 -0
  44. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/morphology/morph_analyzer.rst +0 -0
  45. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/morphology.rst +0 -0
  46. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/salma/views.rst +0 -0
  47. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/salma.rst +0 -0
  48. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/utils/corpus_tokenizer.rst +0 -0
  49. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/utils/implication.rst +0 -0
  50. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/utils/jaccard.rst +0 -0
  51. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/utils/parser.rst +0 -0
  52. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/utils/sentence_tokenizer.rst +0 -0
  53. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/utils/text_transliteration.rst +0 -0
  54. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api/utils.rst +0 -0
  55. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/api.rst +0 -0
  56. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/authors.rst +0 -0
  57. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/DataDownload/download_files.rst +0 -0
  58. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/DataDownload/get_appdatadir.rst +0 -0
  59. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/DataDownload.rst +0 -0
  60. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/arabiner/infer.rst +0 -0
  61. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/arabiner.rst +0 -0
  62. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/morphology/ALMA_multi_word.rst +0 -0
  63. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/morphology/morph_analyzer.rst +0 -0
  64. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/morphology.rst +0 -0
  65. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/salma/salma_tools.rst +0 -0
  66. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/salma.rst +0 -0
  67. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/utils/arStrip.rst +0 -0
  68. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/utils/corpus_tokenizer.rst +0 -0
  69. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/utils/implication.rst +0 -0
  70. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/utils/jaccard.rst +0 -0
  71. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/utils/latin_remove.rst +0 -0
  72. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/utils/remove_punc.rst +0 -0
  73. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/utils/sentence_tokenizer.rst +0 -0
  74. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/utils/text_transliteration.rst +0 -0
  75. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools/utils.rst +0 -0
  76. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/cli_tools.rst +0 -0
  77. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/conf.py +0 -0
  78. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/index.rst +0 -0
  79. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/installation.rst +0 -0
  80. {SinaTools-0.1.32 → SinaTools-0.1.34}/docs/source/readme.rst +0 -0
  81. {SinaTools-0.1.32 → SinaTools-0.1.34}/setup.cfg +0 -0
  82. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/morphology/ALMA_multi_word.py +0 -0
  83. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/morphology/morph_analyzer.py +0 -0
  84. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/ner/corpus_entity_extractor.py +0 -0
  85. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/ner/entity_extractor.py +0 -0
  86. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/utils/__init__.py +0 -0
  87. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/utils/arStrip.py +0 -0
  88. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/utils/corpus_tokenizer.py +0 -0
  89. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/utils/implication.py +0 -0
  90. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/utils/jaccard.py +0 -0
  91. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/utils/remove_latin.py +0 -0
  92. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/utils/remove_punctuation.py +0 -0
  93. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/utils/sentence_tokenizer.py +0 -0
  94. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/utils/text_dublication_detector.py +0 -0
  95. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/CLI/utils/text_transliteration.py +0 -0
  96. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/DataDownload/__init__.py +0 -0
  97. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/__init__.py +0 -0
  98. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/__init__.py +0 -0
  99. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/__init__.py +0 -0
  100. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/create_classification_data.py +0 -0
  101. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/create_pretraining_data.py +0 -0
  102. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/extract_features.py +0 -0
  103. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/lamb_optimizer.py +0 -0
  104. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/modeling.py +0 -0
  105. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/optimization.py +0 -0
  106. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/run_classifier.py +0 -0
  107. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/run_pretraining.py +0 -0
  108. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/run_squad.py +0 -0
  109. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/arabert/tokenization.py +0 -0
  110. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/__init__.py +0 -0
  111. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/build_openwebtext_pretraining_dataset.py +0 -0
  112. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/build_pretraining_dataset.py +0 -0
  113. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/build_pretraining_dataset_single_file.py +0 -0
  114. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/configure_finetuning.py +0 -0
  115. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/configure_pretraining.py +0 -0
  116. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/finetune/__init__.py +0 -0
  117. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/finetune/feature_spec.py +0 -0
  118. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/finetune/preprocessing.py +0 -0
  119. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/finetune/scorer.py +0 -0
  120. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/finetune/task.py +0 -0
  121. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/finetune/task_builder.py +0 -0
  122. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/flops_computation.py +0 -0
  123. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/model/__init__.py +0 -0
  124. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/model/modeling.py +0 -0
  125. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/model/optimization.py +0 -0
  126. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/model/tokenization.py +0 -0
  127. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/pretrain/__init__.py +0 -0
  128. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/pretrain/pretrain_data.py +0 -0
  129. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/pretrain/pretrain_helpers.py +0 -0
  130. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/run_finetuning.py +0 -0
  131. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/run_pretraining.py +0 -0
  132. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/util/__init__.py +0 -0
  133. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/util/training_utils.py +0 -0
  134. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/araelectra/util/utils.py +0 -0
  135. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/__init__.py +0 -0
  136. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/create_pretraining_data.py +0 -0
  137. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/gpt2/__init__.py +0 -0
  138. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/gpt2/lamb_optimizer.py +0 -0
  139. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/gpt2/optimization.py +0 -0
  140. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/gpt2/run_pretraining.py +0 -0
  141. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/grover/__init__.py +0 -0
  142. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/grover/dataloader.py +0 -0
  143. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/grover/modeling.py +0 -0
  144. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/grover/modeling_gpt2.py +0 -0
  145. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/grover/optimization_adafactor.py +0 -0
  146. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/grover/train_tpu.py +0 -0
  147. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/grover/utils.py +0 -0
  148. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/aragpt2/train_bpe_tokenizer.py +0 -0
  149. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/arabert/preprocess.py +0 -0
  150. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/environment.yml +0 -0
  151. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/install_env.py +0 -0
  152. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/morphology/ALMA_multi_word.py +0 -0
  153. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/morphology/__init__.py +0 -0
  154. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/__init__.py +0 -0
  155. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/data/__init__.py +0 -0
  156. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/data/datasets.py +0 -0
  157. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/data/transforms.py +0 -0
  158. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/data_format.py +0 -0
  159. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/datasets.py +0 -0
  160. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/entity_extractor.py +0 -0
  161. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/helpers.py +0 -0
  162. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/metrics.py +0 -0
  163. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/nn/BaseModel.py +0 -0
  164. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/nn/BertNestedTagger.py +0 -0
  165. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/nn/BertSeqTagger.py +0 -0
  166. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/nn/__init__.py +0 -0
  167. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/trainers/BaseTrainer.py +0 -0
  168. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/trainers/BertNestedTrainer.py +0 -0
  169. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/trainers/BertTrainer.py +0 -0
  170. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/trainers/__init__.py +0 -0
  171. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/ner/transforms.py +0 -0
  172. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/relations/__init__.py +0 -0
  173. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/semantic_relatedness/__init__.py +0 -0
  174. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/semantic_relatedness/compute_relatedness.py +0 -0
  175. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/sinatools.py +0 -0
  176. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/synonyms/__init__.py +0 -0
  177. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/synonyms/synonyms_generator.py +0 -0
  178. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/utils/__init__.py +0 -0
  179. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/utils/charsets.py +0 -0
  180. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/utils/parser.py +0 -0
  181. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/utils/readfile.py +0 -0
  182. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/utils/similarity.py +0 -0
  183. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/utils/text_dublication_detector.py +0 -0
  184. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/utils/text_transliteration.py +0 -0
  185. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/utils/tokenizer.py +0 -0
  186. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/utils/tokenizers_words.py +0 -0
  187. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/utils/word_compare.py +0 -0
  188. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/wsd/__init__.py +0 -0
  189. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/wsd/disambiguator.py +0 -0
  190. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/wsd/settings.py +0 -0
  191. {SinaTools-0.1.32 → SinaTools-0.1.34}/sinatools/wsd/wsd.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: SinaTools
3
- Version: 0.1.32
3
+ Version: 0.1.34
4
4
  Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
5
5
  Home-page: https://github.com/SinaLab/sinatools
6
6
  License: MIT license
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: SinaTools
3
- Version: 0.1.32
3
+ Version: 0.1.34
4
4
  Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
5
5
  Home-page: https://github.com/SinaLab/sinatools
6
6
  License: MIT license
@@ -12,6 +12,7 @@ implication = sinatools.CLI.utils.implication:main
12
12
  install_env = sinatools.install_env:main
13
13
  jaccard_similarity = sinatools.CLI.utils.jaccard:main
14
14
  morphology_analyzer = sinatools.CLI.morphology.morph_analyzer:main
15
+ relation_extractor = sinatools.CLI.relations.relation_extractor:main
15
16
  remove_latin = sinatools.CLI.utils.remove_latin:main
16
17
  remove_punctuation = sinatools.CLI.utils.remove_punctuation:main
17
18
  semantic_relatedness = sinatools.CLI.semantic_relatedness.compute_relatedness:main
@@ -78,7 +78,9 @@ setup(
78
78
  ('extend_synonyms='
79
79
  'sinatools.CLI.synonyms.extend_synonyms:main'),
80
80
  ('semantic_relatedness='
81
- 'sinatools.CLI.semantic_relatedness.compute_relatedness:main'),
81
+ 'sinatools.CLI.semantic_relatedness.compute_relatedness:main'),
82
+ ('relation_extractor='
83
+ 'sinatools.CLI.relations.relation_extractor:main'),
82
84
  ],
83
85
  },
84
86
  data_files=[('sinatools', ['sinatools/environment.yml'])],
@@ -34,6 +34,7 @@ import argparse
34
34
  from sinatools.DataDownload.downloader import download_file
35
35
  from sinatools.DataDownload.downloader import download_files
36
36
  from sinatools.DataDownload.downloader import get_appdatadir
37
+ from sinatools.DataDownload.downloader import download_folder_from_hf
37
38
  from sinatools.DataDownload.downloader import urls
38
39
 
39
40
 
@@ -53,8 +54,10 @@ def main():
53
54
  if file == "wsd":
54
55
  download_file(urls["morph"])
55
56
  download_file(urls["ner"])
56
- download_file(urls["wsd_model"])
57
- download_file(urls["wsd_tokenizer"])
57
+ #download_file(urls["wsd_model"])
58
+ #download_file(urls["wsd_tokenizer"])
59
+ download_folder_from_hf("SinaLab/ArabGlossBERT", "bert-base-arabertv02_22_May_2021_00h_allglosses_unused01")
60
+ download_folder_from_hf("SinaLab/ArabGlossBERT", "bert-base-arabertv02")
58
61
  download_file(urls["one_gram"])
59
62
  download_file(urls["five_grams"])
60
63
  download_file(urls["four_grams"])
@@ -8,8 +8,8 @@ import tarfile
8
8
  urls = {
9
9
  'morph': 'https://sina.birzeit.edu/lemmas_dic.pickle',
10
10
  'ner': 'https://sina.birzeit.edu/Wj27012000.tar.gz',
11
- 'wsd_model': 'https://sina.birzeit.edu/bert-base-arabertv02_22_May_2021_00h_allglosses_unused01.zip',
12
- 'wsd_tokenizer': 'https://sina.birzeit.edu/bert-base-arabertv02.zip',
11
+ # 'wsd_model': 'https://sina.birzeit.edu/bert-base-arabertv02_22_May_2021_00h_allglosses_unused01.zip',
12
+ # 'wsd_tokenizer': 'https://sina.birzeit.edu/bert-base-arabertv02.zip',
13
13
  'one_gram': 'https://sina.birzeit.edu/one_gram.pickle',
14
14
  'five_grams': 'https://sina.birzeit.edu/five_grams.pickle',
15
15
  'four_grams':'https://sina.birzeit.edu/four_grams.pickle',
@@ -184,4 +184,35 @@ def download_files():
184
184
  None
185
185
  """
186
186
  for url in urls.values():
187
- download_file(url)
187
+ download_file(url)
188
+
189
+
190
+ def download_folder_from_hf(repo_url, folder_name):
191
+
192
+ # Hugging Face API to fetch files from the repository
193
+ api_url = f"https://huggingface.co/api/models/{repo_url}/tree/main/{folder_name}"
194
+
195
+ # Make the request to get the folder structure
196
+ response = requests.get(api_url)
197
+ if response.status_code != 200:
198
+ print(f"Failed to fetch folder contents. Status code: {response.status_code}")
199
+ return
200
+
201
+ folder_content = response.json()
202
+
203
+ # Download each file in the folder
204
+ for file_info in folder_content:
205
+ file_name = file_info["path"]
206
+ file_url = f"https://huggingface.co/{repo_url}/resolve/main/{file_name}"
207
+
208
+ # Download the file and save it to the output directory
209
+ file_response = requests.get(file_url)
210
+ if file_response.status_code == 200:
211
+ # Create any necessary directories
212
+ output_file_path = os.path.join(get_appdatadir(), file_name)
213
+ os.makedirs(os.path.dirname(output_file_path), exist_ok=True)
214
+ with open(output_file_path, 'wb') as f:
215
+ f.write(file_response.content)
216
+ print(f"Downloaded: {file_name}")
217
+ else:
218
+ print(f"Failed to download {file_name}. Status code: {file_response.status_code}")
@@ -0,0 +1 @@
1
+ 0.1.34
@@ -16,7 +16,7 @@ def find_solution(token, language, flag):
16
16
  solutions = [solutions[0]]
17
17
  for solution in solutions:
18
18
  # token, freq, lemma, lemma_id, root, pos
19
- resulted_solutions.append([token, solution[0], solution[1], solution[2], solution[3], solution[4]])
19
+ resulted_solutions.append([token, solution[1], solution[2], solution[3], solution[4], solution[5]])
20
20
  return resulted_solutions
21
21
  else:
22
22
  return []
@@ -193,7 +193,7 @@ def event_argument_relation_extraction(documnet):
193
193
  score = predicted_relation[0][0]['score']
194
194
  if score > 0.50:
195
195
  triple_id+=1
196
- relation={"TripleID":triple_id,"Subject":{"ID":entity_identifier[event_entity],"Type": entities[event_entity], "Label":event_entity}, "Relation": category, "Object":{"ID":entity_identifier[arg_name],"Type": entities[arg_name], "Label":arg_name,}}
196
+ relation={"TripleID":triple_id,"Subject":{"ID":entity_identifier[event_entity],"Type": entities[event_entity], "Label":event_entity}, "Relation": category, "Object":{"ID":entity_identifier[arg_name],"Type": entities[arg_name], "Label":arg_name,},"confidence": f"{score: .2f}"}
197
197
  output_list.append(relation)
198
198
 
199
- return output_list
199
+ return output_list
@@ -1 +0,0 @@
1
- 0.1.32
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes