SinaTools 0.1.29__tar.gz → 0.1.30__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (190)
  1. {SinaTools-0.1.29 → SinaTools-0.1.30}/PKG-INFO +1 -1
  2. {SinaTools-0.1.29 → SinaTools-0.1.30}/SinaTools.egg-info/PKG-INFO +1 -1
  3. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/DataDownload/downloader.py +2 -1
  4. SinaTools-0.1.30/sinatools/VERSION +1 -0
  5. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/morphology/morph_analyzer.py +7 -3
  6. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/__init__.py +1 -2
  7. SinaTools-0.1.29/sinatools/VERSION +0 -1
  8. {SinaTools-0.1.29 → SinaTools-0.1.30}/AUTHORS.rst +0 -0
  9. {SinaTools-0.1.29 → SinaTools-0.1.30}/CONTRIBUTING.rst +0 -0
  10. {SinaTools-0.1.29 → SinaTools-0.1.30}/LICENSE +0 -0
  11. {SinaTools-0.1.29 → SinaTools-0.1.30}/MANIFEST.in +0 -0
  12. {SinaTools-0.1.29 → SinaTools-0.1.30}/README.rst +0 -0
  13. {SinaTools-0.1.29 → SinaTools-0.1.30}/SinaTools.egg-info/SOURCES.txt +0 -0
  14. {SinaTools-0.1.29 → SinaTools-0.1.30}/SinaTools.egg-info/dependency_links.txt +0 -0
  15. {SinaTools-0.1.29 → SinaTools-0.1.30}/SinaTools.egg-info/entry_points.txt +0 -0
  16. {SinaTools-0.1.29 → SinaTools-0.1.30}/SinaTools.egg-info/not-zip-safe +0 -0
  17. {SinaTools-0.1.29 → SinaTools-0.1.30}/SinaTools.egg-info/requires.txt +0 -0
  18. {SinaTools-0.1.29 → SinaTools-0.1.30}/SinaTools.egg-info/top_level.txt +0 -0
  19. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/Makefile +0 -0
  20. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/_images/download.png +0 -0
  21. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/_static/download.png +0 -0
  22. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/_static/file.png +0 -0
  23. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/_static/minus.png +0 -0
  24. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/_static/plus.png +0 -0
  25. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/html/_images/SinaLogo.jpg +0 -0
  26. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/html/_images/download.png +0 -0
  27. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/html/_static/SinaLogo.jpg +0 -0
  28. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/html/_static/download.png +0 -0
  29. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/html/_static/file.png +0 -0
  30. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/html/_static/minus.png +0 -0
  31. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/build/html/_static/plus.png +0 -0
  32. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/make.bat +0 -0
  33. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/License.rst +0 -0
  34. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/Overview.rst +0 -0
  35. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/_static/SinaLogo.jpg +0 -0
  36. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/_static/download.png +0 -0
  37. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/about.rst +0 -0
  38. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/DataDownload/downloader.rst +0 -0
  39. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/DataDownload.rst +0 -0
  40. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/arabiner/bin/infer.rst +0 -0
  41. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/arabiner.rst +0 -0
  42. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/morphology/morph_analyzer.rst +0 -0
  43. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/morphology.rst +0 -0
  44. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/salma/views.rst +0 -0
  45. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/salma.rst +0 -0
  46. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/utils/corpus_tokenizer.rst +0 -0
  47. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/utils/implication.rst +0 -0
  48. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/utils/jaccard.rst +0 -0
  49. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/utils/parser.rst +0 -0
  50. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/utils/sentence_tokenizer.rst +0 -0
  51. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/utils/text_transliteration.rst +0 -0
  52. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api/utils.rst +0 -0
  53. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/api.rst +0 -0
  54. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/authors.rst +0 -0
  55. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/DataDownload/download_files.rst +0 -0
  56. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/DataDownload/get_appdatadir.rst +0 -0
  57. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/DataDownload.rst +0 -0
  58. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/arabiner/infer.rst +0 -0
  59. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/arabiner.rst +0 -0
  60. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/morphology/ALMA_multi_word.rst +0 -0
  61. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/morphology/morph_analyzer.rst +0 -0
  62. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/morphology.rst +0 -0
  63. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/salma/salma_tools.rst +0 -0
  64. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/salma.rst +0 -0
  65. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/utils/arStrip.rst +0 -0
  66. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/utils/corpus_tokenizer.rst +0 -0
  67. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/utils/implication.rst +0 -0
  68. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/utils/jaccard.rst +0 -0
  69. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/utils/latin_remove.rst +0 -0
  70. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/utils/remove_punc.rst +0 -0
  71. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/utils/sentence_tokenizer.rst +0 -0
  72. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/utils/text_transliteration.rst +0 -0
  73. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools/utils.rst +0 -0
  74. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/cli_tools.rst +0 -0
  75. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/conf.py +0 -0
  76. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/index.rst +0 -0
  77. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/installation.rst +0 -0
  78. {SinaTools-0.1.29 → SinaTools-0.1.30}/docs/source/readme.rst +0 -0
  79. {SinaTools-0.1.29 → SinaTools-0.1.30}/setup.cfg +0 -0
  80. {SinaTools-0.1.29 → SinaTools-0.1.30}/setup.py +0 -0
  81. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/DataDownload/download_files.py +0 -0
  82. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/morphology/ALMA_multi_word.py +0 -0
  83. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/morphology/morph_analyzer.py +0 -0
  84. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/ner/corpus_entity_extractor.py +0 -0
  85. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/ner/entity_extractor.py +0 -0
  86. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/utils/__init__.py +0 -0
  87. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/utils/arStrip.py +0 -0
  88. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/utils/corpus_tokenizer.py +0 -0
  89. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/utils/implication.py +0 -0
  90. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/utils/jaccard.py +0 -0
  91. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/utils/remove_latin.py +0 -0
  92. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/utils/remove_punctuation.py +0 -0
  93. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/utils/sentence_tokenizer.py +0 -0
  94. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/utils/text_dublication_detector.py +0 -0
  95. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/CLI/utils/text_transliteration.py +0 -0
  96. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/DataDownload/__init__.py +0 -0
  97. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/__init__.py +0 -0
  98. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/__init__.py +0 -0
  99. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/__init__.py +0 -0
  100. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/create_classification_data.py +0 -0
  101. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/create_pretraining_data.py +0 -0
  102. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/extract_features.py +0 -0
  103. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/lamb_optimizer.py +0 -0
  104. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/modeling.py +0 -0
  105. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/optimization.py +0 -0
  106. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/run_classifier.py +0 -0
  107. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/run_pretraining.py +0 -0
  108. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/run_squad.py +0 -0
  109. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/arabert/tokenization.py +0 -0
  110. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/__init__.py +0 -0
  111. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/build_openwebtext_pretraining_dataset.py +0 -0
  112. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/build_pretraining_dataset.py +0 -0
  113. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/build_pretraining_dataset_single_file.py +0 -0
  114. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/configure_finetuning.py +0 -0
  115. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/configure_pretraining.py +0 -0
  116. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/finetune/__init__.py +0 -0
  117. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/finetune/feature_spec.py +0 -0
  118. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/finetune/preprocessing.py +0 -0
  119. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/finetune/scorer.py +0 -0
  120. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/finetune/task.py +0 -0
  121. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/finetune/task_builder.py +0 -0
  122. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/flops_computation.py +0 -0
  123. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/model/__init__.py +0 -0
  124. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/model/modeling.py +0 -0
  125. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/model/optimization.py +0 -0
  126. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/model/tokenization.py +0 -0
  127. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/pretrain/__init__.py +0 -0
  128. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/pretrain/pretrain_data.py +0 -0
  129. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/pretrain/pretrain_helpers.py +0 -0
  130. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/run_finetuning.py +0 -0
  131. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/run_pretraining.py +0 -0
  132. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/util/__init__.py +0 -0
  133. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/util/training_utils.py +0 -0
  134. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/araelectra/util/utils.py +0 -0
  135. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/__init__.py +0 -0
  136. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/create_pretraining_data.py +0 -0
  137. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/gpt2/__init__.py +0 -0
  138. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/gpt2/lamb_optimizer.py +0 -0
  139. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/gpt2/optimization.py +0 -0
  140. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/gpt2/run_pretraining.py +0 -0
  141. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/grover/__init__.py +0 -0
  142. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/grover/dataloader.py +0 -0
  143. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/grover/modeling.py +0 -0
  144. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/grover/modeling_gpt2.py +0 -0
  145. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/grover/optimization_adafactor.py +0 -0
  146. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/grover/train_tpu.py +0 -0
  147. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/grover/utils.py +0 -0
  148. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/aragpt2/train_bpe_tokenizer.py +0 -0
  149. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/arabert/preprocess.py +0 -0
  150. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/environment.yml +0 -0
  151. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/install_env.py +0 -0
  152. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/morphology/ALMA_multi_word.py +0 -0
  153. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/morphology/__init__.py +0 -0
  154. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/data/__init__.py +0 -0
  155. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/data/datasets.py +0 -0
  156. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/data/transforms.py +0 -0
  157. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/data_format.py +0 -0
  158. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/datasets.py +0 -0
  159. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/entity_extractor.py +0 -0
  160. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/helpers.py +0 -0
  161. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/metrics.py +0 -0
  162. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/nn/BaseModel.py +0 -0
  163. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/nn/BertNestedTagger.py +0 -0
  164. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/nn/BertSeqTagger.py +0 -0
  165. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/nn/__init__.py +0 -0
  166. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/relation_extractor.py +0 -0
  167. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/trainers/BaseTrainer.py +0 -0
  168. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/trainers/BertNestedTrainer.py +0 -0
  169. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/trainers/BertTrainer.py +0 -0
  170. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/trainers/__init__.py +0 -0
  171. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/ner/transforms.py +0 -0
  172. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/semantic_relatedness/__init__.py +0 -0
  173. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/semantic_relatedness/compute_relatedness.py +0 -0
  174. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/sinatools.py +0 -0
  175. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/synonyms/__init__.py +0 -0
  176. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/synonyms/synonyms_generator.py +0 -0
  177. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/utils/__init__.py +0 -0
  178. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/utils/charsets.py +0 -0
  179. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/utils/parser.py +0 -0
  180. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/utils/readfile.py +0 -0
  181. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/utils/similarity.py +0 -0
  182. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/utils/text_dublication_detector.py +0 -0
  183. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/utils/text_transliteration.py +0 -0
  184. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/utils/tokenizer.py +0 -0
  185. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/utils/tokenizers_words.py +0 -0
  186. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/utils/word_compare.py +0 -0
  187. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/wsd/__init__.py +0 -0
  188. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/wsd/disambiguator.py +0 -0
  189. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/wsd/settings.py +0 -0
  190. {SinaTools-0.1.29 → SinaTools-0.1.30}/sinatools/wsd/wsd.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: SinaTools
3
- Version: 0.1.29
3
+ Version: 0.1.30
4
4
  Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
5
5
  Home-page: https://github.com/SinaLab/sinatools
6
6
  License: MIT license
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: SinaTools
3
- Version: 0.1.29
3
+ Version: 0.1.30
4
4
  Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
5
5
  Home-page: https://github.com/SinaLab/sinatools
6
6
  License: MIT license
@@ -16,7 +16,8 @@ urls = {
16
16
  'three_grams':'https://sina.birzeit.edu/three_grams.pickle',
17
17
  'two_grams':'https://sina.birzeit.edu/two_grams.pickle',
18
18
  'graph_l2':'https://sina.birzeit.edu/graph_l2.pkl',
19
- 'graph_l3':'https://sina.birzeit.edu/graph_l3.pkl'
19
+ 'graph_l3':'https://sina.birzeit.edu/graph_l3.pkl',
20
+ 'relation':'https://sina.birzeit.edu/relation_model.zip'
20
21
  }
21
22
 
22
23
  def get_appdatadir():
@@ -0,0 +1 @@
1
+ 0.1.30
@@ -3,6 +3,7 @@ from sinatools.utils.tokenizers_words import simple_word_tokenize
3
3
  from sinatools.utils.parser import arStrip
4
4
  from sinatools.utils.charsets import AR_CHARSET, AR_DIAC_CHARSET
5
5
  from sinatools.DataDownload.downloader import get_appdatadir
6
+ from sinatools.morphology.morph_analyzer import remove_punctuation
6
7
  from . import dictionary
7
8
 
8
9
  _IS_AR_RE = re.compile(u'^[' + re.escape(u''.join(AR_CHARSET)) + u']+$')
@@ -98,13 +99,16 @@ def analyze(text, language ='MSA', task ='full', flag="1"):
98
99
  token = arStrip(token , False , True , False , False , False , False)
99
100
  token = re.sub('[ٱ]','ﺍ',token)
100
101
  # token, freq, lemma, lemma_id, root, pos
101
- solution = [token, 0, token+"_0", 0, token, ""]
102
+ solution = [token, 0, token, 0, token, ""]
102
103
 
103
104
  if token.isdigit():
104
- solution[5] = "digit" #pos
105
+ solution[5] = "رقم" #pos
106
+
107
+ elif remove_punctuation(token).strip() == "":
108
+ solution[5] = "علامة ترقيم" #pos
105
109
 
106
110
  elif not _is_ar(token):
107
- solution[5] = "Foreign" #pos
111
+ solution[5] = "أجنبي" #pos
108
112
 
109
113
  else:
110
114
  result_token = find_solution(token,language,flag)
@@ -39,5 +39,4 @@ train_config.trainer_config["kwargs"]["model"] = model
39
39
  tagger = load_object(train_config.trainer_config["fn"], train_config.trainer_config["kwargs"])
40
40
  tagger.load(os.path.join(model_path,"checkpoints"))
41
41
 
42
- pipe = pipeline("sentiment-analysis", model= os.path.join(path, "best_model"), return_all_scores =True, max_length=128, truncation=True)
43
- #pipe = AutoModelForSequenceClassification.from_pretrained(os.path.join(path, "best_model"))
42
+ pipe = pipeline("sentiment-analysis", model= os.path.join(path, "relation_model"), return_all_scores =True, max_length=128, truncation=True)
@@ -1 +0,0 @@
1
- 0.1.29
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes