SinaTools 0.1.29__tar.gz → 0.1.31__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {SinaTools-0.1.29 → SinaTools-0.1.31}/PKG-INFO +1 -1
- {SinaTools-0.1.29 → SinaTools-0.1.31}/SinaTools.egg-info/PKG-INFO +1 -1
- {SinaTools-0.1.29 → SinaTools-0.1.31}/SinaTools.egg-info/SOURCES.txt +2 -1
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/DataDownload/downloader.py +2 -1
- SinaTools-0.1.31/sinatools/VERSION +1 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/morphology/morph_analyzer.py +7 -3
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/__init__.py +0 -5
- SinaTools-0.1.31/sinatools/relations/__init__.py +7 -0
- {SinaTools-0.1.29/sinatools/ner → SinaTools-0.1.31/sinatools/relations}/relation_extractor.py +28 -30
- SinaTools-0.1.29/sinatools/VERSION +0 -1
- {SinaTools-0.1.29 → SinaTools-0.1.31}/AUTHORS.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/CONTRIBUTING.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/LICENSE +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/MANIFEST.in +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/README.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/SinaTools.egg-info/dependency_links.txt +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/SinaTools.egg-info/entry_points.txt +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/SinaTools.egg-info/not-zip-safe +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/SinaTools.egg-info/requires.txt +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/SinaTools.egg-info/top_level.txt +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/Makefile +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/_images/download.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/_static/download.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/_static/file.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/_static/minus.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/_static/plus.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/html/_images/SinaLogo.jpg +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/html/_images/download.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/html/_static/SinaLogo.jpg +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/html/_static/download.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/html/_static/file.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/html/_static/minus.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/build/html/_static/plus.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/make.bat +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/License.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/Overview.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/_static/SinaLogo.jpg +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/_static/download.png +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/about.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/DataDownload/downloader.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/DataDownload.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/arabiner/bin/infer.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/arabiner.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/morphology/morph_analyzer.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/morphology.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/salma/views.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/salma.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/utils/corpus_tokenizer.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/utils/implication.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/utils/jaccard.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/utils/parser.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/utils/sentence_tokenizer.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/utils/text_transliteration.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api/utils.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/api.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/authors.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/DataDownload/download_files.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/DataDownload/get_appdatadir.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/DataDownload.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/arabiner/infer.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/arabiner.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/morphology/ALMA_multi_word.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/morphology/morph_analyzer.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/morphology.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/salma/salma_tools.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/salma.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/utils/arStrip.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/utils/corpus_tokenizer.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/utils/implication.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/utils/jaccard.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/utils/latin_remove.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/utils/remove_punc.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/utils/sentence_tokenizer.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/utils/text_transliteration.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools/utils.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/cli_tools.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/conf.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/index.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/installation.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/docs/source/readme.rst +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/setup.cfg +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/setup.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/DataDownload/download_files.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/morphology/ALMA_multi_word.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/morphology/morph_analyzer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/ner/corpus_entity_extractor.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/ner/entity_extractor.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/utils/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/utils/arStrip.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/utils/corpus_tokenizer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/utils/implication.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/utils/jaccard.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/utils/remove_latin.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/utils/remove_punctuation.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/utils/sentence_tokenizer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/utils/text_dublication_detector.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/CLI/utils/text_transliteration.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/DataDownload/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/create_classification_data.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/create_pretraining_data.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/extract_features.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/lamb_optimizer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/modeling.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/optimization.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/run_classifier.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/run_pretraining.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/run_squad.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/tokenization.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/build_openwebtext_pretraining_dataset.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/build_pretraining_dataset.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/build_pretraining_dataset_single_file.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/configure_finetuning.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/configure_pretraining.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/finetune/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/finetune/feature_spec.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/finetune/preprocessing.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/finetune/scorer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/finetune/task.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/finetune/task_builder.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/flops_computation.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/model/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/model/modeling.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/model/optimization.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/model/tokenization.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/pretrain/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/pretrain/pretrain_data.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/pretrain/pretrain_helpers.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/run_finetuning.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/run_pretraining.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/util/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/util/training_utils.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/util/utils.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/create_pretraining_data.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/gpt2/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/gpt2/lamb_optimizer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/gpt2/optimization.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/gpt2/run_pretraining.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/grover/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/grover/dataloader.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/grover/modeling.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/grover/modeling_gpt2.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/grover/optimization_adafactor.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/grover/train_tpu.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/grover/utils.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/train_bpe_tokenizer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/preprocess.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/environment.yml +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/install_env.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/morphology/ALMA_multi_word.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/morphology/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/data/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/data/datasets.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/data/transforms.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/data_format.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/datasets.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/entity_extractor.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/helpers.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/metrics.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/nn/BaseModel.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/nn/BertNestedTagger.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/nn/BertSeqTagger.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/nn/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/trainers/BaseTrainer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/trainers/BertNestedTrainer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/trainers/BertTrainer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/trainers/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/ner/transforms.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/semantic_relatedness/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/semantic_relatedness/compute_relatedness.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/sinatools.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/synonyms/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/synonyms/synonyms_generator.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/utils/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/utils/charsets.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/utils/parser.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/utils/readfile.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/utils/similarity.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/utils/text_dublication_detector.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/utils/text_transliteration.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/utils/tokenizer.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/utils/tokenizers_words.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/utils/word_compare.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/wsd/__init__.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/wsd/disambiguator.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/wsd/settings.py +0 -0
- {SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/wsd/wsd.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: SinaTools
|
3
|
-
Version: 0.1.29
|
3
|
+
Version: 0.1.31
|
4
4
|
Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
|
5
5
|
Home-page: https://github.com/SinaLab/sinatools
|
6
6
|
License: MIT license
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: SinaTools
|
3
|
-
Version: 0.1.29
|
3
|
+
Version: 0.1.31
|
4
4
|
Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
|
5
5
|
Home-page: https://github.com/SinaLab/sinatools
|
6
6
|
License: MIT license
|
@@ -155,7 +155,6 @@ sinatools/ner/datasets.py
|
|
155
155
|
sinatools/ner/entity_extractor.py
|
156
156
|
sinatools/ner/helpers.py
|
157
157
|
sinatools/ner/metrics.py
|
158
|
-
sinatools/ner/relation_extractor.py
|
159
158
|
sinatools/ner/transforms.py
|
160
159
|
sinatools/ner/data/__init__.py
|
161
160
|
sinatools/ner/data/datasets.py
|
@@ -168,6 +167,8 @@ sinatools/ner/trainers/BaseTrainer.py
|
|
168
167
|
sinatools/ner/trainers/BertNestedTrainer.py
|
169
168
|
sinatools/ner/trainers/BertTrainer.py
|
170
169
|
sinatools/ner/trainers/__init__.py
|
170
|
+
sinatools/relations/__init__.py
|
171
|
+
sinatools/relations/relation_extractor.py
|
171
172
|
sinatools/semantic_relatedness/__init__.py
|
172
173
|
sinatools/semantic_relatedness/compute_relatedness.py
|
173
174
|
sinatools/synonyms/__init__.py
|
@@ -16,7 +16,8 @@ urls = {
|
|
16
16
|
'three_grams':'https://sina.birzeit.edu/three_grams.pickle',
|
17
17
|
'two_grams':'https://sina.birzeit.edu/two_grams.pickle',
|
18
18
|
'graph_l2':'https://sina.birzeit.edu/graph_l2.pkl',
|
19
|
-
'graph_l3':'https://sina.birzeit.edu/graph_l3.pkl'
|
19
|
+
'graph_l3':'https://sina.birzeit.edu/graph_l3.pkl',
|
20
|
+
'relation':'https://sina.birzeit.edu/relation_model.zip'
|
20
21
|
}
|
21
22
|
|
22
23
|
def get_appdatadir():
|
@@ -0,0 +1 @@
|
|
1
|
+
0.1.31
|
@@ -3,6 +3,7 @@ from sinatools.utils.tokenizers_words import simple_word_tokenize
|
|
3
3
|
from sinatools.utils.parser import arStrip
|
4
4
|
from sinatools.utils.charsets import AR_CHARSET, AR_DIAC_CHARSET
|
5
5
|
from sinatools.DataDownload.downloader import get_appdatadir
|
6
|
+
from sinatools.morphology.morph_analyzer import remove_punctuation
|
6
7
|
from . import dictionary
|
7
8
|
|
8
9
|
_IS_AR_RE = re.compile(u'^[' + re.escape(u''.join(AR_CHARSET)) + u']+$')
|
@@ -98,13 +99,16 @@ def analyze(text, language ='MSA', task ='full', flag="1"):
|
|
98
99
|
token = arStrip(token , False , True , False , False , False , False)
|
99
100
|
token = re.sub('[ٱ]','ﺍ',token)
|
100
101
|
# token, freq, lemma, lemma_id, root, pos
|
101
|
-
solution = [token, 0, token
|
102
|
+
solution = [token, 0, token, 0, token, ""]
|
102
103
|
|
103
104
|
if token.isdigit():
|
104
|
-
solution[5] = "
|
105
|
+
solution[5] = "رقم" #pos
|
106
|
+
|
107
|
+
elif remove_punctuation(token).strip() == "":
|
108
|
+
solution[5] = "علامة ترقيم" #pos
|
105
109
|
|
106
110
|
elif not _is_ar(token):
|
107
|
-
solution[5] = "
|
111
|
+
solution[5] = "أجنبي" #pos
|
108
112
|
|
109
113
|
else:
|
110
114
|
result_token = find_solution(token,language,flag)
|
@@ -7,8 +7,6 @@ import torch
|
|
7
7
|
import pickle
|
8
8
|
import json
|
9
9
|
from argparse import Namespace
|
10
|
-
from transformers import pipeline
|
11
|
-
#from transformers import AutoModelForSequenceClassification
|
12
10
|
|
13
11
|
tagger = None
|
14
12
|
tag_vocab = None
|
@@ -38,6 +36,3 @@ if torch.cuda.is_available():
|
|
38
36
|
train_config.trainer_config["kwargs"]["model"] = model
|
39
37
|
tagger = load_object(train_config.trainer_config["fn"], train_config.trainer_config["kwargs"])
|
40
38
|
tagger.load(os.path.join(model_path,"checkpoints"))
|
41
|
-
|
42
|
-
pipe = pipeline("sentiment-analysis", model= os.path.join(path, "best_model"), return_all_scores =True, max_length=128, truncation=True)
|
43
|
-
#pipe = AutoModelForSequenceClassification.from_pretrained(os.path.join(path, "best_model"))
|
@@ -0,0 +1,7 @@
|
|
1
|
+
from sinatools.DataDownload import downloader
|
2
|
+
import os
|
3
|
+
from transformers import pipeline
|
4
|
+
|
5
|
+
path =downloader.get_appdatadir()
|
6
|
+
|
7
|
+
pipe = pipeline("sentiment-analysis", model= os.path.join(path, "relation_model"), return_all_scores =True, max_length=128, truncation=True)
|
{SinaTools-0.1.29/sinatools/ner → SinaTools-0.1.31/sinatools/relations}/relation_extractor.py
RENAMED
@@ -1,10 +1,8 @@
|
|
1
|
-
import torch
|
2
|
-
import json
|
3
1
|
from urllib.request import Request, urlopen
|
4
2
|
from sinatools.ner.entity_extractor import extract
|
3
|
+
from sinatools.utils.tokenizer import sentence_tokenizer
|
5
4
|
from . import pipe
|
6
5
|
|
7
|
-
|
8
6
|
# ============================ Extract entities and their types ========================
|
9
7
|
def jsons_to_list_of_lists(json_list):
|
10
8
|
return [[d['token'], d['tags']] for d in json_list]
|
@@ -168,34 +166,34 @@ def get_entity_category(entity_type, categories):
|
|
168
166
|
|
169
167
|
|
170
168
|
# ============ Extract entities, their types and categorize them ===============
|
171
|
-
def
|
172
|
-
#test_sentence="صورة إعتقال طفل فلسطيني خلال انتفاضة الأقصى ."
|
173
|
-
entities=entities_and_types(sentence)
|
174
|
-
|
175
|
-
event_indices = [i for i, (_, entity_type) in enumerate(entities.items()) if entity_type == 'EVENT']
|
176
|
-
arg_event_indices = [i for i, (_, entity_type) in enumerate(entities.items()) if entity_type != 'EVENT']
|
169
|
+
def event_argument_relation_extraction(documnet):
|
177
170
|
|
171
|
+
sentences=sentence_tokenizer(documnet)
|
178
172
|
output_list=[]
|
179
|
-
|
180
|
-
|
181
|
-
|
182
|
-
|
183
|
-
|
184
|
-
|
185
|
-
|
186
|
-
|
187
|
-
|
188
|
-
|
189
|
-
|
190
|
-
|
191
|
-
|
192
|
-
|
193
|
-
|
194
|
-
|
195
|
-
|
196
|
-
|
197
|
-
|
198
|
-
|
199
|
-
|
173
|
+
relation={}
|
174
|
+
triple_id=0
|
175
|
+
for sentence in sentences:
|
176
|
+
entities=entities_and_types(sentence)
|
177
|
+
entity_identifier={entity:i for entity, i in zip(entities,range(1,len(entities)+1))}
|
178
|
+
|
179
|
+
event_indices = [i for i, (_, entity_type) in enumerate(entities.items()) if entity_type == 'EVENT']
|
180
|
+
arg_event_indices = [i for i, (_, entity_type) in enumerate(entities.items()) if entity_type != 'EVENT']
|
181
|
+
|
182
|
+
|
183
|
+
for i in event_indices:
|
184
|
+
event_entity=list(entities.keys())[i]
|
185
|
+
for j in arg_event_indices:
|
186
|
+
arg_name= list(entities.keys())[j]
|
187
|
+
arg_type=entities[arg_name]
|
188
|
+
category = get_entity_category(arg_type, categories)
|
189
|
+
|
190
|
+
if category in temp03:
|
191
|
+
relation_sentence=f"[CLS] {sentence} [SEP] {event_entity} {temp03[category]} {arg_name}"
|
192
|
+
predicted_relation=pipe(relation_sentence)
|
193
|
+
score = predicted_relation[0][0]['score']
|
194
|
+
if score > 0.50:
|
195
|
+
triple_id+=1
|
196
|
+
relation={"TripleID":triple_id,"Subject":{"ID":entity_identifier[event_entity],"Type": entities[event_entity], "Label":event_entity}, "Relation": category, "Object":{"ID":entity_identifier[arg_name],"Type": entities[arg_name], "Label":arg_name,}}
|
197
|
+
output_list.append(relation)
|
200
198
|
|
201
199
|
return output_list
|
@@ -1 +0,0 @@
|
|
1
|
-
0.1.29
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/arabert/create_classification_data.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/build_pretraining_dataset.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/finetune/preprocessing.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/pretrain/pretrain_data.py
RENAMED
File without changes
|
{SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/araelectra/pretrain/pretrain_helpers.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{SinaTools-0.1.29 → SinaTools-0.1.31}/sinatools/arabert/aragpt2/grover/optimization_adafactor.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|