SinaTools 0.1.30__tar.gz → 0.1.32__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {SinaTools-0.1.30 → SinaTools-0.1.32}/PKG-INFO +1 -1
- {SinaTools-0.1.30 → SinaTools-0.1.32}/SinaTools.egg-info/PKG-INFO +1 -1
- {SinaTools-0.1.30 → SinaTools-0.1.32}/SinaTools.egg-info/SOURCES.txt +2 -1
- SinaTools-0.1.32/sinatools/VERSION +1 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/morphology/morph_analyzer.py +1 -1
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/__init__.py +0 -4
- SinaTools-0.1.32/sinatools/relations/__init__.py +7 -0
- {SinaTools-0.1.30/sinatools/ner → SinaTools-0.1.32/sinatools/relations}/relation_extractor.py +28 -30
- SinaTools-0.1.30/sinatools/VERSION +0 -1
- {SinaTools-0.1.30 → SinaTools-0.1.32}/AUTHORS.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/CONTRIBUTING.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/LICENSE +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/MANIFEST.in +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/README.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/SinaTools.egg-info/dependency_links.txt +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/SinaTools.egg-info/entry_points.txt +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/SinaTools.egg-info/not-zip-safe +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/SinaTools.egg-info/requires.txt +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/SinaTools.egg-info/top_level.txt +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/Makefile +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/_images/download.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/_static/download.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/_static/file.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/_static/minus.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/_static/plus.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/html/_images/SinaLogo.jpg +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/html/_images/download.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/html/_static/SinaLogo.jpg +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/html/_static/download.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/html/_static/file.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/html/_static/minus.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/build/html/_static/plus.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/make.bat +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/License.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/Overview.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/_static/SinaLogo.jpg +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/_static/download.png +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/about.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/DataDownload/downloader.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/DataDownload.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/arabiner/bin/infer.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/arabiner.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/morphology/morph_analyzer.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/morphology.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/salma/views.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/salma.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/utils/corpus_tokenizer.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/utils/implication.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/utils/jaccard.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/utils/parser.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/utils/sentence_tokenizer.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/utils/text_transliteration.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api/utils.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/api.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/authors.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/DataDownload/download_files.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/DataDownload/get_appdatadir.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/DataDownload.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/arabiner/infer.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/arabiner.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/morphology/ALMA_multi_word.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/morphology/morph_analyzer.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/morphology.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/salma/salma_tools.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/salma.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/utils/arStrip.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/utils/corpus_tokenizer.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/utils/implication.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/utils/jaccard.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/utils/latin_remove.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/utils/remove_punc.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/utils/sentence_tokenizer.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/utils/text_transliteration.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools/utils.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/cli_tools.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/conf.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/index.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/installation.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/docs/source/readme.rst +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/setup.cfg +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/setup.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/DataDownload/download_files.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/morphology/ALMA_multi_word.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/morphology/morph_analyzer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/ner/corpus_entity_extractor.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/ner/entity_extractor.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/utils/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/utils/arStrip.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/utils/corpus_tokenizer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/utils/implication.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/utils/jaccard.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/utils/remove_latin.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/utils/remove_punctuation.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/utils/sentence_tokenizer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/utils/text_dublication_detector.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/CLI/utils/text_transliteration.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/DataDownload/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/DataDownload/downloader.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/create_classification_data.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/create_pretraining_data.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/extract_features.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/lamb_optimizer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/modeling.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/optimization.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/run_classifier.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/run_pretraining.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/run_squad.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/tokenization.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/build_openwebtext_pretraining_dataset.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/build_pretraining_dataset.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/build_pretraining_dataset_single_file.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/configure_finetuning.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/configure_pretraining.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/finetune/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/finetune/feature_spec.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/finetune/preprocessing.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/finetune/scorer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/finetune/task.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/finetune/task_builder.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/flops_computation.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/model/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/model/modeling.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/model/optimization.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/model/tokenization.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/pretrain/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/pretrain/pretrain_data.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/pretrain/pretrain_helpers.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/run_finetuning.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/run_pretraining.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/util/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/util/training_utils.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/util/utils.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/create_pretraining_data.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/gpt2/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/gpt2/lamb_optimizer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/gpt2/optimization.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/gpt2/run_pretraining.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/grover/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/grover/dataloader.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/grover/modeling.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/grover/modeling_gpt2.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/grover/optimization_adafactor.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/grover/train_tpu.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/grover/utils.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/train_bpe_tokenizer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/preprocess.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/environment.yml +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/install_env.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/morphology/ALMA_multi_word.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/morphology/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/data/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/data/datasets.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/data/transforms.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/data_format.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/datasets.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/entity_extractor.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/helpers.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/metrics.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/nn/BaseModel.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/nn/BertNestedTagger.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/nn/BertSeqTagger.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/nn/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/trainers/BaseTrainer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/trainers/BertNestedTrainer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/trainers/BertTrainer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/trainers/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/ner/transforms.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/semantic_relatedness/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/semantic_relatedness/compute_relatedness.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/sinatools.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/synonyms/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/synonyms/synonyms_generator.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/utils/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/utils/charsets.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/utils/parser.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/utils/readfile.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/utils/similarity.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/utils/text_dublication_detector.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/utils/text_transliteration.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/utils/tokenizer.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/utils/tokenizers_words.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/utils/word_compare.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/wsd/__init__.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/wsd/disambiguator.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/wsd/settings.py +0 -0
- {SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/wsd/wsd.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: SinaTools
|
3
|
-
Version: 0.1.30
|
3
|
+
Version: 0.1.32
|
4
4
|
Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
|
5
5
|
Home-page: https://github.com/SinaLab/sinatools
|
6
6
|
License: MIT license
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: SinaTools
|
3
|
-
Version: 0.1.30
|
3
|
+
Version: 0.1.32
|
4
4
|
Summary: Open-source Python toolkit for Arabic Natural Understanding, allowing people to integrate it in their system workflow.
|
5
5
|
Home-page: https://github.com/SinaLab/sinatools
|
6
6
|
License: MIT license
|
@@ -155,7 +155,6 @@ sinatools/ner/datasets.py
|
|
155
155
|
sinatools/ner/entity_extractor.py
|
156
156
|
sinatools/ner/helpers.py
|
157
157
|
sinatools/ner/metrics.py
|
158
|
-
sinatools/ner/relation_extractor.py
|
159
158
|
sinatools/ner/transforms.py
|
160
159
|
sinatools/ner/data/__init__.py
|
161
160
|
sinatools/ner/data/datasets.py
|
@@ -168,6 +167,8 @@ sinatools/ner/trainers/BaseTrainer.py
|
|
168
167
|
sinatools/ner/trainers/BertNestedTrainer.py
|
169
168
|
sinatools/ner/trainers/BertTrainer.py
|
170
169
|
sinatools/ner/trainers/__init__.py
|
170
|
+
sinatools/relations/__init__.py
|
171
|
+
sinatools/relations/relation_extractor.py
|
171
172
|
sinatools/semantic_relatedness/__init__.py
|
172
173
|
sinatools/semantic_relatedness/compute_relatedness.py
|
173
174
|
sinatools/synonyms/__init__.py
|
@@ -0,0 +1 @@
|
|
1
|
+
0.1.32
|
@@ -3,7 +3,7 @@ from sinatools.utils.tokenizers_words import simple_word_tokenize
|
|
3
3
|
from sinatools.utils.parser import arStrip
|
4
4
|
from sinatools.utils.charsets import AR_CHARSET, AR_DIAC_CHARSET
|
5
5
|
from sinatools.DataDownload.downloader import get_appdatadir
|
6
|
-
from sinatools.
|
6
|
+
from sinatools.utils.parser import remove_punctuation
|
7
7
|
from . import dictionary
|
8
8
|
|
9
9
|
_IS_AR_RE = re.compile(u'^[' + re.escape(u''.join(AR_CHARSET)) + u']+$')
|
@@ -7,8 +7,6 @@ import torch
|
|
7
7
|
import pickle
|
8
8
|
import json
|
9
9
|
from argparse import Namespace
|
10
|
-
from transformers import pipeline
|
11
|
-
#from transformers import AutoModelForSequenceClassification
|
12
10
|
|
13
11
|
tagger = None
|
14
12
|
tag_vocab = None
|
@@ -38,5 +36,3 @@ if torch.cuda.is_available():
|
|
38
36
|
train_config.trainer_config["kwargs"]["model"] = model
|
39
37
|
tagger = load_object(train_config.trainer_config["fn"], train_config.trainer_config["kwargs"])
|
40
38
|
tagger.load(os.path.join(model_path,"checkpoints"))
|
41
|
-
|
42
|
-
pipe = pipeline("sentiment-analysis", model= os.path.join(path, "relation_model"), return_all_scores =True, max_length=128, truncation=True)
|
@@ -0,0 +1,7 @@
|
|
1
|
+
from sinatools.DataDownload import downloader
|
2
|
+
import os
|
3
|
+
from transformers import pipeline
|
4
|
+
|
5
|
+
path =downloader.get_appdatadir()
|
6
|
+
|
7
|
+
pipe = pipeline("sentiment-analysis", model= os.path.join(path, "relation_model"), return_all_scores =True, max_length=128, truncation=True)
|
{SinaTools-0.1.30/sinatools/ner → SinaTools-0.1.32/sinatools/relations}/relation_extractor.py
RENAMED
@@ -1,10 +1,8 @@
|
|
1
|
-
import torch
|
2
|
-
import json
|
3
1
|
from urllib.request import Request, urlopen
|
4
2
|
from sinatools.ner.entity_extractor import extract
|
3
|
+
from sinatools.utils.tokenizer import sentence_tokenizer
|
5
4
|
from . import pipe
|
6
5
|
|
7
|
-
|
8
6
|
# ============================ Extract entities and their types ========================
|
9
7
|
def jsons_to_list_of_lists(json_list):
|
10
8
|
return [[d['token'], d['tags']] for d in json_list]
|
@@ -168,34 +166,34 @@ def get_entity_category(entity_type, categories):
|
|
168
166
|
|
169
167
|
|
170
168
|
# ============ Extract entities, their types and categorize them ===============
|
171
|
-
def
|
172
|
-
#test_sentence="صورة إعتقال طفل فلسطيني خلال انتفاضة الأقصى ."
|
173
|
-
entities=entities_and_types(sentence)
|
174
|
-
|
175
|
-
event_indices = [i for i, (_, entity_type) in enumerate(entities.items()) if entity_type == 'EVENT']
|
176
|
-
arg_event_indices = [i for i, (_, entity_type) in enumerate(entities.items()) if entity_type != 'EVENT']
|
169
|
+
def event_argument_relation_extraction(documnet):
|
177
170
|
|
171
|
+
sentences=sentence_tokenizer(documnet)
|
178
172
|
output_list=[]
|
179
|
-
|
180
|
-
|
181
|
-
|
182
|
-
|
183
|
-
|
184
|
-
|
185
|
-
|
186
|
-
|
187
|
-
|
188
|
-
|
189
|
-
|
190
|
-
|
191
|
-
|
192
|
-
|
193
|
-
|
194
|
-
|
195
|
-
|
196
|
-
|
197
|
-
|
198
|
-
|
199
|
-
|
173
|
+
relation={}
|
174
|
+
triple_id=0
|
175
|
+
for sentence in sentences:
|
176
|
+
entities=entities_and_types(sentence)
|
177
|
+
entity_identifier={entity:i for entity, i in zip(entities,range(1,len(entities)+1))}
|
178
|
+
|
179
|
+
event_indices = [i for i, (_, entity_type) in enumerate(entities.items()) if entity_type == 'EVENT']
|
180
|
+
arg_event_indices = [i for i, (_, entity_type) in enumerate(entities.items()) if entity_type != 'EVENT']
|
181
|
+
|
182
|
+
|
183
|
+
for i in event_indices:
|
184
|
+
event_entity=list(entities.keys())[i]
|
185
|
+
for j in arg_event_indices:
|
186
|
+
arg_name= list(entities.keys())[j]
|
187
|
+
arg_type=entities[arg_name]
|
188
|
+
category = get_entity_category(arg_type, categories)
|
189
|
+
|
190
|
+
if category in temp03:
|
191
|
+
relation_sentence=f"[CLS] {sentence} [SEP] {event_entity} {temp03[category]} {arg_name}"
|
192
|
+
predicted_relation=pipe(relation_sentence)
|
193
|
+
score = predicted_relation[0][0]['score']
|
194
|
+
if score > 0.50:
|
195
|
+
triple_id+=1
|
196
|
+
relation={"TripleID":triple_id,"Subject":{"ID":entity_identifier[event_entity],"Type": entities[event_entity], "Label":event_entity}, "Relation": category, "Object":{"ID":entity_identifier[arg_name],"Type": entities[arg_name], "Label":arg_name,}}
|
197
|
+
output_list.append(relation)
|
200
198
|
|
201
199
|
return output_list
|
@@ -1 +0,0 @@
|
|
1
|
-
0.1.30
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/arabert/create_classification_data.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/build_pretraining_dataset.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/finetune/preprocessing.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/pretrain/pretrain_data.py
RENAMED
File without changes
|
{SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/araelectra/pretrain/pretrain_helpers.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{SinaTools-0.1.30 → SinaTools-0.1.32}/sinatools/arabert/aragpt2/grover/optimization_adafactor.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|