pelican-nlp 0.2.2__tar.gz → 0.2.3__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (102)
  1. {pelican_nlp-0.2.2/pelican_nlp.egg-info → pelican_nlp-0.2.3}/PKG-INFO +1 -1
  2. pelican_nlp-0.2.3/pelican_nlp/_version.py +1 -0
  3. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/core/corpus.py +6 -6
  4. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3/pelican_nlp.egg-info}/PKG-INFO +1 -1
  5. pelican_nlp-0.2.2/pelican_nlp/_version.py +0 -1
  6. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/LICENSE +0 -0
  7. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/MANIFEST.in +0 -0
  8. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/README.rst +0 -0
  9. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_discourse/config_discourse.yml +0 -0
  10. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_discourse/subjects/sub-01/interview/sub-01_interview_schizophrenia_run-01.rtf +0 -0
  11. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_fluency/config_fluency.yml +0 -0
  12. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_fluency/subjects/sub-01/fluency/sub-01_fluency_sem_animals.txt +0 -0
  13. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_fluency/subjects/sub-01/fluency/sub-01_fluency_sem_clothes.txt +0 -0
  14. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_fluency/subjects/sub-01/fluency/sub-01_fluency_sem_food.txt +0 -0
  15. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_fluency/subjects/sub-02/fluency/sub-02_fluency_sem_animals.txt +0 -0
  16. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_fluency/subjects/sub-02/fluency/sub-02_fluency_sem_clothes.txt +0 -0
  17. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_fluency/subjects/sub-02/fluency/sub-02_fluency_sem_food.txt +0 -0
  18. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_image-descriptions/config_image-descriptions.yml +0 -0
  19. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_image-descriptions/subjects/sub-01/ses-01/image-description/sub-01_ses-01_image-description_drug.docx +0 -0
  20. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_image-descriptions/subjects/sub-01/ses-01/image-description/sub-01_ses-01_image-description_placebo.docx +0 -0
  21. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_image-descriptions/subjects/sub-01/ses-02/image-description/sub-01_ses-02_image-description_drug.docx +0 -0
  22. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_image-descriptions/subjects/sub-01/ses-02/image-description/sub-01_ses-02_image-description_placebo.docx +0 -0
  23. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_image-descriptions/subjects/sub-02/ses-01/image-description/sub-02_ses-01_image-description_drug.docx +0 -0
  24. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/examples/PyPI_testing_image-descriptions/subjects/sub-02/ses-01/image-description/sub-02_ses-01_image-description_placebo.docx +0 -0
  25. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/__init__.py +0 -0
  26. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/extract_acoustic_features.py +0 -0
  27. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/__init__.py +0 -0
  28. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/aggregate_fluency_results.py +0 -0
  29. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/behavioral_data.py +0 -0
  30. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/check_duplicates.py +0 -0
  31. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/coherence.py +0 -0
  32. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/config.py +0 -0
  33. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/main.py +0 -0
  34. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/optimality_without_tsa.py +0 -0
  35. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/plot_fluency.py +0 -0
  36. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/plotting_utils.py +0 -0
  37. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/questionnaires_data.py +0 -0
  38. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/stats_fluency.py +0 -0
  39. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/fluency/utils.py +0 -0
  40. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/speaker_diarization_Nils.py +0 -0
  41. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/__init__.py +0 -0
  42. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/annotation_tool.py +0 -0
  43. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/annotation_tool_boundaries.py +0 -0
  44. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/annotation_tool_sandbox.py +0 -0
  45. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/output/holmes_control_nova_all_outputs.json +0 -0
  46. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/test.json +0 -0
  47. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/transcribe_audio.py +0 -0
  48. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/transcribe_audio_chunked.py +0 -0
  49. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/transcription.py +0 -0
  50. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/transcription_gui.py +0 -0
  51. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Nils_backup/transcription/word_boundaries.py +0 -0
  52. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Silvia_files/Opensmile/opensmile_feature_extraction.py +0 -0
  53. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/Silvia_files/prosogram/prosogram.py +0 -0
  54. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/__init__.py +0 -0
  55. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/cli.py +0 -0
  56. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/configuration_files/config_audio.yml +0 -0
  57. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/configuration_files/config_discourse.yml +0 -0
  58. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/configuration_files/config_fluency.yml +0 -0
  59. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/configuration_files/config_general.yml +0 -0
  60. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/configuration_files/config_morteza.yml +0 -0
  61. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/core/__init__.py +0 -0
  62. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/core/audio_document.py +0 -0
  63. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/core/document.py +0 -0
  64. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/core/subject.py +0 -0
  65. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/__init__.py +0 -0
  66. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/acoustic_feature_extraction.py +0 -0
  67. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/distance_from_randomness.py +0 -0
  68. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/extract_embeddings.py +0 -0
  69. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/extract_logits.py +0 -0
  70. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/language_model.py +0 -0
  71. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/semantic_similarity.py +0 -0
  72. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/test_documents/test_features.csv +0 -0
  73. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/test_documents/wallace_1.15_3.txt +0 -0
  74. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/test_documents/wallace_1.1_3.txt +0 -0
  75. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/extraction/test_documents/wallace_1_4.txt +0 -0
  76. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/main.py +0 -0
  77. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/metrics_statistics/embeddings_metrics_statistics.py +0 -0
  78. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/praat/__init__.py +0 -0
  79. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/preprocessing/LPDS.py +0 -0
  80. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/preprocessing/__init__.py +0 -0
  81. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/preprocessing/pipeline.py +0 -0
  82. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/preprocessing/speaker_diarization.py +0 -0
  83. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/preprocessing/text_cleaner.py +0 -0
  84. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/preprocessing/text_importer.py +0 -0
  85. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/preprocessing/text_normalizer.py +0 -0
  86. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/preprocessing/text_tokenizer.py +0 -0
  87. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/sample_configuration_files/config_discourse.yml +0 -0
  88. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/sample_configuration_files/config_fluency.yml +0 -0
  89. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/sample_configuration_files/config_general.yml +0 -0
  90. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/utils/__init__.py +0 -0
  91. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/utils/csv_functions.py +0 -0
  92. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/utils/sample_usage.py +0 -0
  93. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp/utils/setup_functions.py +0 -0
  94. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp.egg-info/SOURCES.txt +0 -0
  95. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp.egg-info/dependency_links.txt +0 -0
  96. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp.egg-info/entry_points.txt +0 -0
  97. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp.egg-info/requires.txt +0 -0
  98. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pelican_nlp.egg-info/top_level.txt +0 -0
  99. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/pyproject.toml +0 -0
  100. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/requirements.txt +0 -0
  101. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/setup.cfg +0 -0
  102. {pelican_nlp-0.2.2 → pelican_nlp-0.2.3}/tests/__init__.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: pelican_nlp
3
- Version: 0.2.2
3
+ Version: 0.2.3
4
4
  Summary: Preprocessing and Extraction of Linguistic Information for Computational Analysis
5
5
  Author-email: Yves Pauli <yves.pauli@gmail.com>
6
6
  License-Expression: CC-BY-NC-4.0
@@ -0,0 +1 @@
1
+ __version__ = "0.2.3"
@@ -16,11 +16,12 @@ import pandas as pd
16
16
  import re
17
17
 
18
18
  class Corpus:
19
- def __init__(self, corpus_name, documents, configuration_settings):
19
+ def __init__(self, corpus_name, documents, configuration_settings, project_folder):
20
20
  self.name = corpus_name
21
21
  self.documents = documents
22
22
  self.config = configuration_settings
23
- self.derivative_dir = self.config['PATH_TO_PROJECT_FOLDER']+'/derivatives'
23
+ self.project_folder = project_folder
24
+ self.derivative_dir = project_folder + '/derivatives'
24
25
  self.pipeline = TextPreprocessingPipeline(self.config)
25
26
  self.task = configuration_settings['task_name']
26
27
  self.results_path = None
@@ -112,14 +113,13 @@ class Corpus:
112
113
  from pelican_nlp.extraction.extract_logits import LogitsExtractor
113
114
  from pelican_nlp.preprocessing.text_tokenizer import TextTokenizer
114
115
  logits_options = self.config['options_logits']
115
- project_path = self.config['PATH_TO_PROJECT_FOLDER']
116
116
 
117
117
  print('logits extraction in progress')
118
118
  model_name = logits_options['model_name']
119
119
  logitsExtractor = LogitsExtractor(logits_options,
120
120
  self.pipeline,
121
- project_path)
122
- model = Model(model_name, project_path)
121
+ self.project_folder)
122
+ model = Model(model_name, self.project_folder)
123
123
  model.load_model()
124
124
  model_instance = model.model_instance
125
125
  tokenizer = TextTokenizer(logits_options['tokenization_method'], model_name=logits_options['model_name'])
@@ -153,7 +153,7 @@ class Corpus:
153
153
 
154
154
  embedding_options = self.config['options_embeddings']
155
155
  print('Embeddings extraction in progress...')
156
- embeddingsExtractor = EmbeddingsExtractor(embedding_options, self.config['PATH_TO_PROJECT_FOLDER'])
156
+ embeddingsExtractor = EmbeddingsExtractor(embedding_options, self.project_folder)
157
157
  for i in range(len(self.documents)):
158
158
  for key, section in self.documents[i].cleaned_sections.items():
159
159
  print(f'Processing section {key}')
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: pelican_nlp
3
- Version: 0.2.2
3
+ Version: 0.2.3
4
4
  Summary: Preprocessing and Extraction of Linguistic Information for Computational Analysis
5
5
  Author-email: Yves Pauli <yves.pauli@gmail.com>
6
6
  License-Expression: CC-BY-NC-4.0
@@ -1 +0,0 @@
1
- __version__ = "0.2.2"
File without changes
File without changes
File without changes
File without changes
File without changes