pelican-nlp 0.2.6__tar.gz → 0.2.7__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (102)
  1. {pelican_nlp-0.2.6/pelican_nlp.egg-info → pelican_nlp-0.2.7}/PKG-INFO +3 -3
  2. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/README.rst +2 -2
  3. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_discourse/config_discourse.yml +0 -1
  4. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_image-descriptions/config_image-descriptions.yml +0 -1
  5. pelican_nlp-0.2.7/pelican_nlp/_version.py +1 -0
  6. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/language_model.py +26 -2
  7. {pelican_nlp-0.2.6/examples/PyPI_testing_fluency → pelican_nlp-0.2.7/pelican_nlp/sample_configuration_files}/config_fluency.yml +0 -1
  8. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7/pelican_nlp.egg-info}/PKG-INFO +3 -3
  9. pelican_nlp-0.2.6/pelican_nlp/_version.py +0 -1
  10. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/LICENSE +0 -0
  11. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/MANIFEST.in +0 -0
  12. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_discourse/subjects/sub-01/interview/sub-01_interview_schizophrenia_run-01.rtf +0 -0
  13. {pelican_nlp-0.2.6/pelican_nlp/configuration_files → pelican_nlp-0.2.7/examples/PyPI_testing_fluency}/config_fluency.yml +0 -0
  14. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_fluency/subjects/sub-01/fluency/sub-01_fluency_sem_animals.txt +0 -0
  15. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_fluency/subjects/sub-01/fluency/sub-01_fluency_sem_clothes.txt +0 -0
  16. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_fluency/subjects/sub-01/fluency/sub-01_fluency_sem_food.txt +0 -0
  17. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_fluency/subjects/sub-02/fluency/sub-02_fluency_sem_animals.txt +0 -0
  18. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_fluency/subjects/sub-02/fluency/sub-02_fluency_sem_clothes.txt +0 -0
  19. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_fluency/subjects/sub-02/fluency/sub-02_fluency_sem_food.txt +0 -0
  20. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_image-descriptions/subjects/sub-01/ses-01/image-description/sub-01_ses-01_image-description_drug.docx +0 -0
  21. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_image-descriptions/subjects/sub-01/ses-01/image-description/sub-01_ses-01_image-description_placebo.docx +0 -0
  22. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_image-descriptions/subjects/sub-01/ses-02/image-description/sub-01_ses-02_image-description_drug.docx +0 -0
  23. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_image-descriptions/subjects/sub-01/ses-02/image-description/sub-01_ses-02_image-description_placebo.docx +0 -0
  24. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_image-descriptions/subjects/sub-02/ses-01/image-description/sub-02_ses-01_image-description_drug.docx +0 -0
  25. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/examples/PyPI_testing_image-descriptions/subjects/sub-02/ses-01/image-description/sub-02_ses-01_image-description_placebo.docx +0 -0
  26. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/__init__.py +0 -0
  27. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/extract_acoustic_features.py +0 -0
  28. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/__init__.py +0 -0
  29. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/aggregate_fluency_results.py +0 -0
  30. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/behavioral_data.py +0 -0
  31. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/check_duplicates.py +0 -0
  32. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/coherence.py +0 -0
  33. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/config.py +0 -0
  34. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/main.py +0 -0
  35. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/optimality_without_tsa.py +0 -0
  36. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/plot_fluency.py +0 -0
  37. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/plotting_utils.py +0 -0
  38. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/questionnaires_data.py +0 -0
  39. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/stats_fluency.py +0 -0
  40. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/fluency/utils.py +0 -0
  41. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/speaker_diarization_Nils.py +0 -0
  42. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/__init__.py +0 -0
  43. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/annotation_tool.py +0 -0
  44. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/annotation_tool_boundaries.py +0 -0
  45. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/annotation_tool_sandbox.py +0 -0
  46. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/output/holmes_control_nova_all_outputs.json +0 -0
  47. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/test.json +0 -0
  48. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/transcribe_audio.py +0 -0
  49. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/transcribe_audio_chunked.py +0 -0
  50. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/transcription.py +0 -0
  51. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/transcription_gui.py +0 -0
  52. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Nils_backup/transcription/word_boundaries.py +0 -0
  53. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Silvia_files/Opensmile/opensmile_feature_extraction.py +0 -0
  54. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/Silvia_files/prosogram/prosogram.py +0 -0
  55. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/__init__.py +0 -0
  56. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/cli.py +0 -0
  57. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/configuration_files/config_audio.yml +0 -0
  58. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/configuration_files/config_discourse.yml +0 -0
  59. {pelican_nlp-0.2.6/pelican_nlp/sample_configuration_files → pelican_nlp-0.2.7/pelican_nlp/configuration_files}/config_fluency.yml +0 -0
  60. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/configuration_files/config_general.yml +0 -0
  61. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/configuration_files/config_morteza.yml +0 -0
  62. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/core/__init__.py +0 -0
  63. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/core/audio_document.py +0 -0
  64. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/core/corpus.py +0 -0
  65. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/core/document.py +0 -0
  66. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/core/subject.py +0 -0
  67. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/__init__.py +0 -0
  68. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/acoustic_feature_extraction.py +0 -0
  69. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/distance_from_randomness.py +0 -0
  70. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/extract_embeddings.py +0 -0
  71. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/extract_logits.py +0 -0
  72. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/semantic_similarity.py +0 -0
  73. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/test_documents/test_features.csv +0 -0
  74. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/test_documents/wallace_1.15_3.txt +0 -0
  75. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/test_documents/wallace_1.1_3.txt +0 -0
  76. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/extraction/test_documents/wallace_1_4.txt +0 -0
  77. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/main.py +0 -0
  78. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/metrics_statistics/embeddings_metrics_statistics.py +0 -0
  79. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/praat/__init__.py +0 -0
  80. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/preprocessing/LPDS.py +0 -0
  81. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/preprocessing/__init__.py +0 -0
  82. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/preprocessing/pipeline.py +0 -0
  83. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/preprocessing/speaker_diarization.py +0 -0
  84. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/preprocessing/text_cleaner.py +0 -0
  85. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/preprocessing/text_importer.py +0 -0
  86. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/preprocessing/text_normalizer.py +0 -0
  87. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/preprocessing/text_tokenizer.py +0 -0
  88. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/sample_configuration_files/config_discourse.yml +0 -0
  89. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/sample_configuration_files/config_general.yml +0 -0
  90. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/utils/__init__.py +0 -0
  91. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/utils/csv_functions.py +0 -0
  92. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/utils/sample_usage.py +0 -0
  93. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp/utils/setup_functions.py +0 -0
  94. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp.egg-info/SOURCES.txt +0 -0
  95. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp.egg-info/dependency_links.txt +0 -0
  96. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp.egg-info/entry_points.txt +0 -0
  97. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp.egg-info/requires.txt +0 -0
  98. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pelican_nlp.egg-info/top_level.txt +0 -0
  99. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/pyproject.toml +0 -0
  100. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/requirements.txt +0 -0
  101. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/setup.cfg +0 -0
  102. {pelican_nlp-0.2.6 → pelican_nlp-0.2.7}/tests/__init__.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: pelican_nlp
3
- Version: 0.2.6
3
+ Version: 0.2.7
4
4
  Summary: Preprocessing and Extraction of Linguistic Information for Computational Analysis
5
5
  Author-email: Yves Pauli <yves.pauli@gmail.com>
6
6
  License-Expression: CC-BY-NC-4.0
@@ -69,7 +69,7 @@ Create conda environment
69
69
 
70
70
  .. code-block:: bash
71
71
 
72
- conda create -n pelican-nlp python=3.10
72
+ conda create -n pelican-nlp -c defaults python=3.10
73
73
 
74
74
  Activate environment
75
75
 
@@ -157,7 +157,7 @@ Features
157
157
  Examples
158
158
  ========
159
159
 
160
- You can find example setups on the github repository in the 'examples` folder: https://github.com/ypauli/pelican_nlp/tree/main/examples
160
+ You can find example setups on the github repository in the `examples <https://github.com/ypauli/pelican_nlp/tree/main/examples>`_ folder:
161
161
 
162
162
  Contributing
163
163
  ============
@@ -23,7 +23,7 @@ Create conda environment
23
23
 
24
24
  .. code-block:: bash
25
25
 
26
- conda create -n pelican-nlp python=3.10
26
+ conda create -n pelican-nlp -c defaults python=3.10
27
27
 
28
28
  Activate environment
29
29
 
@@ -111,7 +111,7 @@ Features
111
111
  Examples
112
112
  ========
113
113
 
114
- You can find example setups on the github repository in the 'examples` folder: https://github.com/ypauli/pelican_nlp/tree/main/examples
114
+ You can find example setups on the github repository in the `examples <https://github.com/ypauli/pelican_nlp/tree/main/examples>`_ folder:
115
115
 
116
116
  Contributing
117
117
  ============
@@ -5,7 +5,6 @@ discourse: &discourse_flag true
5
5
  #=====================================
6
6
 
7
7
  #general configurations; always adapt
8
- PATH_TO_PROJECT_FOLDER: "/home/yvespauli/PycharmProjects/PyPI_testing_discourse"
9
8
  language: "german" # Possibly add options for German and English
10
9
 
11
10
  task_name: "interview" # Give name of task used for creation of the input file (e.g., ['fluency', 'interview'])
@@ -4,7 +4,6 @@
4
4
  # Basic Settings
5
5
  # -------------
6
6
  input_file: "text" # Options: 'text' or 'audio'
7
- PATH_TO_PROJECT_FOLDER: "/home/yvespauli/PycharmProjects/PyPI_testing_image-descriptions"
8
7
  language: "german" # Options: 'german', 'english'
9
8
  recompute_everything: true # If false, reuses previously computed results
10
9
 
@@ -0,0 +1 @@
1
+ __version__ = "0.2.7"
@@ -1,5 +1,6 @@
1
1
  import torch
2
2
  import psutil
3
+ import os
3
4
 
4
5
  from accelerate import init_empty_weights, infer_auto_device_map, dispatch_model
5
6
  from transformers import AutoModelForCausalLM
@@ -17,8 +18,31 @@ class Model:
17
18
  if self.model_name == 'fastText':
18
19
  import fasttext
19
20
  import fasttext.util
20
- fasttext.util.download_model('de', if_exists='ignore')
21
- self.model_instance = fasttext.load_model('cc.de.300.bin')
21
+
22
+ # Create a model directory if it doesn't exist
23
+ model_dir = os.path.join(os.path.expanduser('~'), '.fasttext')
24
+ os.makedirs(model_dir, exist_ok=True)
25
+
26
+ # Set the model path using proper OS path joining
27
+ model_path = os.path.join(model_dir, 'cc.de.300.bin')
28
+
29
+ # Download only if model doesn't exist
30
+ if not os.path.exists(model_path):
31
+ try:
32
+ fasttext.util.download_model('de', if_exists='ignore')
33
+ except OSError:
34
+ # Direct download fallback for Windows
35
+ import urllib.request
36
+ url = 'https://dl.fbaipublicfiles.com/fasttext/vectors-crawl/cc.de.300.bin.gz'
37
+ urllib.request.urlretrieve(url, model_path + '.gz')
38
+ # Decompress the file
39
+ import gzip
40
+ with gzip.open(model_path + '.gz', 'rb') as f_in:
41
+ with open(model_path, 'wb') as f_out:
42
+ f_out.write(f_in.read())
43
+ os.remove(model_path + '.gz')
44
+
45
+ self.model_instance = fasttext.load_model(model_path)
22
46
  print('FastText model loaded.')
23
47
  elif self.model_name == 'xlm-roberta-base':
24
48
  from transformers import AutoModel
@@ -5,7 +5,6 @@ fluency_task: &fluency_flag true
5
5
  #========================================
6
6
 
7
7
  #general configurations; always adapt
8
- PATH_TO_PROJECT_FOLDER: "/home/yvespauli/PycharmProjects/pelican_testing"
9
8
  language: "german"
10
9
  multiple_sessions: &session_flag false
11
10
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: pelican_nlp
3
- Version: 0.2.6
3
+ Version: 0.2.7
4
4
  Summary: Preprocessing and Extraction of Linguistic Information for Computational Analysis
5
5
  Author-email: Yves Pauli <yves.pauli@gmail.com>
6
6
  License-Expression: CC-BY-NC-4.0
@@ -69,7 +69,7 @@ Create conda environment
69
69
 
70
70
  .. code-block:: bash
71
71
 
72
- conda create -n pelican-nlp python=3.10
72
+ conda create -n pelican-nlp -c defaults python=3.10
73
73
 
74
74
  Activate environment
75
75
 
@@ -157,7 +157,7 @@ Features
157
157
  Examples
158
158
  ========
159
159
 
160
- You can find example setups on the github repository in the 'examples` folder: https://github.com/ypauli/pelican_nlp/tree/main/examples
160
+ You can find example setups on the github repository in the `examples <https://github.com/ypauli/pelican_nlp/tree/main/examples>`_ folder:
161
161
 
162
162
  Contributing
163
163
  ============
@@ -1 +0,0 @@
1
- __version__ = "0.2.6"
File without changes
File without changes
File without changes
File without changes