lopace 0.1.6.dev2__tar.gz → 0.1.6.dev3__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/PKG-INFO +1 -1
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/lopace/_version.py +3 -3
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/lopace/compressor.py +5 -3
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/lopace.egg-info/PKG-INFO +1 -1
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/lopace.egg-info/SOURCES.txt +6 -0
- lopace-0.1.6.dev3/screenshots/benchmark_data.csv +1159 -0
- lopace-0.1.6.dev3/screenshots/comprehensive_comparison.png +0 -0
- lopace-0.1.6.dev3/screenshots/comprehensive_comparison.svg +787 -0
- lopace-0.1.6.dev3/screenshots/compression_ratio.png +0 -0
- lopace-0.1.6.dev3/screenshots/compression_ratio.svg +1995 -0
- lopace-0.1.6.dev3/screenshots/dataset_analysis.csv +387 -0
- lopace-0.1.6.dev3/screenshots/dataset_eda.png +0 -0
- lopace-0.1.6.dev3/screenshots/dataset_eda.svg +1650 -0
- lopace-0.1.6.dev3/screenshots/dataset_percentiles.png +0 -0
- lopace-0.1.6.dev3/screenshots/dataset_percentiles.svg +343 -0
- lopace-0.1.6.dev3/screenshots/dataset_statistics.json +28 -0
- lopace-0.1.6.dev3/screenshots/disk_size_comparison.png +0 -0
- lopace-0.1.6.dev3/screenshots/disk_size_comparison.svg +18020 -0
- lopace-0.1.6.dev3/screenshots/memory_usage.png +0 -0
- lopace-0.1.6.dev3/screenshots/memory_usage.svg +3217 -0
- lopace-0.1.6.dev3/screenshots/original_vs_decompressed.png +0 -0
- lopace-0.1.6.dev3/screenshots/original_vs_decompressed.svg +3361 -0
- lopace-0.1.6.dev3/screenshots/scalability_analysis.png +0 -0
- lopace-0.1.6.dev3/screenshots/scalability_analysis.svg +9888 -0
- lopace-0.1.6.dev3/screenshots/space_savings.png +0 -0
- lopace-0.1.6.dev3/screenshots/space_savings.svg +433 -0
- lopace-0.1.6.dev3/screenshots/speed_metrics.png +0 -0
- lopace-0.1.6.dev3/screenshots/speed_metrics.svg +6185 -0
- lopace-0.1.6.dev3/scripts/generate_visualizations.py +845 -0
- lopace-0.1.6.dev2/screenshots/benchmark_data.csv +0 -31
- lopace-0.1.6.dev2/screenshots/comprehensive_comparison.png +0 -0
- lopace-0.1.6.dev2/screenshots/comprehensive_comparison.svg +0 -961
- lopace-0.1.6.dev2/screenshots/compression_ratio.png +0 -0
- lopace-0.1.6.dev2/screenshots/compression_ratio.svg +0 -546
- lopace-0.1.6.dev2/screenshots/disk_size_comparison.png +0 -0
- lopace-0.1.6.dev2/screenshots/disk_size_comparison.svg +0 -576
- lopace-0.1.6.dev2/screenshots/memory_usage.png +0 -0
- lopace-0.1.6.dev2/screenshots/memory_usage.svg +0 -721
- lopace-0.1.6.dev2/screenshots/original_vs_decompressed.png +0 -0
- lopace-0.1.6.dev2/screenshots/original_vs_decompressed.svg +0 -2804
- lopace-0.1.6.dev2/screenshots/scalability_analysis.png +0 -0
- lopace-0.1.6.dev2/screenshots/scalability_analysis.svg +0 -1267
- lopace-0.1.6.dev2/screenshots/space_savings.png +0 -0
- lopace-0.1.6.dev2/screenshots/space_savings.svg +0 -397
- lopace-0.1.6.dev2/screenshots/speed_metrics.png +0 -0
- lopace-0.1.6.dev2/screenshots/speed_metrics.svg +0 -1044
- lopace-0.1.6.dev2/scripts/generate_visualizations.py +0 -948
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/.dockerignore +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/.github/dependabot.yml +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/.github/pull_request_template.md +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/.github/workflows/ci-cd.yml +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/.github/workflows/test-only.yml +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/.gitignore +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/CHANGELOG.md +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/CODE_OF_CONDUCT.md +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/CONTRIBUTING.md +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/Dockerfile +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/LICENSE +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/MANIFEST.in +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/README.md +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/SECURITY.md +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/lopace/__init__.py +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/lopace.egg-info/dependency_links.txt +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/lopace.egg-info/requires.txt +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/lopace.egg-info/top_level.txt +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/notebooks/LoPace_Complete_Guide.ipynb +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/notebooks/README.md +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/paper/lopace-preprint-arxiv-01.png +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/paper/lopace-preprint-arxiv.pdf +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/pyproject.toml +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/requirements-dev.txt +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/requirements.txt +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/screenshots/.gitkeep +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/screenshots/compression-pipeline.png +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/screenshots/logo-text.png +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/screenshots/logo.png +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/screenshots/lopace-compression-technique.png +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/scripts/README.md +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/scripts/__init__.py +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/scripts/requirements.txt +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/setup.cfg +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/setup.py +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/streamlit_app.py +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/tests/__init__.py +0 -0
- {lopace-0.1.6.dev2 → lopace-0.1.6.dev3}/tests/test_compressor.py +0 -0
|
@@ -28,7 +28,7 @@ version_tuple: VERSION_TUPLE
|
|
|
28
28
|
commit_id: COMMIT_ID
|
|
29
29
|
__commit_id__: COMMIT_ID
|
|
30
30
|
|
|
31
|
-
__version__ = version = '0.1.6.
|
|
32
|
-
__version_tuple__ = version_tuple = (0, 1, 6, '
|
|
31
|
+
__version__ = version = '0.1.6.dev3'
|
|
32
|
+
__version_tuple__ = version_tuple = (0, 1, 6, 'dev3')
|
|
33
33
|
|
|
34
|
-
__commit_id__ = commit_id = '
|
|
34
|
+
__commit_id__ = commit_id = 'gb8dad2406'
|
|
@@ -126,7 +126,8 @@ class PromptCompressor:
|
|
|
126
126
|
>>> original = compressor.decompress_token(compressed)
|
|
127
127
|
"""
|
|
128
128
|
# Step 1: Convert text to list of token IDs
|
|
129
|
-
|
|
129
|
+
# Allow special tokens to be encoded as normal text (disable the check)
|
|
130
|
+
token_ids = list(self.tokenizer.encode(text, disallowed_special=())) # Ensure it's a list
|
|
130
131
|
|
|
131
132
|
if not token_ids:
|
|
132
133
|
# Empty token list - return just format byte
|
|
@@ -221,7 +222,8 @@ class PromptCompressor:
|
|
|
221
222
|
>>> original = compressor.decompress_hybrid(compressed)
|
|
222
223
|
"""
|
|
223
224
|
# Step 1: Tokenize
|
|
224
|
-
tokens
|
|
225
|
+
# Allow special tokens to be encoded as normal text (disable the check)
|
|
226
|
+
tokens = list(self.tokenizer.encode(text, disallowed_special=())) # Ensure it's a list
|
|
225
227
|
|
|
226
228
|
if not tokens:
|
|
227
229
|
# Empty token list - return compressed empty data
|
|
@@ -393,7 +395,7 @@ class PromptCompressor:
|
|
|
393
395
|
original_size = len(text.encode('utf-8'))
|
|
394
396
|
stats = {
|
|
395
397
|
'original_size_bytes': original_size,
|
|
396
|
-
'original_size_tokens': len(self.tokenizer.encode(text)),
|
|
398
|
+
'original_size_tokens': len(self.tokenizer.encode(text, disallowed_special=())),
|
|
397
399
|
'methods': {}
|
|
398
400
|
}
|
|
399
401
|
|
|
@@ -38,6 +38,12 @@ screenshots/comprehensive_comparison.svg
|
|
|
38
38
|
screenshots/compression-pipeline.png
|
|
39
39
|
screenshots/compression_ratio.png
|
|
40
40
|
screenshots/compression_ratio.svg
|
|
41
|
+
screenshots/dataset_analysis.csv
|
|
42
|
+
screenshots/dataset_eda.png
|
|
43
|
+
screenshots/dataset_eda.svg
|
|
44
|
+
screenshots/dataset_percentiles.png
|
|
45
|
+
screenshots/dataset_percentiles.svg
|
|
46
|
+
screenshots/dataset_statistics.json
|
|
41
47
|
screenshots/disk_size_comparison.png
|
|
42
48
|
screenshots/disk_size_comparison.svg
|
|
43
49
|
screenshots/logo-text.png
|