cognigraph-chunker 2.2.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (111) hide show
  1. cognigraph_chunker-2.2.0/.dockerignore +8 -0
  2. cognigraph_chunker-2.2.0/.gitignore +10 -0
  3. cognigraph_chunker-2.2.0/Cargo.lock +3507 -0
  4. cognigraph_chunker-2.2.0/Cargo.toml +100 -0
  5. cognigraph_chunker-2.2.0/Dockerfile +71 -0
  6. cognigraph_chunker-2.2.0/LICENSE +21 -0
  7. cognigraph_chunker-2.2.0/PKG-INFO +61 -0
  8. cognigraph_chunker-2.2.0/README.md +1282 -0
  9. cognigraph_chunker-2.2.0/benches/chunking.rs +425 -0
  10. cognigraph_chunker-2.2.0/packages/python/Cargo.toml +19 -0
  11. cognigraph_chunker-2.2.0/packages/python/README.md +40 -0
  12. cognigraph_chunker-2.2.0/packages/python/src/adaptive.rs +281 -0
  13. cognigraph_chunker-2.2.0/packages/python/src/chunker.rs +69 -0
  14. cognigraph_chunker-2.2.0/packages/python/src/cognitive.rs +218 -0
  15. cognigraph_chunker-2.2.0/packages/python/src/enriched.rs +205 -0
  16. cognigraph_chunker-2.2.0/packages/python/src/error.rs +8 -0
  17. cognigraph_chunker-2.2.0/packages/python/src/intent.rs +210 -0
  18. cognigraph_chunker-2.2.0/packages/python/src/lib.rs +100 -0
  19. cognigraph_chunker-2.2.0/packages/python/src/merge.rs +43 -0
  20. cognigraph_chunker-2.2.0/packages/python/src/quality_metrics.rs +224 -0
  21. cognigraph_chunker-2.2.0/packages/python/src/semantic/mod.rs +166 -0
  22. cognigraph_chunker-2.2.0/packages/python/src/semantic/providers.rs +51 -0
  23. cognigraph_chunker-2.2.0/packages/python/src/signal.rs +127 -0
  24. cognigraph_chunker-2.2.0/packages/python/src/splitter.rs +80 -0
  25. cognigraph_chunker-2.2.0/packages/python/src/topo.rs +161 -0
  26. cognigraph_chunker-2.2.0/pyproject.toml +31 -0
  27. cognigraph_chunker-2.2.0/renovate.json +6 -0
  28. cognigraph_chunker-2.2.0/src/api/adaptive.rs +137 -0
  29. cognigraph_chunker-2.2.0/src/api/chunk.rs +70 -0
  30. cognigraph_chunker-2.2.0/src/api/cognitive.rs +369 -0
  31. cognigraph_chunker-2.2.0/src/api/enriched.rs +130 -0
  32. cognigraph_chunker-2.2.0/src/api/errors.rs +99 -0
  33. cognigraph_chunker-2.2.0/src/api/evaluate.rs +82 -0
  34. cognigraph_chunker-2.2.0/src/api/health.rs +8 -0
  35. cognigraph_chunker-2.2.0/src/api/intent.rs +152 -0
  36. cognigraph_chunker-2.2.0/src/api/merge.rs +59 -0
  37. cognigraph_chunker-2.2.0/src/api/mod.rs +184 -0
  38. cognigraph_chunker-2.2.0/src/api/provider.rs +75 -0
  39. cognigraph_chunker-2.2.0/src/api/semantic.rs +294 -0
  40. cognigraph_chunker-2.2.0/src/api/split.rs +73 -0
  41. cognigraph_chunker-2.2.0/src/api/topo.rs +157 -0
  42. cognigraph_chunker-2.2.0/src/api/types.rs +93 -0
  43. cognigraph_chunker-2.2.0/src/api/validation.rs +130 -0
  44. cognigraph_chunker-2.2.0/src/cli/adaptive_cmd.rs +259 -0
  45. cognigraph_chunker-2.2.0/src/cli/chunk_cmd.rs +95 -0
  46. cognigraph_chunker-2.2.0/src/cli/cognitive_cmd.rs +484 -0
  47. cognigraph_chunker-2.2.0/src/cli/enriched_cmd.rs +189 -0
  48. cognigraph_chunker-2.2.0/src/cli/global_opts.rs +83 -0
  49. cognigraph_chunker-2.2.0/src/cli/intent_cmd.rs +235 -0
  50. cognigraph_chunker-2.2.0/src/cli/merge_opts.rs +67 -0
  51. cognigraph_chunker-2.2.0/src/cli/mod.rs +47 -0
  52. cognigraph_chunker-2.2.0/src/cli/semantic_cmd.rs +168 -0
  53. cognigraph_chunker-2.2.0/src/cli/serve_cmd.rs +128 -0
  54. cognigraph_chunker-2.2.0/src/cli/split_cmd.rs +101 -0
  55. cognigraph_chunker-2.2.0/src/cli/topo_cmd.rs +165 -0
  56. cognigraph_chunker-2.2.0/src/config.rs +167 -0
  57. cognigraph_chunker-2.2.0/src/core/chunk.rs +481 -0
  58. cognigraph_chunker-2.2.0/src/core/delim.rs +453 -0
  59. cognigraph_chunker-2.2.0/src/core/merge.rs +175 -0
  60. cognigraph_chunker-2.2.0/src/core/mod.rs +21 -0
  61. cognigraph_chunker-2.2.0/src/core/savgol.rs +422 -0
  62. cognigraph_chunker-2.2.0/src/core/split.rs +484 -0
  63. cognigraph_chunker-2.2.0/src/embeddings/cloudflare.rs +265 -0
  64. cognigraph_chunker-2.2.0/src/embeddings/mod.rs +367 -0
  65. cognigraph_chunker-2.2.0/src/embeddings/oauth.rs +202 -0
  66. cognigraph_chunker-2.2.0/src/embeddings/oauth_token.rs +171 -0
  67. cognigraph_chunker-2.2.0/src/embeddings/ollama.rs +229 -0
  68. cognigraph_chunker-2.2.0/src/embeddings/onnx.rs +226 -0
  69. cognigraph_chunker-2.2.0/src/embeddings/openai.rs +116 -0
  70. cognigraph_chunker-2.2.0/src/embeddings/reranker.rs +761 -0
  71. cognigraph_chunker-2.2.0/src/http_util.rs +189 -0
  72. cognigraph_chunker-2.2.0/src/lib.rs +8 -0
  73. cognigraph_chunker-2.2.0/src/llm/enrichment.rs +185 -0
  74. cognigraph_chunker-2.2.0/src/llm/intents.rs +100 -0
  75. cognigraph_chunker-2.2.0/src/llm/mod.rs +182 -0
  76. cognigraph_chunker-2.2.0/src/llm/relations.rs +182 -0
  77. cognigraph_chunker-2.2.0/src/llm/synopsis.rs +45 -0
  78. cognigraph_chunker-2.2.0/src/llm/topo_agents.rs +209 -0
  79. cognigraph_chunker-2.2.0/src/main.rs +173 -0
  80. cognigraph_chunker-2.2.0/src/output.rs +62 -0
  81. cognigraph_chunker-2.2.0/src/semantic/adaptive_chunk.rs +587 -0
  82. cognigraph_chunker-2.2.0/src/semantic/adaptive_types.rs +53 -0
  83. cognigraph_chunker-2.2.0/src/semantic/blocks.rs +238 -0
  84. cognigraph_chunker-2.2.0/src/semantic/cognitive_assemble.rs +624 -0
  85. cognigraph_chunker-2.2.0/src/semantic/cognitive_rerank.rs +300 -0
  86. cognigraph_chunker-2.2.0/src/semantic/cognitive_score.rs +306 -0
  87. cognigraph_chunker-2.2.0/src/semantic/cognitive_types.rs +245 -0
  88. cognigraph_chunker-2.2.0/src/semantic/diagnostics.rs +60 -0
  89. cognigraph_chunker-2.2.0/src/semantic/enriched_chunk.rs +534 -0
  90. cognigraph_chunker-2.2.0/src/semantic/enriched_types.rs +46 -0
  91. cognigraph_chunker-2.2.0/src/semantic/enrichment/discourse.rs +172 -0
  92. cognigraph_chunker-2.2.0/src/semantic/enrichment/entities.rs +349 -0
  93. cognigraph_chunker-2.2.0/src/semantic/enrichment/heading_context.rs +182 -0
  94. cognigraph_chunker-2.2.0/src/semantic/enrichment/language.rs +359 -0
  95. cognigraph_chunker-2.2.0/src/semantic/enrichment/mod.rs +299 -0
  96. cognigraph_chunker-2.2.0/src/semantic/enrichment/multilingual_discourse.rs +736 -0
  97. cognigraph_chunker-2.2.0/src/semantic/enrichment/script_entities.rs +228 -0
  98. cognigraph_chunker-2.2.0/src/semantic/evaluation.rs +337 -0
  99. cognigraph_chunker-2.2.0/src/semantic/graph_export.rs +180 -0
  100. cognigraph_chunker-2.2.0/src/semantic/intent_chunk.rs +437 -0
  101. cognigraph_chunker-2.2.0/src/semantic/intent_types.rs +45 -0
  102. cognigraph_chunker-2.2.0/src/semantic/mod.rs +639 -0
  103. cognigraph_chunker-2.2.0/src/semantic/proposition_heal.rs +416 -0
  104. cognigraph_chunker-2.2.0/src/semantic/quality_metrics.rs +569 -0
  105. cognigraph_chunker-2.2.0/src/semantic/sentence.rs +54 -0
  106. cognigraph_chunker-2.2.0/src/semantic/sir.rs +74 -0
  107. cognigraph_chunker-2.2.0/src/semantic/topo_chunk.rs +571 -0
  108. cognigraph_chunker-2.2.0/src/semantic/topo_types.rs +60 -0
  109. cognigraph_chunker-2.2.0/tests/benchmark_comparison.rs +480 -0
  110. cognigraph_chunker-2.2.0/tests/benchmark_reranker.rs +412 -0
  111. cognigraph_chunker-2.2.0/tests/embedding_providers.rs +107 -0
@@ -0,0 +1,8 @@
1
+ target/
2
+ .git/
3
+ .env*
4
+ .claude/
5
+ models/
6
+ tests/
7
+ *.md
8
+ !Cargo.toml
@@ -0,0 +1,10 @@
1
+ /target
2
+ .env
3
+ .env.*
4
+ .idea/
5
+ .venv
6
+ models/
7
+ tests/python/.venv/
8
+ __pycache__/
9
+ planning/
10
+ scripts/