kreuzberg 4.5.2-aarch64-linux → 4.5.4-aarch64-linux
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/Gemfile.lock +2 -2
- data/README.md +4 -4
- data/lib/kreuzberg/config.rb +5 -3
- data/lib/kreuzberg/version.rb +1 -1
- data/lib/kreuzberg_rb.so +0 -0
- data/sig/kreuzberg.rbs +2 -1
- metadata +2 -2
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: dfd3586f04b1b2b6dcdf06af30712755fd3fd8d76c7bc03cee05a67133134998
|
|
4
|
+
data.tar.gz: c402149a2765063da19d639eb2aa2b75340db6292b680c9218bc826d5997346c
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: aa8f6ba036c180200182377b90b15f293cf008b440c49d732d5dfa84df203373b173b9928138d58917fd7dddfe41c3b4ea89cab582c69707253ed87163932349
|
|
7
|
+
data.tar.gz: 211e120a58693b5c385ff0c577391d542a4ee9ca3e1194ca96e2e975a2636d78cdf9526b25852dad70d543142576317c2b344260f83148143d4d9ab6ac6822bd
|
data/Gemfile.lock
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
PATH
|
|
2
2
|
remote: .
|
|
3
3
|
specs:
|
|
4
|
-
kreuzberg (4.5.2)
|
|
4
|
+
kreuzberg (4.5.4)
|
|
5
5
|
rb_sys (~> 0.9.119)
|
|
6
6
|
sorbet-runtime (~> 0.5)
|
|
7
7
|
|
|
@@ -222,7 +222,7 @@ CHECKSUMS
|
|
|
222
222
|
io-console (0.8.2) sha256=d6e3ae7a7cc7574f4b8893b4fca2162e57a825b223a177b7afa236c5ef9814cc
|
|
223
223
|
json (2.19.2) sha256=e7e1bd318b2c37c4ceee2444841c86539bc462e81f40d134cf97826cb14e83cf
|
|
224
224
|
json-schema (6.2.0) sha256=e8bff46ed845a22c1ab2bd0d7eccf831c01fe23bb3920caa4c74db4306813666
|
|
225
|
-
kreuzberg (4.5.2)
|
|
225
|
+
kreuzberg (4.5.4)
|
|
226
226
|
language_server-protocol (3.17.0.5) sha256=fd1e39a51a28bf3eec959379985a72e296e9f9acfce46f6a79d31ca8760803cc
|
|
227
227
|
lint_roller (1.1.0) sha256=2c0c845b632a7d172cb849cc90c1bce937a28c5c8ccccb50dfd46a485003cc87
|
|
228
228
|
listen (3.10.0) sha256=c6e182db62143aeccc2e1960033bebe7445309c7272061979bb098d03760c9d2
|
data/README.md
CHANGED
|
@@ -22,7 +22,7 @@
|
|
|
22
22
|
<img src="https://img.shields.io/maven-central/v/dev.kreuzberg/kreuzberg?label=Java&color=007ec6" alt="Java">
|
|
23
23
|
</a>
|
|
24
24
|
<a href="https://github.com/kreuzberg-dev/kreuzberg/releases">
|
|
25
|
-
<img src="https://img.shields.io/github/v/tag/kreuzberg-dev/kreuzberg?label=Go&color=007ec6&filter=v4.5.2" alt="Go">
|
|
25
|
+
<img src="https://img.shields.io/github/v/tag/kreuzberg-dev/kreuzberg?label=Go&color=007ec6&filter=v4.5.4" alt="Go">
|
|
26
26
|
</a>
|
|
27
27
|
<a href="https://www.nuget.org/packages/Kreuzberg/">
|
|
28
28
|
<img src="https://img.shields.io/nuget/v/Kreuzberg?label=C%23&color=007ec6" alt="C#">
|
|
@@ -61,7 +61,7 @@
|
|
|
61
61
|
</div>
|
|
62
62
|
|
|
63
63
|
|
|
64
|
-
Extract text, tables, images, and metadata from
|
|
64
|
+
Extract text, tables, images, and metadata from 91+ file formats including PDF, Office documents, and images. Ruby bindings with idiomatic Ruby API and native performance.
|
|
65
65
|
|
|
66
66
|
|
|
67
67
|
## Installation
|
|
@@ -211,9 +211,9 @@ puts "Processing time: #{result.metadata&.dig('processing_time')}ms"
|
|
|
211
211
|
|
|
212
212
|
## Features
|
|
213
213
|
|
|
214
|
-
### Supported File Formats (
|
|
214
|
+
### Supported File Formats (91+)
|
|
215
215
|
|
|
216
|
-
|
|
216
|
+
91+ file formats across 8 major categories with intelligent format detection and comprehensive metadata extraction.
|
|
217
217
|
|
|
218
218
|
#### Office Documents
|
|
219
219
|
|
data/lib/kreuzberg/config.rb
CHANGED
|
@@ -850,19 +850,21 @@ module Kreuzberg
|
|
|
850
850
|
# )
|
|
851
851
|
#
|
|
852
852
|
class LayoutDetection
|
|
853
|
-
attr_reader :preset, :confidence_threshold, :apply_heuristics
|
|
853
|
+
attr_reader :preset, :confidence_threshold, :apply_heuristics, :table_model
|
|
854
854
|
|
|
855
|
-
def initialize(preset: 'fast', confidence_threshold: nil, apply_heuristics: true)
|
|
855
|
+
def initialize(preset: 'fast', confidence_threshold: nil, apply_heuristics: true, table_model: nil)
|
|
856
856
|
@preset = preset.to_s
|
|
857
857
|
@confidence_threshold = confidence_threshold&.to_f
|
|
858
858
|
@apply_heuristics = apply_heuristics ? true : false
|
|
859
|
+
@table_model = table_model&.to_s
|
|
859
860
|
end
|
|
860
861
|
|
|
861
862
|
def to_h
|
|
862
863
|
{
|
|
863
864
|
preset: @preset,
|
|
864
865
|
confidence_threshold: @confidence_threshold,
|
|
865
|
-
apply_heuristics: @apply_heuristics
|
|
866
|
+
apply_heuristics: @apply_heuristics,
|
|
867
|
+
table_model: @table_model
|
|
866
868
|
}.compact
|
|
867
869
|
end
|
|
868
870
|
end
|
data/lib/kreuzberg/version.rb
CHANGED
data/lib/kreuzberg_rb.so
CHANGED
|
Binary file
|
data/sig/kreuzberg.rbs
CHANGED
|
@@ -463,8 +463,9 @@ module Kreuzberg
|
|
|
463
463
|
attr_reader preset: String
|
|
464
464
|
attr_reader confidence_threshold: Float?
|
|
465
465
|
attr_reader apply_heuristics: bool
|
|
466
|
+
attr_reader table_model: String?
|
|
466
467
|
|
|
467
|
-
def initialize: (?preset: String, ?confidence_threshold: Float?, ?apply_heuristics: bool) -> void
|
|
468
|
+
def initialize: (?preset: String, ?confidence_threshold: Float?, ?apply_heuristics: bool, ?table_model: String?) -> void
|
|
468
469
|
def to_h: () -> Hash[Symbol, untyped]
|
|
469
470
|
end
|
|
470
471
|
|
metadata
CHANGED
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: kreuzberg
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 4.5.2
|
|
4
|
+
version: 4.5.4
|
|
5
5
|
platform: aarch64-linux
|
|
6
6
|
authors:
|
|
7
7
|
- Na'aman Hirschfeld
|
|
8
8
|
autorequire:
|
|
9
9
|
bindir: exe
|
|
10
10
|
cert_chain: []
|
|
11
|
-
date: 2026-03-
|
|
11
|
+
date: 2026-03-23 00:00:00.000000000 Z
|
|
12
12
|
dependencies:
|
|
13
13
|
- !ruby/object:Gem::Dependency
|
|
14
14
|
name: bundler
|