baran 0.1.7 → 0.1.9

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: c2f275e2741118e6b0505c9f3ae20d195ca082b9338f28dd9e5fee3899b6d3a5
4
- data.tar.gz: e0eaa0d7e56895c59ab33028f88efd5157a7c091bfb508d35f8cbd19fddf78c1
3
+ metadata.gz: 51599bea086ef467f089b64f9252aa87a881c1889c776219695cec4922318be8
4
+ data.tar.gz: b9c20815e90bf477c8b98b3fb2580013c791dcf1a387332552bf51ae33882768
5
5
  SHA512:
6
- metadata.gz: 76da807e98e3ee3c8c11146b9fd960ad7e254eb8e185eaabda1cf43b524b63a70916eee29e5b698e6a90fae9ae7c5c638729f5b20299a5842e2a2780b41ce890
7
- data.tar.gz: ae3d9ff9180cebb6ee57ab85f2c04239497ed0fd7713042cdc30dc3f8ca603457a3554b4ac05e0d7272293a928c27997172bdaa5562443252b8a9b81faf827a4
6
+ metadata.gz: 8add731f1eb06baa85e7bfe495f11ce58be02b8ca6947f3f0bbfc1d7ac85cad3b693d24dc7f4f9124e5a357f784d5f42eb6875e36d7d2fb1aac09dda22dd8862
7
+ data.tar.gz: 54e8924c8c2c86f524805b99cbeab0bb77a2784d72191fd35857def7450f9e9389176a63d684c4346c17787ad34bd7f3c9155b3803a6be2d0b22de24691a9ed2
data/Gemfile CHANGED
@@ -5,6 +5,6 @@ source "https://rubygems.org"
5
5
  # Specify your gem's dependencies in baran.gemspec
6
6
  gemspec
7
7
 
8
- gem "minitest", "~> 5.18"
8
+ gem "minitest", "~> 5.20"
9
9
 
10
10
  gem "rake", "~> 13.0"
data/Gemfile.lock CHANGED
@@ -1,12 +1,12 @@
1
1
  PATH
2
2
  remote: .
3
3
  specs:
4
- baran (0.1.7)
4
+ baran (0.1.9)
5
5
 
6
6
  GEM
7
7
  remote: https://rubygems.org/
8
8
  specs:
9
- minitest (5.18.1)
9
+ minitest (5.20.0)
10
10
  rake (13.0.6)
11
11
 
12
12
  PLATFORMS
@@ -15,7 +15,7 @@ PLATFORMS
15
15
 
16
16
  DEPENDENCIES
17
17
  baran!
18
- minitest (~> 5.18)
18
+ minitest (~> 5.20)
19
19
  rake (~> 13.0)
20
20
 
21
21
  BUNDLED WITH
@@ -14,4 +14,4 @@ module Baran
14
14
  merged(splits, @separator)
15
15
  end
16
16
  end
17
- end
17
+ end
@@ -14,12 +14,14 @@ module Baran
14
14
  raise NotImplementedError, "splitted method should be implemented in a subclass"
15
15
  end
16
16
 
17
- def chunks(text)
17
+ def chunks(text, metadata: nil)
18
18
  cursor = 0
19
19
  chunks = []
20
20
 
21
- splitted(text).each do |chunk|
22
- chunks << { text: chunk, cursor: cursor }
21
+ splitted(text).compact.each do |chunk|
22
+ chunk = { text: chunk, cursor: cursor }
23
+ chunk[:metadata] = metadata if metadata
24
+ chunks << chunk
23
25
  cursor += chunk.length
24
26
  end
25
27
 
@@ -56,4 +58,4 @@ module Baran
56
58
  results
57
59
  end
58
60
  end
59
- end
61
+ end
data/lib/baran/version.rb CHANGED
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module Baran
4
- VERSION = "0.1.7"
4
+ VERSION = "0.1.9"
5
5
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: baran
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.7
4
+ version: 0.1.9
5
5
  platform: ruby
6
6
  authors:
7
7
  - Moeki Kawakami
8
8
  autorequire:
9
9
  bindir: exe
10
10
  cert_chain: []
11
- date: 2023-07-10 00:00:00.000000000 Z
11
+ date: 2023-09-26 00:00:00.000000000 Z
12
12
  dependencies: []
13
13
  description: Text Splitter for Large Language Model Datasets.
14
14
  email: