bm25 0.1.3 → 0.1.4
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/Gemfile.lock +1 -1
- data/lib/bm25/parser.rb +3 -0
- data/lib/bm25/stopword.txt +2 -18
- data/lib/bm25/utils.rb +2 -2
- data/lib/bm25/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 3cb66896c835cefd13368e83f874fb6a0d3667bade74c27e3f069685fade9abc
|
4
|
+
data.tar.gz: 40b158e69b60560e880fc40ffab05b01066fe3e49ade003b1bda51bb920fd09e
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 301214a74bb46d76161264e1f767dd34d09216734b17cb55ad955eda0e741a648dc259778b24eb9bcfa51b8659a60a7bf310044992e626ceaa3e5187fa405bd9
|
7
|
+
data.tar.gz: 3b6b7938854cd8eba7581599f107f17f7fc7234923c36c96fc07f1fb800f178bdbbce08710692481ef561859475bbd59b8eddc59a1a5135aa6667f47b4ce9302
|
data/Gemfile.lock
CHANGED
data/lib/bm25/parser.rb
CHANGED
data/lib/bm25/stopword.txt
CHANGED
@@ -100,16 +100,13 @@
|
|
100
100
|
よそ
|
101
101
|
わけ
|
102
102
|
わたし
|
103
|
-
|
103
|
+
けど
|
104
|
+
ので
|
104
105
|
ハイ
|
105
|
-
|
106
|
-
|
107
106
|
上
|
108
107
|
中
|
109
108
|
下
|
110
109
|
字
|
111
|
-
|
112
|
-
|
113
110
|
年
|
114
111
|
月
|
115
112
|
日
|
@@ -131,8 +128,6 @@
|
|
131
128
|
区
|
132
129
|
町
|
133
130
|
村
|
134
|
-
|
135
|
-
|
136
131
|
各
|
137
132
|
第
|
138
133
|
方
|
@@ -230,10 +225,6 @@
|
|
230
225
|
毎
|
231
226
|
式
|
232
227
|
簿
|
233
|
-
|
234
|
-
|
235
|
-
|
236
|
-
|
237
228
|
回
|
238
229
|
匹
|
239
230
|
個
|
@@ -246,21 +237,16 @@
|
|
246
237
|
円
|
247
238
|
玉
|
248
239
|
枚
|
249
|
-
|
250
240
|
前
|
251
241
|
後
|
252
242
|
左
|
253
243
|
右
|
254
244
|
次
|
255
245
|
先
|
256
|
-
|
257
246
|
春
|
258
247
|
夏
|
259
248
|
秋
|
260
249
|
冬
|
261
|
-
|
262
|
-
|
263
|
-
|
264
250
|
一
|
265
251
|
二
|
266
252
|
三
|
@@ -276,8 +262,6 @@
|
|
276
262
|
万
|
277
263
|
億
|
278
264
|
兆
|
279
|
-
|
280
|
-
|
281
265
|
下記
|
282
266
|
上記
|
283
267
|
時間
|
data/lib/bm25/utils.rb
CHANGED
@@ -6,8 +6,8 @@ module Bm25
|
|
6
6
|
|
7
7
|
def is_stopword? (word)
|
8
8
|
match = false
|
9
|
-
|
10
|
-
File.open(
|
9
|
+
stopword_path = File.join( File.dirname(__FILE__), 'stopword.txt' )
|
10
|
+
File.open(stopword_path, "r") do |f|
|
11
11
|
f.each_line do |t|
|
12
12
|
if t.chomp === word
|
13
13
|
match = true
|
data/lib/bm25/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: bm25
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.1.3
|
4
|
+
version: 0.1.4
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Masayuki Komatsu
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2018-03-
|
11
|
+
date: 2018-03-28 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: bundler
|