dejunk 0.2.0 → 0.3.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/dejunk.gemspec +1 -0
- data/lib/dejunk.rb +1 -4
- data/lib/dejunk/version.rb +1 -1
- metadata +5 -5
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 1c27554d9b8b375cd041796a404ea48e28c6c9ce2a772f27af21e83f78117cd8
|
4
|
+
data.tar.gz: 5464e9f63e8b3729f155280bbb167baf1810549b3f05e8d9343f6f8c16c0d420
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 5c425a21416fe2532e665cb9b10b8fbf081134ab6705f4b60b2487104b043e6120aa0cab2bc77832b231c631795b2bd8a5124184c96d861b7d28f3d7abf1336e
|
7
|
+
data.tar.gz: 37cedff6a300bab1c2dc75fbdae68473b44c2fbf688f78f0811194de812bf47e8e2d278b4f7cd279ec6af1cf17f40e0f05dc83c2b299f3a2b7cdaeba13195d6e
|
data/dejunk.gemspec
CHANGED
data/lib/dejunk.rb
CHANGED
@@ -146,7 +146,7 @@ module Dejunk
|
|
146
146
|
def normalize_for_comparison(string)
|
147
147
|
string.
|
148
148
|
mb_chars.
|
149
|
-
|
149
|
+
unicode_normalize(:nfkd).
|
150
150
|
gsub(/\p{Mn}+/, ''.freeze).
|
151
151
|
gsub(/[^[:alnum:]]+/, ''.freeze).
|
152
152
|
downcase
|
@@ -229,9 +229,6 @@ module Dejunk
|
|
229
229
|
def mashing_probability(bigram)
|
230
230
|
if (f = mashing_bigram_frequencies[bigram])
|
231
231
|
f
|
232
|
-
elsif f =~ /[a-z]{2}/i
|
233
|
-
# 26**2 = 676, so 1 in 2k seems a reasonable probability for an arbitrary two-letter bigram given mashing
|
234
|
-
0.0005
|
235
232
|
else
|
236
233
|
# An arbitrary (non-ASCII) bigram with mashing is slightly more probable than with legit strings
|
237
234
|
1e-6
|
data/lib/dejunk/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: dejunk
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.2.0
|
4
|
+
version: 0.3.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- David Judd
|
8
8
|
autorequire:
|
9
9
|
bindir: exe
|
10
10
|
cert_chain: []
|
11
|
-
date:
|
11
|
+
date: 2020-08-07 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: activesupport
|
@@ -96,16 +96,16 @@ require_paths:
|
|
96
96
|
- lib
|
97
97
|
required_ruby_version: !ruby/object:Gem::Requirement
|
98
98
|
requirements:
|
99
|
-
- - "
|
99
|
+
- - "~>"
|
100
100
|
- !ruby/object:Gem::Version
|
101
|
-
version: '
|
101
|
+
version: '2.3'
|
102
102
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
103
103
|
requirements:
|
104
104
|
- - ">="
|
105
105
|
- !ruby/object:Gem::Version
|
106
106
|
version: '0'
|
107
107
|
requirements: []
|
108
|
-
rubygems_version: 3.0.
|
108
|
+
rubygems_version: 3.0.3
|
109
109
|
signing_key:
|
110
110
|
specification_version: 4
|
111
111
|
summary: Detect keyboard mashing and other junk in your data.
|