RubyGems - linkify-it-rb - Versions diffs - 0.1.0.0 → 1.0.0.2 - Mend

linkify-it-rb 0.1.0.0 → 1.0.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

checksums.yaml +4 -4
data/README.md +66 -73
data/lib/linkify-it-rb/index.rb +18 -26
data/lib/linkify-it-rb/re.rb +28 -29
data/lib/linkify-it-rb/version.rb +1 -1
data/spec/linkify-it-rb/test_spec.rb +153 -166
metadata +2 -2

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 8899eb2fafae9f6ce4105221dc2342c93de1ca5c
-  data.tar.gz: 493bb38504a90c6f6c9dfa870364758370ee548e
+  metadata.gz: 6c47469712f3d6de315f05caeca61b4c02c52a32
+  data.tar.gz: 3b51dd1d0651a17efb07cacb27df11615f17683e
 SHA512:
-  metadata.gz: 01ebcaaaa3238631990a3212f5058d69bd58b7f336576e82ac101745f25ddf7dbd948b81013eda800a388d845ab99fa23f75d2d6d90db35368d90a9b92e5f6b2
-  data.tar.gz: 0b9c9fbfe357d9b3c78c2def0bd9f51f08cb0b39335e85c8bb791d483c4e589bf3a5d860357584591e3fe8277f6226310dff04a5235ed0c783472d7ac7803663
+  metadata.gz: 5ace911d1c5873013966ad4c0438e6d933270d126adf686d2544205b906bd2364fd4290b5585967fa06716798061943161af029d3ece148809eef4f47261fa54
+  data.tar.gz: 3c3fdf523803ce1641a40ae659fd8d40508469f44843c2d435ef4fc775c7bc6423638a8c32c66cd03f149b3df35f48ea46671e799b0f2c42af61dbfc6299451f

data/README.md CHANGED

@@ -1,115 +1,108 @@
 # linkify-it-rb
-Links recognition library with FULL unicode support. Focused on high quality link patterns detection in plain text.  For use with both Ruby and RubyMotion.
+[![Gem Version](https://badge.fury.io/rb/linkify-it-rb.svg)](http://badge.fury.io/rb/linkify-it-rb)
+Links recognition library with full unicode support. Focused on high quality link pattern detection in plain text.  For use with both Ruby and RubyMotion.
 This gem is a port of the [linkify-it javascript package](https://github.com/markdown-it/linkify-it) by Vitaly Puzrin, that is used for the [markdown-it](https://github.com/markdown-it/markdown-it) package.
 __[Javascript Demo](http://markdown-it.github.io/linkify-it/)__
-_Note:_ This gem is still in progress - some of the Unicode support is still being worked on.
+Features:
+- Full unicode support, with astral characters
+- International domain support
+- Allows rules extension & custom normalizers
-## To be updated: Original Javascript package documentation
-Why it's awesome:
+Install
+-------
-- Full unicode support, _with astral characters_!
-- International domains support.
-- Allows rules extension & custom normalizers.
+### Ruby
+Add it to your project's `Gemfile`
-Install
--------
+	gem 'linkify-it-rb'
-```bash
-npm install linkify-it --save
-```
+and run `bundle install`
+### RubyMotion
-Browserification is also supported.
+Add it to your project's `Gemfile`
+	gem 'linkify-it-rb'
+Edit your `Rakefile` and add
+	require 'linkify-it-rb'
+and run `bundle install`
 Usage examples
 --------------
 ##### Example 1
-```js
-var linkify = require('linkify-it')();
-// Reload full tlds list & add uniffocial `.onion` domain.
-linkify
-  .tlds(require('tlds'))          // Reload with full tlds list
-  .tlds('.onion', true);          // Add uniffocial `.onion` domain
-  .linkify.add('git:', 'http:');  // Add `git:` ptotocol as "alias"
-  .linkify.add('ftp:', null);     // Disable `ftp:` ptotocol
-console.log(linkify.test('Site github.com!'));  // true
-console.log(linkify.match('Site github.com!')); // [ {
-                                                //   schema: "",
-                                                //   index: 5,
-                                                //   lastIndex: 15,
-                                                //   raw: "github.com",
-                                                //   text: "github.com",
-                                                //   url: "http://github.com",
-                                                // } ]
+```ruby
+linkify = Linkify.new
+# Add unofficial `.mydomain` domain.
+linkify.tlds('.mydomain', true)  # Add unofficial `.mydomain` domain
+linkify.add('git:', 'http:')     # Add `git:` protocol as "alias"
+linkify.add('ftp:', nil)         # Disable `ftp:` protocol
+linkify.test('Site github.com!')
+=> true
+linkify.match('Site github.com!')
+=> [#<Linkify::Match @schema="", @index=5, @lastIndex=15, @raw="github.com", @text="github.com", @url="github.com">]
 ```
 ##### Exmple 2. Add twitter mentions handler
-```js
+```ruby
 linkify.add('@', {
-  validate: function (text, pos, self) {
-    var tail = text.slice(pos);
-    if (!self.re.twitter) {
-      self.re.twitter =  new RegExp(
-        '^([a-zA-Z0-9_]){1,15}(?!_)(?=$|' + self.re.src_ZPCcCf + ')'
-      );
-    }
-    if (self.re.twitter.test(tail)) {
-      // Linkifier allows punctuation chars before prefix,
-      // but we additionally disable `@` ("@@mention" is invalid)
-      if (pos >= 2 && tail[pos - 2] === '@') {
-        return false;
-      }
-      return tail.match(self.re.twitter)[0].length;
-    }
-    return 0;
-  },
-  normalize: function (match) {
-    match.url = 'https://twitter.com/' + match.url.replace(/^@/, '');
-  }
-});
+  validate: lambda do |text, pos, obj|
+    tail = text.slice(pos..-1)
+    if (!obj.re[:twitter])
+      obj.re[:twitter] =  Regexp.new('^([a-zA-Z0-9_]){1,15}(?!_)(?=$|' + LinkifyRe::SRC_Z_P_CC + ')')
+    end
+    if (obj.re[:twitter] =~ tail)
+      return 0 if (pos >= 2 && text[pos - 2] == '@')
+      return tail.match(obj.re[:twitter])[0].length
+    end
+    return 0
+  end,
+  normalize: lambda do |m, obj|
+    m.url = 'https://twitter.com/' + m.url.sub(/^@/, '')
+  end
+})
 ```
 API
 ---
-__[API documentation](http://markdown-it.github.io/linkify-it/doc)__
-### new LinkifyIt(schemas)
+### Linkify.new(schemas)
 Creates new linkifier instance with optional additional schemas.
-Can be called without `new` keyword for convenience.
 By default understands:
 - `http(s)://...` , `ftp://...`, `mailto:...` & `//...` links
 - "fuzzy" links and emails (google.com, foo@bar.com).
-`schemas` is an object, where each key/value describes protocol/rule:
+`schemas` is a Hash, where each key/value describes protocol/rule:
 - __key__ - link prefix (usually, protocol name with `:` at the end, `skype:`
-  for example). `linkify-it` makes shure that prefix is not preceeded with
+  for example). `linkify-it-rb` makes sure that prefix is not preceded with
   alphanumeric char.
 - __value__ - rule to check tail after link prefix
   - _String_ - just alias to existing rule
-  - _Object_
-    - _validate_ - validator function (should return matched length on success),
+  - _Hash_
+    - _validate_ - validator block (should return matched length on success),
       or `RegExp`.
-    - _normalize_ - optional function to normalize text & url of matched result
+    - _normalize_ - optional block to normalize text & url of matched result
       (for example, for twitter mentions).
@@ -120,20 +113,20 @@ Searches linkifiable pattern and returns `true` on success or `false` on fail.
 ### .pretest(text)
-Quick check if link MAY BE can exist. Can be used to optimize more expensive
-`.test()` calls. Return `false` if link can not be found, `true` - if `.test()`
+Quick check if a link MAY exist. Can be used to optimize more expensive
+`.test` calls. Return `false` if link can not be found, `true` - if `.test`
 call needed to know exactly.
 ### .testSchemaAt(text, name, offset)
-Similar to `.test()` but checks only specific protocol tail exactly at given
+Similar to `.test` but checks only specific protocol tail exactly at given
 position. Returns length of found pattern (0 on fail).
 ### .match(text)
-Returns `Array` of found link matches or null if nothing found.
+Returns `Array` of found link matches or nil if nothing found.
 Each match has:
@@ -148,8 +141,8 @@ Each match has:
 ### .tlds(list[, keepOld])
-Load (or merge) new tlds list. Those are user for fuzzy links (without prefix)
-to avoid false positives. By default this algorythm used:
+Load (or merge) new tlds list. These are used for fuzzy links (without prefix)
+to avoid false positives. By default this algorithm uses:
 - hostname with any 2-letter root zones are ok.
 - biz|com|edu|gov|net|org|pro|web|xxx|aero|asia|coop|info|museum|name|shop|рф
@@ -162,9 +155,9 @@ If list is replaced, then exact match for 2-chars root zones will be checked.
 ### .add(schema, definition)
 Add new rule with `schema` prefix. For definition details see constructor
-description. To disable existing rule use `.add(name, null)`
+description. To disable existing rule use `.add(name, nil)`
 ## License
-[MIT](https://github.com/markdown-it/linkify-it/blob/master/LICENSE)
+[MIT](https://github.com/digitalmoksha/linkify-it-rb/blob/master/LICENSE)

data/lib/linkify-it-rb/index.rb CHANGED

@@ -87,25 +87,17 @@ class Linkify
   #
   #------------------------------------------------------------------------------
   def compile
-    # Load & clone RE patterns.
-    re = @re = {}  #.merge!(require('./lib/re'))
+    @re = { src_xn: LinkifyRe::SRC_XN }
     # Define dynamic patterns
     tlds = @__tlds__.dup
+    tlds.push('[a-z]{2}') if (!@__tlds_replaced__)
+    tlds.push(@re[:src_xn])
-    if (!@__tlds_replaced__)
-      tlds.push('[a-z]{2}')
-    end
-    tlds.push(re[:src_xn])
-    re[:src_tlds] = tlds.join('|')
-    untpl = lambda { |tpl| tpl.gsub('%TLDS%', re[:src_tlds]) }
-    re[:email_fuzzy]      = Regexp.new(LinkifyRe::TPL_EMAIL_FUZZY.gsub('%TLDS%', re[:src_tlds]), true)
-    re[:link_fuzzy]       = Regexp.new(LinkifyRe::TPL_LINK_FUZZY.gsub('%TLDS%', re[:src_tlds]), true)
-    re[:host_fuzzy_test]  = Regexp.new(LinkifyRe::TPL_HOST_FUZZY_TEST.gsub('%TLDS%', re[:src_tlds]), true)
+    @re[:src_tlds] = tlds.join('|')
+    @re[:email_fuzzy]      = Regexp.new(LinkifyRe::TPL_EMAIL_FUZZY.gsub('%TLDS%', @re[:src_tlds]), true)
+    @re[:link_fuzzy]       = Regexp.new(LinkifyRe::TPL_LINK_FUZZY.gsub('%TLDS%', @re[:src_tlds]), true)
+    @re[:host_fuzzy_test]  = Regexp.new(LinkifyRe::TPL_HOST_FUZZY_TEST.gsub('%TLDS%', @re[:src_tlds]), true)
     #
     # Compile each schema
@@ -180,8 +172,8 @@ class Linkify
     slist = @__compiled__.select {|name, val| name.length > 0 && !val.nil? }.keys.map {|str| escapeRE(str)}.join('|')
     # (?!_) cause 1.5x slowdown
-    @re[:schema_test]   = Regexp.new('(^|(?!_)(?:>|' + LinkifyRe::SRC_Z_P_CC_CF + '))(' + slist + ')', 'i')
-    @re[:schema_search] = Regexp.new('(^|(?!_)(?:>|' + LinkifyRe::SRC_Z_P_CC_CF + '))(' + slist + ')', 'ig')
+    @re[:schema_test]   = Regexp.new('(^|(?!_)(?:>|' + LinkifyRe::SRC_Z_P_CC + '))(' + slist + ')', 'i')
+    @re[:schema_search] = Regexp.new('(^|(?!_)(?:>|' + LinkifyRe::SRC_Z_P_CC + '))(' + slist + ')', 'ig')
     @re[:pretest]       = Regexp.new(
                               '(' + @re[:schema_test].source + ')|' +
@@ -318,14 +310,15 @@ class Linkify
     @__index__      = -1
     return false if (!text.length)
     # try to scan for link with schema - that's the most simple rule
     if @re[:schema_test] =~ text
       re = @re[:schema_search]
-      # re[:lastIndex] = 0
-      while ((m = re.match(text)) != nil)
-        len = testSchemaAt(text, m[2], m.end(0)) #re[:lastIndex])
-        if (len)
+      lastIndex = 0
+      while ((m = re.match(text, lastIndex)) != nil)
+        lastIndex = m.end(0)
+        len       = testSchemaAt(text, m[2], lastIndex)
+        if len > 0
           @__schema__     = m[2]
           @__index__      = m.begin(0) + m[1].length
           @__last_index__ = m.begin(0) + m[0].length + len
@@ -334,9 +327,8 @@ class Linkify
       end
     end
+    # guess schemaless links
     if (@__compiled__['http:'])
-      # guess schemaless links
       tld_pos = text.index(@re[:host_fuzzy_test])
       if !tld_pos.nil?
         # if tld is located after found link - no need to check fuzzy pattern
@@ -355,8 +347,8 @@ class Linkify
       end
     end
+    # guess schemaless emails
     if (@__compiled__['mailto:'])
-      # guess schemaless emails
       at_pos = text.index('@')
       if !at_pos.nil?
         # We can't skip this check, because this cases are possible:
@@ -410,7 +402,7 @@ class Linkify
   # LinkifyIt#match(text) -> Array|null
   #
-  # Returns array of found link descriptions or `null` on fail. We strongly
+  # Returns array of found link descriptions or `null` on fail. We strongly suggest
   # to use [[LinkifyIt#test]] first, for best speed.
   #
   # ##### Result match description

data/lib/linkify-it-rb/re.rb CHANGED

@@ -1,58 +1,57 @@
 module LinkifyRe
     # Use direct extract instead of `regenerate` to reduce size
-    SRC_ANY = UCMicro::Properties::Any::REGEX
-    SRC_CC  = UCMicro::Categories::Cc::REGEX
-    SRC_CF  = UCMicro::Categories::Cf::REGEX
-    SRC_Z   = UCMicro::Categories::Z::REGEX
-    SRC_P   = UCMicro::Categories::P::REGEX
+    SRC_ANY = UCMicro::Properties::Any::REGEX.source
+    SRC_CC  = UCMicro::Categories::Cc::REGEX.source
+    SRC_Z   = UCMicro::Categories::Z::REGEX.source
+    SRC_P   = UCMicro::Categories::P::REGEX.source
-    # \p{\Z\P\Cc\CF} (white spaces + control + format + punctuation)
-    SRC_Z_P_CC_CF = [ SRC_Z, SRC_P, SRC_CC, SRC_CF ].join('|')
+    # \p{\Z\P\Cc} (white spaces + control + punctuation)
+    SRC_Z_P_CC = [ SRC_Z, SRC_P, SRC_CC ].join('|')
-    # \p{\Z\Cc\CF} (white spaces + control + format)
-    SRC_Z_CC_CF = [ SRC_Z, SRC_CC, SRC_CF ].join('|')
+    # \p{\Z\Cc} (white spaces + control)
+    SRC_Z_CC = [ SRC_Z, SRC_CC ].join('|')
     # All possible word characters (everything without punctuation, spaces & controls)
     # Defined via punctuation & spaces to save space
     # Should be something like \p{\L\N\S\M} (\w but without `_`)
-    SRC_PSEUDO_LETTER       = '(?:(?!' + SRC_Z_P_CC_CF + ')' + SRC_ANY.source + ')'
+    SRC_PSEUDO_LETTER       = '(?:(?!' + SRC_Z_P_CC + ')' + SRC_ANY + ')'
     # The same as above but without [0-9]
-    SRC_PSEUDO_LETTER_NON_D = '(?:(?![0-9]|' + SRC_Z_P_CC_CF + ')' + SRC_ANY.source + ')'
+    SRC_PSEUDO_LETTER_NON_D = '(?:(?![0-9]|' + SRC_Z_P_CC + ')' + SRC_ANY + ')'
     #------------------------------------------------------------------------------
     SRC_IP4   = '(?:(25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\\.){3}(25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)'
-    SRC_AUTH  = '(?:(?:(?!' + SRC_Z_CC_CF + ').)+@)?'
+    SRC_AUTH  = '(?:(?:(?!' + SRC_Z_CC + ').)+@)?'
     SRC_PORT  = '(?::(?:6(?:[0-4]\\d{3}|5(?:[0-4]\\d{2}|5(?:[0-2]\\d|3[0-5])))|[1-5]?\\d{1,4}))?'
-    SRC_HOST_TERMINATOR = '(?=$|' + SRC_Z_P_CC_CF + ')(?!-|_|:\\d|\\.-|\\.(?!$|' + SRC_Z_P_CC_CF + '))'
+    SRC_HOST_TERMINATOR = '(?=$|' + SRC_Z_P_CC + ')(?!-|_|:\\d|\\.-|\\.(?!$|' + SRC_Z_P_CC + '))'
     SRC_PATH =
       '(?:' +
         '[/?#]' +
           '(?:' +
-            '(?!' + SRC_Z_CC_CF + '|[()\\[\\]{}.,"\'?!\\-]).|' +
-            '\\[(?:(?!' + SRC_Z_CC_CF + '|\\]).)*\\]|' +
-            '\\((?:(?!' + SRC_Z_CC_CF + '|[)]).)*\\)|' +
-            '\\{(?:(?!' + SRC_Z_CC_CF + '|[}]).)*\\}|' +
-            '\\"(?:(?!' + SRC_Z_CC_CF + '|["]).)+\\"|' +
-            "\\'(?:(?!" + SRC_Z_CC_CF + "|[']).)+\\'|" +
+            '(?!' + SRC_Z_CC + '|[()\\[\\]{}.,"\'?!\\-]).|' +
+            '\\[(?:(?!' + SRC_Z_CC + '|\\]).)*\\]|' +
+            '\\((?:(?!' + SRC_Z_CC + '|[)]).)*\\)|' +
+            '\\{(?:(?!' + SRC_Z_CC + '|[}]).)*\\}|' +
+            '\\"(?:(?!' + SRC_Z_CC + '|["]).)+\\"|' +
+            "\\'(?:(?!" + SRC_Z_CC + "|[']).)+\\'|" +
             "\\'(?=" + SRC_PSEUDO_LETTER + ').|' +  # allow `I'm_king` if no pair found
             '\\.{2,3}[a-zA-Z0-9%]|' + # github has ... in commit range links. Restrict to
                                       # english & percent-encoded only, until more examples found.
-            '\\.(?!' + SRC_Z_CC_CF + '|[.]).|' +
-            '\\-(?!' + SRC_Z_CC_CF + '|--(?:[^-]|$))(?:[-]+|.)|' +  # `---` => long dash, terminate
-            '\\,(?!' + SRC_Z_CC_CF + ').|' +      # allow `,,,` in paths
-            '\\!(?!' + SRC_Z_CC_CF + '|[!]).|' +
-            '\\?(?!' + SRC_Z_CC_CF + '|[?]).' +
+            '\\.(?!' + SRC_Z_CC + '|[.]).|' +
+            '\\-(?!' + SRC_Z_CC + '|--(?:[^-]|$))(?:[-]+|.)|' +  # `---` => long dash, terminate
+            '\\,(?!' + SRC_Z_CC + ').|' +      # allow `,,,` in paths
+            '\\!(?!' + SRC_Z_CC + '|[!]).|' +
+            '\\?(?!' + SRC_Z_CC + '|[?]).' +
           ')+' +
         '|\\/' +
       ')?'
     SRC_EMAIL_NAME  = '[\\-;:&=\\+\\$,\\"\\.a-zA-Z0-9_]+'
-    SRC_XN          = 'xn--[a-z0-9\\-]{1,59}';
+    SRC_XN          = 'xn--[a-z0-9\\-]{1,59}'
     # More to read about domain names
     # http://serverfault.com/questions/638260/
@@ -89,7 +88,7 @@ module LinkifyRe
         SRC_IP4 +
       '|' +
         '(?:(?:(?:' + SRC_DOMAIN + ')\\.)+(?:%TLDS%))' +
-      ')';
+      ')'
     SRC_HOST_STRICT            = SRC_HOST + SRC_HOST_TERMINATOR
     TPL_HOST_FUZZY_STRICT      = TPL_HOST_FUZZY + SRC_HOST_TERMINATOR
@@ -100,12 +99,12 @@ module LinkifyRe
     # Main rules
     # Rude test fuzzy links by host, for quick deny
-    TPL_HOST_FUZZY_TEST = 'localhost|\\.\\d{1,3}\\.|(?:\\.(?:%TLDS%)(?:' + SRC_Z_P_CC_CF + '|$))'
-    TPL_EMAIL_FUZZY     = '(^|>|' + SRC_Z_CC_CF + ')(' + SRC_EMAIL_NAME + '@' + TPL_HOST_FUZZY_STRICT + ')'
+    TPL_HOST_FUZZY_TEST = 'localhost|\\.\\d{1,3}\\.|(?:\\.(?:%TLDS%)(?:' + SRC_Z_P_CC + '|$))'
+    TPL_EMAIL_FUZZY     = '(^|>|' + SRC_Z_CC + ')(' + SRC_EMAIL_NAME + '@' + TPL_HOST_FUZZY_STRICT + ')'
     TPL_LINK_FUZZY =
         # Fuzzy link can't be prepended with .:/\- and non punctuation.
         # but can start with > (markdown blockquote)
-        '(^|(?![.:/\\-_@])(?:[$+<=>^`|]|' + SRC_Z_P_CC_CF + '))' +
+        '(^|(?![.:/\\-_@])(?:[$+<=>^`|]|' + SRC_Z_P_CC + '))' +
         '((?![$+<=>^`|])' + TPL_HOST_PORT_FUZZY_STRICT + SRC_PATH + ')'
 end

data/lib/linkify-it-rb/version.rb CHANGED

@@ -1,5 +1,5 @@
 module LinkifyIt
-  VERSION = '0.1.0.0'
+  VERSION = '1.0.0.2'
 end

data/spec/linkify-it-rb/test_spec.rb CHANGED

@@ -1,49 +1,43 @@
+fixture_dir  = File.join(File.dirname(__FILE__), 'fixtures')
 #------------------------------------------------------------------------------
 describe 'links' do
-  # TODO tests which can't seem to get passing at the moment, so skip them
-  failing_test = [
-    95,     # GOOGLE.COM.     unable to get final . to be removed
-    214     # xn--d1abbgf6aiiy.xn--p1ai
-  ]
   l = Linkify.new
   l.bypass_normalizer = true    # kill the normalizer
   skipNext  = false
-  linkfile  = File.join(File.dirname(__FILE__), 'fixtures/links.txt')
+  linkfile  = File.join(fixture_dir, 'links.txt')
   lines     = File.read(linkfile).split(/\r?\n/)
   lines.each_with_index do |line, idx|
     if skipNext
       skipNext = false
       next
     end
     line      = line.sub(/^%.*/, '')
     next_line = (lines[idx + 1] || '').sub(/^%.*/, '')
     next if line.strip.empty?
-    unless failing_test.include?(idx + 1)
-      if !next_line.strip.empty?
+    if !next_line.strip.empty?
-        it "line #{idx + 1}" do
-          expect(l.pretest(line)).to eq true        # "(pretest failed in `#{line}`)"
-          expect(l.test("\n#{line}\n")).to eq true  # "(link not found in `\n#{line}\n`)"
-          expect(l.test(line)).to eq true           # "(link not found in `#{line}`)"
-          expect(l.match(line)[0].url).to eq next_line
-        end
+      it "line #{idx + 1}" do
+        expect(l.pretest(line)).to eq true        # "(pretest failed in `#{line}`)"
+        expect(l.test("\n#{line}\n")).to eq true  # "(link not found in `\n#{line}\n`)"
+        expect(l.test(line)).to eq true           # "(link not found in `#{line}`)"
+        expect(l.match(line)[0].url).to eq next_line
+      end
-        skipNext = true
-      else
+      skipNext = true
-        it "line #{idx + 1}" do
-          expect(l.pretest(line)).to eq true        # "(pretest failed in `#{line}`)"
-          expect(l.test("\n#{line}\n")).to eq true  # "(link not found in `\n#{line}\n`)"
-          expect(l.test(line)).to eq true           # "(link not found in `#{line}`)"
-          expect(l.match(line)[0].url).to eq line
-        end
+    else
+      it "line #{idx + 1}" do
+        expect(l.pretest(line)).to eq true        # "(pretest failed in `#{line}`)"
+        expect(l.test("\n#{line}\n")).to eq true  # "(link not found in `\n#{line}\n`)"
+        expect(l.test(line)).to eq true           # "(link not found in `#{line}`)"
+        expect(l.match(line)[0].url).to eq line
       end
     end
   end
@@ -54,26 +48,18 @@ end
 #------------------------------------------------------------------------------
 describe 'not links' do
-  # TODO tests which can't seem to get passing at the moment, so skip them
-  failing_test = [ 6, 7, 8, 12, 16, 19, 22, 23, 24, 25, 26, 27, 28, 29, 48 ]
   l = Linkify.new
   l.bypass_normalizer = true    # kill the normalizer
-  linkfile  = File.join(File.dirname(__FILE__), 'fixtures/not_links.txt')
+  linkfile  = File.join(fixture_dir, 'not_links.txt')
   lines     = File.read(linkfile).split(/\r?\n/)
   lines.each_with_index do |line, idx|
     line = line.sub(/^%.*/, '')
     next if line.strip.empty?
-    unless failing_test.include?(idx + 1)
-      it "line #{idx + 1}" do
-        # assert.notOk(l.test(line),
-        #  '(should not find link in `' + line + '`, but found `' +
-        #  JSON.stringify((l.match(line) || [])[0]) + '`)');
-        expect(l.test(line)).not_to eq true
-      end
+    it "line #{idx + 1}" do
+      expect(l.test(line)).not_to eq true
     end
   end
@@ -93,142 +79,143 @@ describe 'API' do
     expect(l.test('google.myroot')).to eq true
     expect(l.test('google.xyz')).to_not eq true
-    # this is some other package of tlds which we don't have
+    # TODO this is some other package of tlds which we don't have
+    # https://github.com/stephenmathieson/node-tlds
+    # instead we should be using Public Suffix List
+    # https://github.com/weppos/publicsuffix-ruby
     # l.tlds(require('tlds'));
     # assert.ok(l.test('google.xyz'));
     # assert.notOk(l.test('google.myroot'));
   end
-  # TODO Tests not passing
   #------------------------------------------------------------------------------
-  # it 'add rule as regexp, with default normalizer' do
-  #   l = Linkify.new.add('my:', {validate: /^\/\/[a-z]+/} )
-  #
-  #   match = l.match('google.com. my:// my://asdf!')
-  #
-  #   expect(match[0].text).to eq 'google.com'
-  #   expect(match[1].text).to eq 'my://asdf'
-  # end
-  # TODO Tests not passing
+  it 'add rule as regexp, with default normalizer' do
+    l = Linkify.new.add('my:', {validate: /^\/\/[a-z]+/} )
+    match = l.match('google.com. my:// my://asdf!')
+    expect(match[0].text).to eq 'google.com'
+    expect(match[1].text).to eq 'my://asdf'
+  end
+  #------------------------------------------------------------------------------
+  it 'add rule with normalizer' do
+    l = Linkify.new.add('my:', {
+      validate: /^\/\/[a-z]+/,
+      normalize: lambda do |m, obj|
+        m.text = m.text.sub(/^my:\/\//, '').upcase
+        m.url  = m.url.upcase
+      end
+    })
+    match = l.match('google.com. my:// my://asdf!')
+    expect(match[1].text).to eq 'ASDF'
+    expect(match[1].url).to eq 'MY://ASDF'
+  end
   #------------------------------------------------------------------------------
-  # it 'add rule with normalizer'
-  #   l = Linkify.new.add('my:', {
-  #     validate: /^\/\/[a-z]+/,
-  #     normalize: lambda {|m|
-  #       m.text = m.text.sub(/^my:\/\//, '').upcase
-  #       m.url  = m.url.upcase
-  #     }
-  #   })
-  #
-  #   match = l.match('google.com. my:// my://asdf!')
-  #
-  #   expect(match[1].text).to eq 'ASDF'
-  #   expect(match[1].url).to eq 'MY://ASDF'
-  # end
-#   it('disable rule', function () {
-#     var l = linkify();
-#
-#     assert.ok(l.test('http://google.com'));
-#     assert.ok(l.test('foo@bar.com'));
-#     l.add('http:', null);
-#     l.add('mailto:', null);
-#     assert.notOk(l.test('http://google.com'));
-#     assert.notOk(l.test('foo@bar.com'));
-#   });
-#
-#
-#   it('add bad definition', function () {
-#     var l;
-#
-#     l = linkify();
-#
-#     assert.throw(function () {
-#       l.add('test:', []);
-#     });
-#
-#     l = linkify();
-#
-#     assert.throw(function () {
-#       l.add('test:', { validate: [] });
-#     });
-#
-#     l = linkify();
-#
-#     assert.throw(function () {
-#       l.add('test:', {
-#         validate: function () { return false; },
-#         normalize: 'bad'
-#       });
-#     });
-#   });
-#
-#
-#   it('test at position', function () {
-#     var l = linkify();
-#
-#     assert.ok(l.testSchemaAt('http://google.com', 'http:', 5));
-#     assert.ok(l.testSchemaAt('http://google.com', 'HTTP:', 5));
-#     assert.notOk(l.testSchemaAt('http://google.com', 'http:', 6));
-#
-#     assert.notOk(l.testSchemaAt('http://google.com', 'bad_schema:', 6));
-#   });
-#
-#
-#   it('correct cache value', function () {
-#     var l = linkify();
-#
-#     var match = l.match('.com. http://google.com google.com ftp://google.com');
-#
-#     assert.equal(match[0].text, 'http://google.com');
-#     assert.equal(match[1].text, 'google.com');
-#     assert.equal(match[2].text, 'ftp://google.com');
-#   });
-#
-#   it('normalize', function () {
-#     var l = linkify(), m;
-#
-#     m = l.match('mailto:foo@bar.com')[0];
-#
-#     // assert.equal(m.text, 'foo@bar.com');
-#     assert.equal(m.url,  'mailto:foo@bar.com');
-#
-#     m = l.match('foo@bar.com')[0];
-#
-#     // assert.equal(m.text, 'foo@bar.com');
-#     assert.equal(m.url,  'mailto:foo@bar.com');
-#   });
-#
-#
-#   it('test @twitter rule', function () {
-#     var l = linkify().add('@', {
-#       validate: function (text, pos, self) {
-#         var tail = text.slice(pos);
-#
-#         if (!self.re.twitter) {
-#           self.re.twitter =  new RegExp(
-#             '^([a-zA-Z0-9_]){1,15}(?!_)(?=$|' + self.re.src_ZPCcCf + ')'
-#           );
-#         }
-#         if (self.re.twitter.test(tail)) {
-#           if (pos >= 2 && tail[pos - 2] === '@') {
-#             return false;
-#           }
-#           return tail.match(self.re.twitter)[0].length;
-#         }
-#         return 0;
-#       },
-#       normalize: function (m) {
-#         m.url = 'https://twitter.com/' + m.url.replace(/^@/, '');
-#       }
-#     });
-#
-#     assert.equal(l.match('hello, @gamajoba_!')[0].text, '@gamajoba_');
-#     assert.equal(l.match(':@givi')[0].text, '@givi');
-#     assert.equal(l.match(':@givi')[0].url, 'https://twitter.com/givi');
-#     assert.notOk(l.test('@@invalid'));
-#   });
+  it 'disable rule' do
+    l = Linkify.new
+    expect(l.test('http://google.com')).to eq true
+    expect(l.test('foo@bar.com')).to eq true
+    l.add('http:', nil)
+    l.add('mailto:', nil)
+    expect(l.test('http://google.com')).to eq false
+    expect(l.test('foo@bar.com')).to eq false
+  end
+  #------------------------------------------------------------------------------
+  it 'add bad definition' do
+    l = Linkify.new
+    expect {
+      l.add('test:', [])
+    }.to raise_error(StandardError)
+    l = Linkify.new
+    expect {
+      l.add('test:', {validate: []})
+    }.to raise_error(StandardError)
+    l = Linkify.new
+    expect {
+      l.add('test:', {validate: []})
+    }.to raise_error(StandardError)
+    expect {
+      l.add('test:', {
+        validate: lambda { return false },
+        normalize: 'bad'
+      })
+    }.to raise_error(StandardError)
+  end
+  #------------------------------------------------------------------------------
+  it 'test at position' do
+    l = Linkify.new
+    expect(l.testSchemaAt('http://google.com', 'http:', 5) > 0).to eq true
+    expect(l.testSchemaAt('http://google.com', 'HTTP:', 5) > 0).to eq true
+    expect(l.testSchemaAt('http://google.com', 'http:', 6) > 0).to eq false
+    expect(l.testSchemaAt('http://google.com', 'bad_schema:', 6) > 0).to eq false
+  end
+  #------------------------------------------------------------------------------
+  it 'correct cache value' do
+    l     = Linkify.new
+    match = l.match('.com. http://google.com google.com ftp://google.com')
+    expect(match[0].text).to eq 'http://google.com'
+    expect(match[1].text).to eq 'google.com'
+    expect(match[2].text).to eq 'ftp://google.com'
+  end
+  #------------------------------------------------------------------------------
+  it 'normalize' do
+    l = Linkify.new
+    m = l.match('mailto:foo@bar.com')[0]
+    # assert.equal(m.text, 'foo@bar.com');
+    expect(m.url).to eq 'mailto:foo@bar.com'
+    m = l.match('foo@bar.com')[0]
+    # assert.equal(m.text, 'foo@bar.com');
+    expect(m.url).to eq 'mailto:foo@bar.com'
+  end
+  #------------------------------------------------------------------------------
+  it 'test @twitter rule' do
+    l = Linkify.new.add('@', {
+      validate: lambda do |text, pos, obj|
+        tail = text.slice(pos..-1)
+        if (!obj.re[:twitter])
+          obj.re[:twitter] =  Regexp.new(
+            '^([a-zA-Z0-9_]){1,15}(?!_)(?=$|' + LinkifyRe::SRC_Z_P_CC + ')'
+          )
+        end
+        if (obj.re[:twitter] =~ tail)
+          if (pos >= 2 && text[pos - 2] == '@')
+            return 0
+          end
+          return tail.match(obj.re[:twitter])[0].length
+        end
+        return 0
+      end,
+      normalize: lambda do |m, obj|
+        m.url = 'https://twitter.com/' + m.url.sub(/^@/, '')
+      end
+    })
+    expect(l.match('hello, @gamajoba_!')[0].text).to eq '@gamajoba_'
+    expect(l.match(':@givi')[0].text).to eq '@givi'
+    expect(l.match(':@givi')[0].url).to eq 'https://twitter.com/givi'
+    expect(l.test('@@invalid')).to eq false
+  end
 end

metadata CHANGED

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: linkify-it-rb
 version: !ruby/object:Gem::Version
-  version: 0.1.0.0
+  version: 1.0.0.2
 platform: ruby
 authors:
 - Brett Walker
@@ -9,7 +9,7 @@ authors:
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2015-03-26 00:00:00.000000000 Z
+date: 2015-04-01 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: uc.micro-rb