RubyGems - ruby-spacy - Versions diffs - 0.1.4 → 0.1.5.0 - Mend

ruby-spacy 0.1.4 → 0.1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (60)

checksums.yaml +4 -4
data/.rubocop.yml +48 -0
data/.solargraph.yml +22 -0
data/CHANGELOG.md +5 -1
data/Gemfile +7 -7
data/Gemfile.lock +3 -3
data/README.md +40 -39
data/examples/get_started/lexeme.rb +3 -1
data/examples/get_started/linguistic_annotations.rb +3 -1
data/examples/get_started/morphology.rb +3 -1
data/examples/get_started/most_similar.rb +30 -27
data/examples/get_started/named_entities.rb +4 -2
data/examples/get_started/pos_tags_and_dependencies.rb +3 -1
data/examples/get_started/similarity.rb +4 -2
data/examples/get_started/tokenization.rb +3 -1
data/examples/get_started/visualizing_dependencies.rb +2 -2
data/examples/get_started/visualizing_dependencies_compact.rb +2 -0
data/examples/get_started/visualizing_named_entities.rb +4 -2
data/examples/get_started/vocab.rb +3 -1
data/examples/get_started/word_vectors.rb +3 -1
data/examples/japanese/ancestors.rb +6 -4
data/examples/japanese/entity_annotations_and_labels.rb +4 -2
data/examples/japanese/information_extraction.rb +6 -6
data/examples/japanese/lemmatization.rb +3 -1
data/examples/japanese/most_similar.rb +30 -27
data/examples/japanese/named_entity_recognition.rb +3 -2
data/examples/japanese/navigating_parse_tree.rb +19 -17
data/examples/japanese/noun_chunks.rb +2 -0
data/examples/japanese/pos_tagging.rb +3 -1
data/examples/japanese/sentence_segmentation.rb +3 -2
data/examples/japanese/similarity.rb +2 -0
data/examples/japanese/tokenization.rb +2 -0
data/examples/japanese/visualizing_dependencies.rb +3 -1
data/examples/japanese/visualizing_named_entities.rb +4 -2
data/examples/linguistic_features/ancestors.rb +7 -5
data/examples/linguistic_features/entity_annotations_and_labels.rb +4 -2
data/examples/linguistic_features/finding_a_verb_with_a_subject.rb +3 -5
data/examples/linguistic_features/information_extraction.rb +9 -9
data/examples/linguistic_features/iterating_children.rb +6 -8
data/examples/linguistic_features/iterating_lefts_and_rights.rb +7 -5
data/examples/linguistic_features/lemmatization.rb +3 -1
data/examples/linguistic_features/named_entity_recognition.rb +3 -1
data/examples/linguistic_features/navigating_parse_tree.rb +3 -1
data/examples/linguistic_features/noun_chunks.rb +3 -1
data/examples/linguistic_features/pos_tagging.rb +3 -1
data/examples/linguistic_features/retokenize_1.rb +2 -0
data/examples/linguistic_features/retokenize_2.rb +4 -2
data/examples/linguistic_features/rule_based_morphology.rb +4 -2
data/examples/linguistic_features/sentence_segmentation.rb +3 -2
data/examples/linguistic_features/similarity.rb +4 -2
data/examples/linguistic_features/similarity_between_lexemes.rb +2 -0
data/examples/linguistic_features/similarity_between_spans.rb +7 -5
data/examples/linguistic_features/tokenization.rb +3 -2
data/examples/rule_based_matching/creating_spans_from_matches.rb +5 -3
data/examples/rule_based_matching/matcher.rb +4 -2
data/lib/ruby-spacy/version.rb +1 -1
data/lib/ruby-spacy.rb +142 -136
data/ruby-spacy.gemspec +15 -17
data/tags +132 -0
metadata +69 -10

data/examples/japanese/most_similar.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -9,38 +11,39 @@ france = nlp.get_lexeme("フランス")
 query = tokyo.vector - japan.vector + france.vector
-headings = ["key", "text", "score"]
+headings = %w[rank text score]
 rows = []
 results = nlp.most_similar(query, 20)
-results.each do |lexeme|
-  rows << [lexeme[:key], lexeme[:text], lexeme[:score],]
+results.each_with_index do |lexeme, i|
+  index = (i + 1).to_s
+  rows << [index, lexeme.text, lexeme.score]
 end
 table = Terminal::Table.new rows: rows, headings: headings
 puts table
-# +----------------------+----------------+--------------------+
-# | key                  | text           | score              |
-# +----------------------+----------------+--------------------+
-# | 12090003238699662352 | パリ           | 0.7376999855041504 |
-# | 18290786970454458111 | フランス       | 0.7221999764442444 |
-# | 9360021637096476946  | 東京           | 0.6697999835014343 |
-# | 2437546359230213520  | ストラスブール | 0.631600022315979  |
-# | 13988178952745813186 | リヨン         | 0.5939000248908997 |
-# | 10427160276079242800 | Paris          | 0.574400007724762  |
-# | 5562396768860926997  | ベルギー       | 0.5683000087738037 |
-# | 15029176915627965481 | ニース         | 0.5679000020027161 |
-# | 9750625950625019690  | アルザス       | 0.5644999742507935 |
-# | 2381640614569534741  | 南仏           | 0.5547999739646912 |
-# | 7486004458946554189  | ロンドン       | 0.5525000095367432 |
-# | 7457654095417343716  | モンマルトル   | 0.5453000068664551 |
-# | 14063777960246535660 | ブローニュ     | 0.5338000059127808 |
-# | 3297880777656467136  | トゥールーズ   | 0.5275999903678894 |
-# | 3059066136348671923  | バスティーユ   | 0.5213000178337097 |
-# | 2423471048892368989  | フランス人     | 0.5194000005722046 |
-# | 15944886306236465675 | ロレーヌ       | 0.5148000121116638 |
-# | 9592561648283566590  | モンパルナス   | 0.513700008392334  |
-# | 6560045335275831141  | 渡仏           | 0.5131000280380249 |
-# | 8597467336360225096  | イタリア       | 0.5127000212669373 |
-# +----------------------+----------------+--------------------+
+# +------+----------------+--------------------+
+# | rank | text           | score              |
+# +------+----------------+--------------------+
+# | 1    | パリ           | 0.7376999855041504 |
+# | 2    | フランス       | 0.7221999764442444 |
+# | 3    | 東京           | 0.6697999835014343 |
+# | 4    | ストラスブール | 0.631600022315979  |
+# | 5    | リヨン         | 0.5939000248908997 |
+# | 6    | Paris          | 0.574400007724762  |
+# | 7    | ベルギー       | 0.5683000087738037 |
+# | 8    | ニース         | 0.5679000020027161 |
+# | 9    | アルザス       | 0.5644999742507935 |
+# | 10   | 南仏           | 0.5547999739646912 |
+# | 11   | ロンドン       | 0.5525000095367432 |
+# | 12   | モンマルトル   | 0.5453000068664551 |
+# | 13   | ブローニュ     | 0.5338000059127808 |
+# | 14   | トゥールーズ   | 0.5275999903678894 |
+# | 15   | バスティーユ   | 0.5213000178337097 |
+# | 16   | フランス人     | 0.5194000005722046 |
+# | 17   | ロレーヌ       | 0.5148000121116638 |
+# | 18   | モンパルナス   | 0.513700008392334  |
+# | 19   | 渡仏           | 0.5131000280380249 |
+# | 20   | イタリア       | 0.5127000212669373 |
+# +------+----------------+--------------------+

data/examples/japanese/named_entity_recognition.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -6,7 +8,7 @@ nlp = Spacy::Language.new("ja_core_news_lg")
 sentence = "任天堂は1983年にファミコンを14,800円で発売した。"
 doc = nlp.read(sentence)
-headings = ["text", "start", "end", "label"]
+headings = %w[text start end label]
 rows = []
 doc.ents.each do |ent|
@@ -24,4 +26,3 @@ puts table
 # | ファミコン | 10    | 15  | PRODUCT |
 # | 14,800円   | 16    | 23  | MONEY   |
 # +------------+-------+-----+---------+

data/examples/japanese/navigating_parse_tree.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -15,20 +17,20 @@ end
 table = Terminal::Table.new rows: rows, headings: headings
 puts table
- +------+----------+-----------+----------+------------------------+
- | text | dep      | head text | head pos | children               |
- +------+----------+-----------+----------+------------------------+
- | 自動 | compound | 車        | 92       |                        |
- | 運転 | compound | 車        | 92       |                        |
- | 車   | nsubj    | 転嫁      | 100      | 自動, 運転, は         |
- | は   | case     | 車        | 92       |                        |
- | 保険 | compound | 責任      | 92       |                        |
- | 責任 | obj      | 転嫁      | 100      | 保険, を               |
- | を   | case     | 責任      | 92       |                        |
- | 製造 | compound | 者        | 92       |                        |
- | 者   | obl      | 転嫁      | 100      | 製造, に               |
- | に   | case     | 者        | 92       |                        |
- | 転嫁 | ROOT     | 転嫁      | 100      | 車, 責任, 者, する, 。 |
- | する | aux      | 転嫁      | 100      |                        |
- | 。   | punct    | 転嫁      | 100      |                        |
- +------+----------+-----------+----------+------------------------+
+# +------+----------+-----------+----------+------------------------+
+# | text | dep      | head text | head pos | children               |
+# +------+----------+-----------+----------+------------------------+
+# | 自動 | compound | 車        | 92       |                        |
+# | 運転 | compound | 車        | 92       |                        |
+# | 車   | nsubj    | 転嫁      | 100      | 自動, 運転, は         |
+# | は   | case     | 車        | 92       |                        |
+# | 保険 | compound | 責任      | 92       |                        |
+# | 責任 | obj      | 転嫁      | 100      | 保険, を               |
+# | を   | case     | 責任      | 92       |                        |
+# | 製造 | compound | 者        | 92       |                        |
+# | 者   | obl      | 転嫁      | 100      | 製造, に               |
+# | に   | case     | 者        | 92       |                        |
+# | 転嫁 | ROOT     | 転嫁      | 100      | 車, 責任, 者, する, 。 |
+# | する | aux      | 転嫁      | 100      |                        |
+# | 。   | punct    | 転嫁      | 100      |                        |
+# +------+----------+-----------+----------+------------------------+

data/examples/japanese/noun_chunks.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"

data/examples/japanese/pos_tagging.rb CHANGED Viewed

@@ -1,10 +1,12 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
 nlp = Spacy::Language.new("ja_core_news_lg")
 doc = nlp.read("任天堂は1983年にファミコンを14,800円で発売した。")
-headings = ["text", "lemma", "pos", "tag", "dep"]
+headings = %w[text lemma pos tag dep]
 rows = []
 doc.each do |token|

data/examples/japanese/sentence_segmentation.rb CHANGED Viewed

@@ -1,11 +1,12 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 nlp = Spacy::Language.new("ja_core_news_sm")
 doc = nlp.read("これは文です。今私は「これは文です」と言いました。")
-puts "doc has annotation SENT_START: " + doc.has_annotation("SENT_START").to_s
+puts "doc has annotation SENT_START: #{doc.has_annotation("SENT_START")}"
 doc.sents.each do |sent|
   puts sent.text

data/examples/japanese/similarity.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 nlp = Spacy::Language.new("ja_core_news_lg")

data/examples/japanese/tokenization.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"

data/examples/japanese/visualizing_dependencies.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -6,7 +8,7 @@ nlp = Spacy::Language.new("ja_core_news_sm")
 sentence = "自動運転車は保険責任を製造者に転嫁する。"
 doc = nlp.read(sentence)
-dep_svg = doc.displacy(style: 'dep', compact: false)
+dep_svg = doc.displacy(style: "dep", compact: false)
 File.open(File.join(File.dirname(__FILE__), "test_dep.svg"), "w") do |file|
   file.write(dep_svg)

data/examples/japanese/visualizing_named_entities.rb CHANGED Viewed

@@ -1,13 +1,15 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
 nlp = Spacy::Language.new("ja_core_news_lg")
-sentence ="セバスチアン・スランが2007年にグーグルで自動運転車に取り組み始めたとき、社外の人間で彼のことを真剣に捉えている者はほとんどいなかった。"
+sentence = "セバスチアン・スランが2007年にグーグルで自動運転車に取り組み始めたとき、社外の人間で彼のことを真剣に捉えている者はほとんどいなかった。"
 doc = nlp.read(sentence)
-ent_html = doc.displacy(style: 'ent')
+ent_html = doc.displacy(style: "ent")
 File.open(File.join(File.dirname(__FILE__), "outputs/test_ent.html"), "w") do |file|
   file.write(ent_html)

data/examples/linguistic_features/ancestors.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -6,7 +8,7 @@ nlp = Spacy::Language.new("en_core_web_sm")
 sentence = "Credit and mortgage account holders must submit their requests"
 doc = nlp.read(sentence)
-headings = ["text", "dep", "n_lefts", "n_rights", "ancestors"]
+headings = %w[text dep n_lefts n_rights ancestors]
 rows = []
 root = doc.tokens.select do |t|
@@ -14,16 +16,16 @@ root = doc.tokens.select do |t|
   t.i == t.head.i
 end.first
-puts "The sentence: " + sentence
+puts "The sentence: #{sentence}"
 subject = Spacy::Token.new(root.lefts[0])
-puts "The root of the sentence is: " + root.text
-puts "The subject of the sentence is: " + subject.text
+puts "The root of the sentence is: #{root.text}"
+puts "The subject of the sentence is: #{subject.text}"
 subject.subtree.each do |descendant|
   # need to convert "ancestors" object from a python generator to a ruby array
-  ancestors = Spacy::generator_to_array(descendant.ancestors)
+  ancestors = Spacy.generator_to_array(descendant.ancestors)
   rows << [descendant.text, descendant.dep, descendant.n_lefts, descendant.n_rights, ancestors.map(&:text).join(", ")]
 end

data/examples/linguistic_features/entity_annotations_and_labels.rb CHANGED Viewed

@@ -1,12 +1,14 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
 nlp = Spacy::Language.new("en_core_web_sm")
-sentence = "San Francisco considers banning sidewalk delivery robots"
+sentence = "San Francisco considers banning sidewalk delivery robots"
 doc = nlp.read(sentence)
-headings = ["text", "ent_iob", "ent_iob_", "ent_type_"]
+headings = %w[text ent_iob ent_iob_ ent_type_]
 rows = []
 doc.each do |ent|

data/examples/linguistic_features/finding_a_verb_with_a_subject.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -5,16 +7,12 @@ nlp = Spacy::Language.new("en_core_web_sm")
 doc = nlp.read("Autonomous cars shift insurance liability toward manufacturers")
 results = []
 doc.each do |token|
-  if token.dep_ == "nsubj" && token.head.pos_ == "VERB"
-    results << token.head.text
-  end
+  results << token.head.text if token.dep_ == "nsubj" && token.head.pos_ == "VERB"
 end
 puts results.to_s
 # ["shift"]

data/examples/linguistic_features/information_extraction.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -10,21 +12,19 @@ sentence = "Credit and mortgage account holders must submit their requests"
 doc = nlp.read(sentence)
 texts = [
-    "Net income was $9.4 million compared to the prior year of $2.7 million.",
-    "Revenue exceeded twelve billion dollars, with a loss of $1b.",
+  "Net income was $9.4 million compared to the prior year of $2.7 million.",
+  "Revenue exceeded twelve billion dollars, with a loss of $1b."
 ]
 texts.each do |text|
   doc = nlp.read(text)
   doc.each do |token|
     if token.ent_type_ == "MONEY"
-      if ["attr", "dobj"].index token.dep_
-        subj = Spacy.generator_to_array(token.head.lefts).select{|t| t.dep == "nsubj"}
-        if !subj.empty?
-          puts(subj[0].text + " --> " + token.text)
-        end
-      elsif token.dep_ == "pobj" and token.head.dep == "prep"
-        puts token.head.head.text + " --> " + token.text
+      if %w[attr dobj].index token.dep_
+        subj = Spacy.generator_to_array(token.head.lefts).select { |t| t.dep == "nsubj" }
+        puts("#{subj[0].text}  --> #{token.text}") unless subj.empty?
+      elsif token.dep_ == "pobj" && token.head.dep == "prep"
+        puts "#{token.head.head.text} --> #{token.text}"
       end
     end
   end

data/examples/linguistic_features/iterating_children.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -5,20 +7,16 @@ nlp = Spacy::Language.new("en_core_web_sm")
 doc = nlp.read("Autonomous cars shift insurance liability toward manufacturers")
 results = []
 doc.each do |token|
-  if token.pos_ == "VERB"
-    token.children.each do |child|
-      if child.dep_ == "nsubj"
-        results << child.head.text
-      end
-    end
+  next unless token.pos_ == "VERB"
+  token.children.each do |child|
+    results << child.head.text if child.dep_ == "nsubj"
   end
 end
 puts results.to_s
 # ["shift"]

data/examples/linguistic_features/iterating_lefts_and_rights.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -5,13 +7,13 @@ nlp = Spacy::Language.new("en_core_web_sm")
 doc = nlp.read("bright red apples on the tree")
-puts "Text: " + doc.text
+puts "Text: #{doc.text}"
-puts "Words to the left of 'apple': " + doc[2].lefts.map(&:text).join(", ")
-puts "Words to the right of 'apple': " + doc[2].rights.map(&:text).join(", ")
+puts "Words to the left of 'apple': #{doc[2].lefts.map(&:text).join(", ")}"
+puts "Words to the right of 'apple': #{doc[2].rights.map(&:text).join(", ")}"
-puts "Num of the words to the left of 'apple': " + doc[2].n_lefts.to_s
-puts "Num of the words to the right of 'apple': " + doc[2].n_rights.to_s
+puts "Num of the words to the left of 'apple': #{doc[2].n_lefts}"
+puts "Num of the words to the right of 'apple': #{doc[2].n_rights}"
 # Text: bright red apples on the tree
 # Words to the left of 'apple': bright, red

data/examples/linguistic_features/lemmatization.rb CHANGED Viewed

@@ -1,10 +1,12 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
 nlp = Spacy::Language.new("en_core_web_sm")
 lemmatizer = nlp.get_pipe("lemmatizer")
-puts "Lemmatizer mode: " + lemmatizer.mode
+puts "Lemmatizer mode: #{lemmatizer.mode}"
 doc = nlp.read("I was reading the paper.")

data/examples/linguistic_features/named_entity_recognition.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -6,7 +8,7 @@ nlp = Spacy::Language.new("en_core_web_sm")
 sentence = "Apple is looking at buying U.K. startup for $1 billion"
 doc = nlp.read(sentence)
-headings = ["text", "start", "end", "label"]
+headings = %w[text start end label]
 rows = []
 doc.ents.each do |ent|

data/examples/linguistic_features/navigating_parse_tree.rb CHANGED Viewed

@@ -1,10 +1,12 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
 nlp = Spacy::Language.new("en_core_web_sm")
 lemmatizer = nlp.get_pipe("lemmatizer")
-puts "Lemmatizer mode: " + lemmatizer.mode
+puts "Lemmatizer mode: #{lemmatizer.mode}"
 doc = nlp.read("Autonomous cars shift insurance liability toward manufacturers")

data/examples/linguistic_features/noun_chunks.rb CHANGED Viewed

@@ -1,10 +1,12 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
 nlp = Spacy::Language.new("en_core_web_sm")
 lemmatizer = nlp.get_pipe("lemmatizer")
-puts "Lemmatizer mode: " + lemmatizer.mode
+puts "Lemmatizer mode: #{lemmatizer.mode}"
 doc = nlp.read("Autonomous cars shift insurance liability toward manufacturers")

data/examples/linguistic_features/pos_tagging.rb CHANGED Viewed

@@ -1,10 +1,12 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
 nlp = Spacy::Language.new("en_core_web_sm")
 doc = nlp.read("Apple is looking at buying U.K. startup for $1 billion")
-headings = ["text", "lemma", "pos", "tag", "dep", "shape", "is_alpha", "is_stop"]
+headings = %w[text lemma pos tag dep shape is_alpha is_stop]
 rows = []
 doc.each do |token|

data/examples/linguistic_features/retokenize_1.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"

data/examples/linguistic_features/retokenize_2.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -6,11 +8,11 @@ nlp = Spacy::Language.new("en_core_web_sm")
 sentence = "I live in New York"
 doc = nlp.read(sentence)
-puts "Before: " + doc.tokens.map(&:text).join(", ")
+puts "Before: #{doc.tokens.map(&:text).join(", ")}"
 doc.retokenize(3, 4)
-puts "After: " + doc.tokens.map(&:text).join(", ")
+puts "After: #{doc.tokens.map(&:text).join(", ")}"
 # Before: I, live, in, New, York
 # After: I, live, in, New York

data/examples/linguistic_features/rule_based_morphology.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -5,8 +7,8 @@ nlp = Spacy::Language.new("en_core_web_sm")
 doc = nlp.read("Where are you?")
-puts "Morph features of the third word: " + doc[2].morph.to_s
-puts "POS of the third word: " + doc[2].pos
+puts "Morph features of the third word: #{doc[2].morph}"
+puts "POS of the third word: #{doc[2].pos}"
 # Morph features of the third word: Case=Nom|Person=2|PronType=Prs
 # POS of the third word: PRON

data/examples/linguistic_features/sentence_segmentation.rb CHANGED Viewed

@@ -1,11 +1,12 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 nlp = Spacy::Language.new("en_core_web_sm")
 doc = nlp.read("This is a sentence. This is another sentence.")
-puts "doc has annotation SENT_START: " + doc.has_annotation("SENT_START").to_s
+puts "doc has annotation SENT_START: #{doc.has_annotation("SENT_START")}"
 doc.sents.each do |sent|
   puts sent.text

data/examples/linguistic_features/similarity.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -5,8 +7,8 @@ nlp = Spacy::Language.new("en_core_web_lg")
 doc1 = nlp.read("I like salty fries and hamburgers.")
 doc2 = nlp.read("Fast food tastes very good.")
-puts "Doc 1: " + doc1.text
-puts "Doc 2: " + doc2.text
+puts "Doc 1: #{doc1.text}"
+puts "Doc 2: #{doc2.text}"
 puts "Similarity: #{doc1.similarity(doc2)}"
 # Doc 1: I like salty fries and hamburgers.

data/examples/linguistic_features/similarity_between_lexemes.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"

data/examples/linguistic_features/similarity_between_spans.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -5,14 +7,14 @@ nlp = Spacy::Language.new("en_core_web_lg")
 doc1 = nlp.read("I like salty fries and hamburgers.")
 doc2 = nlp.read("Fast food tastes very good.")
-puts "Doc 1: " + doc1.text
-puts "Doc 2: " + doc2.text
+puts "Doc 1: #{doc1.text}"
+puts "Doc 2: #{doc2.text}"
 puts "Similarity: #{doc1.similarity(doc2)}"
 span1 = doc1.span(2, 2) # salty fries
-span2 = doc1.span(5 .. 5) # hamberger
-puts "Span 1: " + span1.text
-puts "Span 2: " + span2.text
+span2 = doc1.span(5..5) # hamberger
+puts "Span 1: #{span1.text}"
+puts "Span 2: #{span2.text}"
 puts "Similarity: #{span1.similarity(span2)}"
 # Doc 1: I like salty fries and hamburgers.

data/examples/linguistic_features/tokenization.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
@@ -5,7 +7,7 @@ nlp = Spacy::Language.new("en_core_web_sm")
 doc = nlp.read("Apple is looking at buying U.K. startup for $1 billion")
-headings = [1,2,3,4,5,6,7,8,9,10,11]
+headings = [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11]
 row = []
 doc.each do |token|
@@ -20,4 +22,3 @@ puts table
 # +-------+----+---------+----+--------+------+---------+-----+---+----+---------+
 # | Apple | is | looking | at | buying | U.K. | startup | for | $ | 1  | billion |
 # +-------+----+---------+----+--------+------+---------+-----+---+----+---------+

data/examples/rule_based_matching/creating_spans_from_matches.rb CHANGED Viewed

@@ -1,16 +1,18 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 require "terminal-table"
 nlp = Spacy::Language.new("en_core_web_lg")
 matcher = nlp.matcher
-matcher.add("US_PRESIDENT", [[{LOWER: "barack"}, {LOWER: "obama"}]])
+matcher.add("US_PRESIDENT", [[{ LOWER: "barack" }, { LOWER: "obama" }]])
 doc = nlp.read("Barack Obama was the 44th president of the United States")
 matches = matcher.match(doc)
 matches.each do |match|
-  span = Spacy::Span.new(doc, start_index: match[:start_index], end_index: match[:end_index], options: {label: match[:match_id]})
-  puts span.text + " / " + span.label
+  span = Spacy::Span.new(doc, start_index: match[:start_index], end_index: match[:end_index], options: { label: match[:match_id] })
+  puts "#{span.text} / #{span.label}"
 end
 # Barack Obama / US_PRESIDENT

data/examples/rule_based_matching/matcher.rb CHANGED Viewed

@@ -1,8 +1,10 @@
+# frozen_string_literal: true
 require "ruby-spacy"
 nlp = Spacy::Language.new("en_core_web_sm")
-pattern = [[{LOWER: "hello"}, {IS_PUNCT: true}, {LOWER: "world"}]]
+pattern = [[{ LOWER: "hello" }, { IS_PUNCT: true }, { LOWER: "world" }]]
 matcher = nlp.matcher
 matcher.add("HelloWorld", pattern)
@@ -10,7 +12,7 @@ matcher.add("HelloWorld", pattern)
 doc = nlp.read("Hello, world! Hello world!")
 matches = matcher.match(doc)
-matches.each do | match |
+matches.each do |match|
   string_id = nlp.vocab_string_lookup(match[:match_id])
   span = doc.span(match[:start_index]..match[:end_index])
   puts "#{string_id}, #{span.text}"