RubyGems - poetize - Versions diffs - 0.0.1 - Mend

poetize 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

data/.gitignore +6 -0
data/Gemfile +4 -0
data/README.md +55 -0
data/Rakefile +1 -0
data/analyzer/analyzer.rb +44 -0
data/analyzer/strophe_analyzer.rb +84 -0
data/bin/poetize +37 -0
data/lib/file_handler.rb +16 -0
data/lib/hyphenator.rb +78 -0
data/lib/poetize.rb +5 -0
data/lib/poetize/version.rb +3 -0
data/lib/text_handler.rb +69 -0
data/model/poem.rb +25 -0
data/model/strophe.rb +20 -0
data/poetize.gemspec +24 -0
data/resources/syllables_dict.txt +156176 -0
data/test/file_handler_spec.rb +18 -0
data/test/hyphenator_spec.rb +25 -0
data/test/poem_spec.rb +22 -0
data/test/samples/01.txt +34 -0
data/test/samples/02_ballad.txt +26 -0
data/test/samples/02_doubled.txt +62 -0
data/test/samples/02_full.txt +32 -0
data/test/samples/02_original.txt +30 -0
data/test/spec_helper.rb +28 -0
data/test/strophe_analyzer_spec.rb +33 -0
data/test/strophe_spec.rb +17 -0
data/test/text_handler_spec.rb +20 -0
metadata +103 -0

data/.gitignore ADDED

@@ -0,0 +1,6 @@
+*.swp
+.DS_Store
+*.gem
+.bundle
+Gemfile.lock
+pkg/*

data/Gemfile ADDED

@@ -0,0 +1,4 @@
# Fetch gems over HTTPS so downloads cannot be tampered with in transit.
source "https://rubygems.org"
# Gem's dependencies specified in poetize.gemspec
gemspec

data/README.md ADDED

@@ -0,0 +1,55 @@
+#ABOUT
+Our goal is to provide a tool that parses a poem and analyzes it according to the following:
+* Strophes
+    * Name (based on number of verses) [done]
+    * Type (based on verse metrics)
+* Verses
+    * Syllable division
+    * Grammatical
+    * Poetical
+    * Metric and name
+    * Cadency (rhythm)
+* Poem
+    * Number of strophes [done]
+    * Number of verses [done]
+    * Rhymes
+    * Name (based on strophe structure)
+We are focusing on the Portuguese (Brazilian) language, since it is our native language and phonetics vary from language to language.
+For more details and examples, see our wiki: https://github.com/lfilho/poetize/wiki
+#USAGE
+Make sure the poetize file is executable:
+`$ chmod +x poetize`
+Then run in your shell:
+`$ poetize file_path [, ignore_line[, ignore_line[,...]]]`
+Each ignore_line argument is the number of a line you want the program to ignore (e.g. the title, author, creation date, dedication, etc.)
+##Usage examples:
+`poetize ./samples/my_poem.txt`
+`poetize /home/user/docs/love_poem.txt 1 2 13 14`
+#REFERENCES
+Good sites for learning about "poetic science":
+* For the Portuguese language:
+    * http://mpbsapiens.com/ciencia-poetica/
+    * http://pt.wikipedia.org/wiki/Versifica%C3%A7%C3%A3o
+    * http://www.portaldalinguaportuguesa.org/?action=divisao&page=present
+* For the English language:
+    * http://en.wikipedia.org/wiki/Poem
+#ABOUT THE DEVELOPERS
+We started this project to learn Ruby and TDD so expect it to be noobly coded :-) Feel free to refactor the code and contribute to our learning experience ;-)

data/Rakefile ADDED

@@ -0,0 +1 @@
+require "bundler/gem_tasks"

data/analyzer/analyzer.rb ADDED

@@ -0,0 +1,44 @@
+# coding: utf-8
+$app_path = File.dirname(__FILE__) + '/../'
+require $app_path + 'lib/file_handler'
+require $app_path + 'lib/hyphenator'
+require $app_path + 'analyzer/strophe_analyzer'
# Builds the plain-text report printed for a poem: strophe/verse totals,
# the per-strophe findings of StropheAnalyzer, and the poem body with every
# word hyphenated.
class Analyzer
  # @param poem [Poem] object answering +number_of_strophes+,
  #   +number_of_verses+ and +body+ (an Array of line Strings); it is also
  #   handed to StropheAnalyzer.new
  def initialize(poem)
    @poem = poem
    @ident = 3 # number of spaces used to indent report entries
  end

  # Produces the complete report.
  #
  # @return [String] multi-line report, terminated by a newline
  def analyze
    prefix = "#{' ' * @ident}- "
    lines = ["This poem:"]
    lines << "#{prefix}Contains #{@poem.number_of_strophes} strophes;"
    lines << "#{prefix}Contains #{@poem.number_of_verses} verses;"
    lines << "As for the strophes:"
    analyze_strophes.each { |finding| lines << "#{prefix}#{finding}" }
    lines << "Grammatical syllable divison:"
    lines.join("\n") + "\n" + divide_grammatically
  end

  private

  # @return [Array<String>] one sentence per finding, as returned by
  #   StropheAnalyzer#analyze
  def analyze_strophes
    StropheAnalyzer.new(@poem).analyze
  end

  # Hyphenates every word of every body line.
  #
  # A single Hyphenator is shared by all words: building one per word
  # repeated the hyphenator's set-up work for each word of the poem.
  #
  # @return [String] the indented body; every word is followed by one space
  #   and every line by a newline
  def divide_grammatically
    hyphenator = Hyphenator.new
    indent = ' ' * @ident
    @poem.body.map do |line|
      words = line.split(' ').map { |word| "#{hyphenator.hyphenate(word)} " }
      "#{indent}#{words.join}\n"
    end.join
  end
end

data/analyzer/strophe_analyzer.rb ADDED

@@ -0,0 +1,84 @@
+# coding: utf-8
+$app_path = File.dirname(__FILE__) + '/../'
+require $app_path + 'lib/file_handler'
# Describes the strophes of a poem: names each strophe after its number of
# verses and checks whether the strophe layout matches a known fixed form.
class StropheAnalyzer
  attr_accessor :number_of_verses, :number_of_strophes

  # @param poem [Poem] object answering +strophes+ (each strophe answering
  #   +number_of_verses+), +number_of_strophes+ and +number_of_verses+
  def initialize(poem)
    @strophes = poem.strophes
    @analyzis_output = []
    @number_of_strophes = poem.number_of_strophes
    @number_of_verses = poem.number_of_verses
  end

  # Runs every analysis.
  #
  # @return [Array<String>] one sentence per finding
  def analyze
    # Start from a clean slate so calling #analyze twice does not repeat
    # every finding.
    @analyzis_output = []
    analyze_names
    analyze_fixed_form
    @analyzis_output
  end

  # Detects the "ballad" layout: all strophes in odd positions (1st, 3rd, ...)
  # have the same number of verses and all strophes in even positions have
  # half that number (integer division). When it matches, a sentence is
  # appended to the findings.
  #
  # A poem needs at least two strophes to qualify; with fewer there is no
  # in-between strophe to describe (this case used to crash on
  # Strophe.name(nil)).
  #
  # @return [Boolean]
  def fixed_form_ballad?
    # Computed from the strophes themselves so the check also works when it
    # is called without a prior #analyze.
    verse_counts = @strophes.map { |strophe| strophe.number_of_verses }
    pairs = verse_counts.each_slice(2).to_a
    odd_verses = pairs.map { |pair| pair[0] }
    even_verses = pairs.map { |pair| pair[1] }.compact
    return false if odd_verses.empty? || even_verses.empty?

    main = odd_verses.first
    return false unless odd_verses.all? { |count| count == main }
    return false unless even_verses.all? { |count| count == main / 2 }

    @analyzis_output << "Which makes this poem is a Ballad! (" +
      Strophe.name(main) + " verses with " +
      Strophe.name(even_verses.first) + " verses between them)."
    true
  end

  # @return [Boolean] always false for now
  def fixed_form_italian_sonet?
    # TODO
    false
  end

  # @return [Boolean] always false for now
  def fixed_form_english_sonet?
    # TODO
    false
  end

  private

  # Groups the 1-based strophe positions by verse count and appends one
  # sentence per group, e.g. "Strophes 1, 3 and 5 are <name>s".
  def analyze_names
    positions_by_count = Hash.new { |hash, count| hash[count] = [] }
    @strophes.each_with_index do |strophe, index|
      positions_by_count[strophe.number_of_verses] << index + 1
    end

    positions_by_count.each do |count, positions|
      name = Strophe.name(count)
      if positions.size == 1
        @analyzis_output << "Strophe #{positions.first} is #{name}"
      else
        listing = "#{positions[0..-2].join(', ')} and #{positions.last}"
        @analyzis_output << "Strophes #{listing} are #{name}s"
      end
    end
  end

  # Tries the fixed forms in order and stops at the first one that matches.
  def analyze_fixed_form
    fixed_form_ballad? || fixed_form_italian_sonet? || fixed_form_english_sonet?
    nil
  end
end

data/bin/poetize ADDED

@@ -0,0 +1,37 @@
+#!/usr/bin/env ruby
+$app_path = File.dirname(__FILE__) + '/../'
+require $app_path + 'lib/text_handler'
+require $app_path + 'lib/file_handler'
+require $app_path + 'model/poem'
+require $app_path + 'analyzer/analyzer'
# Command-line flow: read the poem file, pull out the lines the user asked to
# ignore (kept as metadata), normalize both parts and print the analysis.
if ARGV.empty?
  puts <<-eol
== Usage:
    poetize file_path [, ignore_line[, ignore_line[,...]]]
== Examples:
    poetize /home/user/docs/my_poem.txt
    poetize /home/user/docs/my_poem.txt 1 2 13 14
    eol
  exit
end

file_path = ARGV[0]

# File.exists? was removed in Ruby 3.2. A missing file is reported and aborts
# the run; continuing with an empty text only crashed further down.
unless File.exist?(file_path)
  warn "poetize: cannot find file #{file_path}"
  exit 1
end
text = FileHandler.get_file_contents(file_path)

# Line numbers on the command line are 1-based; convert them to indices.
# Duplicates and numbers outside the file are dropped: "0" or a non-numeric
# argument would otherwise become index -1 and remove the last line.
ignore_lines = ARGV.drop(1).map { |n| n.to_i - 1 }
ignore_lines = ignore_lines.uniq.select { |n| n >= 0 && n < text.size }.sort

# Delete from the highest index down so earlier deletions do not shift the
# position of lines that still have to be removed.
metadata = []
ignore_lines.reverse_each { |n| metadata << text.delete_at(n) }

metadata = TextHandler.normalize_text(metadata.reverse)
body = TextHandler.normalize_text(text)
poem = Poem.new(metadata, body)
puts Analyzer.new(poem).analyze

data/lib/file_handler.rb ADDED

@@ -0,0 +1,16 @@
# Reads text files from disk for the rest of the application.
class FileHandler
  # Reads +file_path+ and returns its lines.
  #
  # @param file_path [String] path of the file to read
  # @return [Array<String>] every line of the file, in order, each keeping
  #   its line terminator
  # @raise [RuntimeError] carrying the message of the underlying error when
  #   the file cannot be opened or read
  def self.get_file_contents(file_path)
    File.readlines(file_path)
  rescue StandardError => e
    # Only StandardError is translated: rescuing Exception would also catch
    # interrupts and exit requests. The error is re-raised as a RuntimeError
    # with the same message, which is what callers received before.
    raise e.message
  end
end

data/lib/hyphenator.rb ADDED

@@ -0,0 +1,78 @@
+# encoding: utf-8
+require 'rubygems'
+require 'text-hyphen'
# Hyphenates words with Text::Hyphen configured for the 'pt' language.
#
# Accented characters are replaced by their plain letters before the word is
# handed to Text::Hyphen and are written back into the hyphenated result
# afterwards.
class Hyphenator
  ACCENTED_CHARS = /[çãâäõáéíóúêôàü]/

  # Plain letter for every character matched by ACCENTED_CHARS.
  UNACCENTED = {
    'ç' => 'c',
    'ã' => 'a', 'â' => 'a', 'ä' => 'a', 'à' => 'a', 'á' => 'a',
    'é' => 'e', 'ê' => 'e',
    'í' => 'i',
    'õ' => 'o', 'ô' => 'o', 'ó' => 'o',
    'ú' => 'u', 'ü' => 'u'
  }.freeze

  def initialize
    @hyphenator = Text::Hyphen.new do |h|
      h.left = 0
      h.right = 0
      h.language = 'pt'
    end
    # character index in the word => accented character found there
    @orig_accented_chars_pos = {}
  end

  # Hyphenates a single word.
  #
  # @param word [String] the word; it is not modified
  # @return [String] the word as rendered by Text::Hyphen#visualize, with the
  #   original accented characters restored
  def hyphenate(word)
    plain = remove_accents(word)
    put_accents_back(plain, @hyphenator.visualize(plain))
  ensure
    # Always forget the recorded accents, even when hyphenation raised, so
    # they cannot be written into the next word.
    clean
  end

  private

  # Writes the recorded accented characters into +hyphenated_word+.
  #
  # Each accented character moves right by one place for every break position
  # at or before its original index.
  # NOTE(review): assumes Text::Hyphen#hyphenate returns the character indices
  # before which #visualize inserts a one-character separator -- confirm
  # against the text-hyphen documentation.
  def put_accents_back(word, hyphenated_word)
    return hyphenated_word if @orig_accented_chars_pos.empty?

    dashes_pos = @hyphenator.hyphenate(word)
    @orig_accented_chars_pos.keys.sort.each do |pos|
      last_dash = dashes_pos.rindex { |dash| pos >= dash }
      offset = last_dash ? last_dash + 1 : 0
      hyphenated_word[pos + offset] = @orig_accented_chars_pos[pos]
    end
    hyphenated_word
  end

  # Returns a copy of +word+ with every accented character replaced by its
  # plain letter, remembering each replaced character and its index.
  def remove_accents(word)
    plain = word.dup
    word.each_char.with_index do |char, pos|
      replacement = UNACCENTED[char]
      next unless replacement
      @orig_accented_chars_pos[pos] = char
      plain[pos] = replacement
    end
    plain
  end

  # Forgets the accents recorded for the current word.
  def clean
    @orig_accented_chars_pos = {}
  end
end

data/lib/poetize.rb ADDED

@@ -0,0 +1,5 @@
+require "poetize/version"
+module Poetize # Namespace of the gem; an empty placeholder in this file.
+  # TODO
+end

data/lib/poetize/version.rb ADDED

@@ -0,0 +1,3 @@
module Poetize
  # Version string of the gem. Frozen so the constant cannot be modified in
  # place at runtime.
  VERSION = "0.0.1".freeze
end

data/lib/text_handler.rb ADDED

@@ -0,0 +1,69 @@
# Adds #blank? to every object (nil included).
class Object
  # Tells whether the receiver holds nothing meaningful.
  #
  # @return [Boolean] true for nil, for a String that is empty or made only of
  #   whitespace, and for any other object whose #empty? is true; false
  #   otherwise (including objects that have no #empty?)
  def blank?
    return true if nil?
    # \A and \z anchor the whole string. With ^ and $ a text that merely
    # contained one empty line (e.g. "abc\n\ndef") was reported as blank.
    return !(self =~ /\A\s*\z/).nil? if is_a?(String)
    respond_to?(:empty?) ? empty? : false
  end
end
# Cleans up raw poem text: trims lines, drops leading/trailing blank lines and
# reduces the blank lines between strophes to a single empty string.
class TextHandler
  # Trims a line and collapses runs of spaces into one space.
  #
  # @param string [String] the raw line; it is not modified
  # @return [String] the cleaned-up copy
  def self.normalize_line(string)
    string.strip.squeeze(' ')
  end

  # Normalizes a whole text.
  #
  # Blank lines are interpreted per run of consecutive blank lines:
  # * when no run is longer than one line, every blank line becomes "";
  # * when at least one run has two or more lines (a double-spaced text),
  #   single blank lines are dropped and each longer run becomes one "".
  # Non-blank lines are never merged, even when two consecutive lines are
  # identical.
  #
  # @param text [String, Array<String, nil>] the text, either as one String
  #   (any of \n, \r\n or \r as line terminator) or as an Array of lines;
  #   nil entries are ignored and the argument is not modified
  # @return [Array<String>] normalized lines; "" marks a strophe separator
  # @raise [RuntimeError] when +text+ is neither a String nor an Array
  def self.normalize_text(text)
    unless text.is_a?(String) || text.is_a?(Array)
      raise "Argument must be a String or a Array"
    end

    # Trying to normalize for different OSes
    lines = text.is_a?(String) ? text.gsub(/\015\012?/, "\n").split(/\n/) : text

    # Each group is [blank?, lines of that run].
    groups = remove_padding_lines(lines).chunk { |line| line.strip.empty? }.to_a
    double_spaced = groups.any? { |blank, run| blank && run.size > 1 }

    groups.flat_map do |blank, run|
      if !blank
        run.map { |line| normalize_line(line) }
      elsif double_spaced && run.size == 1
        []
      else
        ['']
      end
    end
  end

  # The two helpers below stay publicly callable, as before: a bare `private`
  # does not apply to methods defined with `def self.`.

  # Removes the blank lines at both ends of +array+.
  #
  # @param array [Array<String, nil>] lines; not modified
  # @return [Array<String>] new array without nil entries and without leading
  #   or trailing blank lines
  def self.remove_padding_lines(array)
    remove_first_lines(remove_first_lines(array).reverse).reverse
  end

  # Removes nil entries and the blank lines at the start of +array+.
  #
  # @param array [Array<String, nil>] lines; not modified
  # @return [Array<String>] new array starting at the first non-blank line
  def self.remove_first_lines(array)
    array.compact.drop_while { |line| line.strip.empty? }
  end
end

data/model/poem.rb ADDED

@@ -0,0 +1,25 @@
+$app_path = File.dirname(__FILE__) + '/../'
+require $app_path + 'model/strophe'
require 'cgi'

# A poem: its metadata lines (title, author, ...) and its body, split into
# strophes.
class Poem
  attr_accessor :metadata, :body, :strophes, :number_of_strophes, :number_of_verses

  # @param metadata [Array<String>] lines that are not part of the poem body
  # @param body [Array<String>] body lines; an empty string separates two
  #   strophes
  def initialize(metadata, body)
    @metadata = metadata
    @body = body
    @strophes = split_in_strophes(body)
    @number_of_verses = @strophes.inject(0) { |sum, strophe| sum + strophe.number_of_verses }
    @number_of_strophes = @strophes.size
  end

  # Groups consecutive non-empty lines into strophes.
  #
  # @param body [Array<String>] body lines
  # @return [Array<Strophe>] one Strophe per run of non-empty lines
  def split_in_strophes(body)
    runs = body.chunk { |line| line.empty? }
    runs.reject { |blank, _lines| blank }.map { |_blank, lines| Strophe.new(lines) }
  end

  # @return [String] metadata lines, an empty line, then the body lines
  def to_s
    "#{@metadata.join("\n")}\n\n#{@body.join("\n")}"
  end

  # @return [String] same content as #to_s for use inside an HTML page: the
  #   text is HTML-escaped and line breaks become <br /> tags
  def to_html
    # Escape first so characters such as < and & in the poem cannot be read
    # as markup; the <br /> tags added afterwards stay intact.
    CGI.escapeHTML(to_s).gsub("\n", "<br />")
  end
end

data/model/strophe.rb ADDED

@@ -0,0 +1,20 @@
+# coding: utf-8
# A strophe: a group of consecutive verses of a poem.
class Strophe
  # Strophe names indexed by number of verses (index 0 is unused); the last
  # entry is the name given to any strophe with more than ten verses.
  # NOTE(review): "Quintilhas" is the only plural entry -- confirm whether
  # "Quintilha" was intended (callers append an "s" to build plurals).
  NAMES = ["", 'Monóstico', "Dístico", "Terceto", "Quadra", "Quintilhas",
           "Sextilha", "Sétima", "Oitava", "Nona", "Décima",
           "Livre ou Polimérica"].freeze

  attr_accessor :number_of_verses, :verses

  # @param arr [Array<String>] the verses of the strophe
  def initialize(arr)
    @verses = arr
    @number_of_verses = arr.size
  end

  # Name of a strophe with +i+ verses.
  #
  # This method shadows Module#name, so a call without an argument falls back
  # to the standard behaviour and returns the class name. (The previous
  # default referred to an instance method and raised NameError.)
  #
  # @param i [Integer, nil] number of verses
  # @return [String] the strophe name, or the class name when +i+ is omitted
  def self.name(i = nil)
    return super() if i.nil?
    return NAMES.last if i > 10
    NAMES[i]
  end

  # Name of this strophe, or of a strophe with +i+ verses when given.
  #
  # @param i [Integer] number of verses; defaults to this strophe's own count
  # @return [String]
  def name(i = number_of_verses)
    Strophe.name(i)
  end
end
+end