RubyGems - presume - Versions diffs - 0.0.2 - Mend

presume 0.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26) hide show

checksums.yaml +7 -0
data/Gemfile +4 -0
data/README.Rdoc +104 -0
data/Rakefile +7 -0
data/lib/classes/bullet.rb +18 -0
data/lib/classes/classifide.rb +81 -0
data/lib/classes/header.rb +170 -0
data/lib/classes/resume_builder.rb +375 -0
data/lib/classes/resume_classifier.rb +137 -0
data/lib/classes/resume_searcher.rb +4 -0
data/lib/classes/searchable.rb +40 -0
data/lib/classes/searchables.rb +24 -0
data/lib/definitions/classifications.rb +24 -0
data/lib/definitions/machines.rb +11 -0
data/lib/definitions/regex.rb +79 -0
data/lib/presume.rb +123 -0
data/sample_resume.docx +0 -0
data/spec/classifide_spec.rb +17 -0
data/spec/header_spec.rb +73 -0
data/spec/presume_spec.rb +72 -0
data/spec/resume_builder_spec.rb +213 -0
data/spec/resume_classifier_spec.rb +140 -0
data/spec/searchable_spec.rb +34 -0
data/spec/searchables_spec.rb +22 -0
data/spec/spec_helper.rb +1 -0
metadata +140 -0

checksums.yaml ADDED

@@ -0,0 +1,7 @@
+---
+SHA1:
+  metadata.gz: b80339c1863dc69cf2e8be22e594a58bde43dbda
+  data.tar.gz: b7c250b6fb461ade98ee62d194aac7c9c8f5532a
+SHA512:
+  metadata.gz: 3048dc8d33cca2e7c141a6dafb89c4ff769ca2a3ba029c5159abda211ac334f8cd7ad8f1030441743ed7e2232f9ca9b6788a8eff77f88bafb1ec0246731c225c
+  data.tar.gz: 3b50bf15404471cb27cfaded216de75cffcd053e4fdc822065a01c7e6650988655ccafb5b8b460f0c46b8f7ab8d35865c85307456bee3cecc0fbe2d55699b8ef

data/Gemfile ADDED

@@ -0,0 +1,4 @@
+source 'https://rubygems.org' # gem source used when resolving dependencies
+# Specify your gem's dependencies in parse_resume.gemspec
+gemspec # take the dependency list from the gem's .gemspec file

data/README.Rdoc ADDED

@@ -0,0 +1,104 @@
+# Presume
+A resume parser coupled with fundamental Applicant Tracking System Technology
+### Description
+Presume is the first open-source Applicant Tracking System technology for Ruby-on-Rails developers. It works by parsing the resume into the CVSTOM.org resume format Section >> Header >> Bullets, and then taking an input of skills and their expected duration to check for in that resume.
+### Features
+Parse resumes
+Checks resumes for specific skills, positions, and their duration
+### Resume Parser:
+    require 'presume'
+    # Sample input
+    resume_text = "Leigh Silverstein\n123 Ave.\n\nWork Experience\nProject Coordinator"
+    # Parse resume with string input
+    presume = Presume.new(resume_text)
+    # Retrieve Sections
+    presume.sections
+    #=> {0 => SectionObject1, 1 => SectionObject2}
+    # SectionObject Functions
+    SectionObject.text
+    #=> "Work Experience"
+    SectionObject.children
+    #=> [ HeaderObject1, HeaderObject2 ]
+    # HeaderObject Functions
+    HeaderObject.text
+    #=> "Project Coordinator, Projects4Ever Inc., Toronto, Ontario, Jan 2011-Jul 2012"
+    HeaderObject.duration
+    #=> 1.5 (In Years)
+    HeaderObject.start_time_text
+    #=> Jan 2011
+    HeaderObject.end_time_text
+    #=> Jul 2012
+    HeaderObject.children
+    #=> [ BulletObject1, BulletObject2 ]
+    # BulletObject inherits all functions from the HeaderObject except children
+### ATS:
+    # After parsing a resume
+    # Checking for certain position or education ("name", expected_minimum_duration_in_years)
+    intake_hash = {"Project Coordinator|Project Assistant" => 1, "Bachelors Finance|BF|B.F." => 4}
+    # Check for positions
+    presume.positions?(intake_hash)
+    #=> {"Project Coordinator|Project Assistant" => [ MatchedHeaderObject1 ], "Bachelors Finance|BF|B.F." => [ MatchedHeaderObject2 ]}
+    # Checking for certain skills ("name", expected_minimum_duration_in_years)
+    intake_hash = {"database management" => 1, "clear communication" => 0}
+    # Check for skills
+    presume.skills?(intake_hash)
+    #=> {"database management" => [ MatchedBulletObject1 ], "clear communication" => [ MatchedBulletObject2 ]}
+    #Note that matched headers and bullets are the same classes as the headers and bullets discussed in the resume parsing section
+### Requirements
+* EngTagger
+* Ruby-Stemmer
+* Docx (for testing)
+### Install
+    (sudo) gem install presume
+### Author
+of this Ruby library
+* Leigh Silverstein (lsilversteinto [at] gmail.com)
+### License
+This library is distributed under the GPL.  Please see the LICENSE file.

data/Rakefile ADDED

@@ -0,0 +1,7 @@
+require "bundler/gem_tasks" # rake tasks shipped with Bundler for gems
+require "rspec/core/rake_task" # provides RSpec::Core::RakeTask
+RSpec::Core::RakeTask.new # defines the rake task that runs the specs (referenced as :spec below)
+task :default => :spec # plain `rake` runs the specs
+task :test => :spec # `rake test` also runs the specs

data/lib/classes/bullet.rb ADDED

@@ -0,0 +1,18 @@
+class Bullet < Header
+	attr_accessor :text, :id
+	def initialize(classifide, header)
+		both_classifications.each do |classification|
+			instance_variable_set(("@" + classification).to_sym, header.send(classification))
+		end
+		@header_text = @text
+		@header_id = @id
+		@text = classifide.text
+		@id = classifide.id
+	end
+end

data/lib/classes/classifide.rb ADDED

@@ -0,0 +1,81 @@
+class Classifide
+    attr_accessor *both_classifications_symboled
+	def initialize(classifide)
+		both_classifications.each do |classification|
+			instance_variable_set(("@" + classification).to_sym, classifide[classification.to_sym])
+		end
+	end
+    def more_words_than?(number)
+        @number_of_words > number
+    end
+    def name?
+        @name.nil?
+    end
+	def many_words?
+		@many_words
+	end
+    def email?
+        !@email.nil?
+    end
+    def type?
+        @type.nil?
+    end
+    def address?
+       !@address.nil?
+    end
+    def phone?
+       !@phone.nil?
+    end
+    def verbs?
+       !@verbs.nil?
+    end
+    def date?
+        if @dates.nil? and @dates_2.nil?
+            false
+        else
+            true
+        end
+    end
+    def institution?
+       if @schools.nil? and @companies.nil?
+            false
+        else
+            true
+        end
+    end
+    def profession?
+       !@professions.nil?
+    end
+    def city?
+       !@cities.nil?
+    end
+    def section?
+        !@section.nil?
+    end
+	def set_new_value(attribute, new_value)
+		instance_variable_set(("@" + attribute).to_sym, new_value)
+	end
+    def children
+        @presume.all_types[@id].drop(1)
+    end
+end

data/lib/classes/header.rb ADDED

@@ -0,0 +1,170 @@
+class Header < Classifide
+	attr_accessor :clean_profession
+	def initialize(classifide)
+		both_classifications.each do |classification|
+			instance_variable_set(("@" + classification).to_sym, classifide.send(classification))
+		end
+	end
+	def remove_date
+		@clean_profession = @text.gsub(regex_dates, "")
+	end
+	def remove_city
+		@clean_profession.gsub!(regex_cities, "")
+	end
+	def remove_institution
+		@clean_profession.gsub!(regex_companies, "")
+		@clean_profession.gsub!(regex_schools, "")
+	end
+	def get_professions
+		@clean_profession.gsub!(regex_companies, "")
+	end
+	def remove_all_but_profession
+		@clean_profession = @clean_profession[regex_professions]
+	end
+    def season?
+    	!@text[regex_season].nil?
+	end
+    def split_date
+    	@prepare_split_date = @dates.gsub(Regexp.new('( |)(to\\b|-|–)( |)', 'i'), "{+)")
+    	@split_date = @prepare_split_date.split("{+)")
+    	if @split_date.kind_of?(Array)
+    		@split_date
+    	else
+    		@split_date = [@dates]
+    	end
+    end
+    def start_time_text?
+    	if date?
+	    	split_date[0]
+	    end
+    end
+    def start_time_number
+    	if date?
+			@start_time_number = start_year.to_i + convert_month_to_number(start_month)
+		else
+			nil
+		end
+    end
+    def end_time_text?
+    	if @end_time_text.nil?
+	    	if date?
+		    	if end_date_exists?
+		    		@end_time_text = split_date[1]
+		    	end
+		    end
+		else
+			@end_time_text
+		end
+    end
+    def current?
+    	!end_time_text?[regex_current].nil?
+    end
+    def end_time_number
+		if date?
+			if end_date_exists?
+				if current?
+					@end_time_number = Date.today.strftime("%Y").to_i + (Date.today.strftime("%m")).to_i/12
+				else
+					@end_time_number = end_year.to_i + convert_month_to_number(end_month)
+				end
+			end
+		end
+    end
+    def end_date_exists?
+    	split_date.length == 2
+    end
+    def start_year
+    	@start_year = split_date[0][regex_year]
+    end
+    def start_month
+    	@start_month = split_date[0][regex_month]
+    	if @start_month.nil?
+    		@start_month = split_date[0][regex_season]
+	    	if @start_month.nil?
+	    		@start_month = "Jan"
+	    	end
+	    end
+	    @start_month
+	end
+    def end_year
+    	@end_year = split_date[1][regex_year]
+    end
+    def end_month
+    	if @end_month.nil?
+    		@end_month = split_date[1][regex_month]
+    		if @end_month.nil?
+    			@end_month = "Jan"
+    		end
+    		@end_month
+    	else
+    		@end_month
+    	end
+    end
+    def duration
+    	if season?
+    		@duration = 3/12
+    	else
+    		@duration = end_time_number - start_time_number
+    	end
+    end
+    def convert_season_to_number(season)
+    	case season.downcase
+    		when "winter"
+    			0
+    		when "spring"
+    			3
+    		when "summer"
+    			6
+    		when "fall"
+    			9
+    	end
+    end
+    def convert_month_to_number(month)
+    	if season?
+			@converted_month = convert_season_to_number(month)
+		else
+			@converted_month = Date::ABBR_MONTHNAMES.index(month[0..2])
+		end
+		@converted_month_of_12 = (@converted_month / 12).to_f
+	end
+	def split_cities
+		@location = @cities.split(", ")
+	end
+	def just_city
+		split_cities[0]
+	end
+	def just_state
+		split_cities[1]
+	end
+end

data/lib/classes/resume_builder.rb ADDED

@@ -0,0 +1,375 @@
+class ResumeBuilder
+    attr_accessor :classifides, :resume
+    def initialize(classified_lines)
+        @classifides = classified_lines
+        @length = classified_lines.length
+    end
+    def set_classifide(line_number)
+        @classifide = @classifides[line_number]
+        @line_number = line_number
+    end
+    def header_line_number?
+        ((@line_number + 1)/@length).to_f <= 0.10
+    end
+    def check_for_name_in_header
+        if !@classifide.many_words? and !@classifide.name? and @classifide.type?
+            @classifide.type = "name"
+        end
+    end
+    def check_for_email_in_header
+        if !@classifide.many_words? and @classifide.email? and @classifide.type?
+            @classifide.type = "email"
+        end
+    end
+    def check_for_address_in_header
+        if @classifide.address? and @classifide.type?
+            @classifide.type = "address"
+        end
+    end
+    def check_for_phone_in_header
+        if !@classifide.many_words? and @classifide.phone? and @classifide.type?
+            @classifide.type = "phone"
+        end
+    end
+    def check_header
+        if header_line_number?
+            check_for_name_in_header
+            check_for_email_in_header
+            check_for_address_in_header
+            check_for_phone_in_header
+        end
+    end
+    def classifide_after
+        if @line_number == @length - 1
+            @classifide_after = @classifides[@line_number]
+        else
+            @classifide_after = @classifides[@line_number + 1]
+        end
+    end
+    def classifide_after_after
+        if @line_number >= @length - 2
+            @classifide_after = @classifides[@line_number]
+        else
+            @classifide_after = @classifides[@line_number + 2]
+        end
+    end
+    def classifide_before
+        @classifide_before = @classifides[@line_number - 1]
+    end
+    def check_obvious_types
+        if !@classifide.institution? and @classifide.type? and !@classifide.date? and !@classifide.city? and !@classifide.profession? and !@classifide.many_words? and @classifide.section?
+            @classifide.type = "section"
+        end
+        if @classifide.many_words? and @classifide.verbs? and @classifide.type? and !@classifide.date?
+            @classifide.type = "bullet"
+        end
+        if !@classifide.institution? and @classifide.type? and !@classifide.date? and !@classifide.city? and !@classifide.profession? and !@classifide.section?
+            @classifide.type = "bullet"
+        end
+        if @classifide.institution? and @classifide.type? and @classifide.date? and @classifide.city? and @classifide.profession?
+            @classifide.type = "header"
+        end
+        if @classifide.type? and ((@classifide.institution? and @classifide.date? and @classifide.city? and @classifide.profession?) or (@classifide.institution? and @classifide.date? and @classifide.city?) or (@classifide.institution? and @classifide.date? and !@classifide.many_words?) or (@classifide.date? and @classifide.city? and @classifide.profession? and !@classifide.many_words?))
+            @classifide.type = "header_x"
+        end
+        if @classifide.type? and @classifide.many_words? and !@classifide.verbs? and (@classifide.profession? or @classifide.city? or @classifide.institution?)
+            @classifide.type = "header_x"
+        end
+    end
+    def first_pass
+        @length.times do |n|
+            set_classifide(n)
+            check_header
+            check_obvious_types
+        end
+    end
+    def second_pass
+        @length.times do |n|
+            set_classifide(n)
+            if !@classifide.institution? and @classifide.type? and !@classifide.date? and !@classifide.city? and !@classifide.profession? and !@classifide.many_words?
+                if (@classifide_after.institution? and @classifide_after.profession?) or (!@classifide_after.institution? and !@classifide_after.profession?)
+                    @classifide.type = "section"
+                end
+            end
+            if (@classifide.institution? or @classifide.profession?) and !@classifide.many_words? and @classifide.type?
+              @classifide.type = "header_x"
+            end
+            if !@classifide.institution? and @classifide.profession? and  @classifide.type?
+              @classifide.type = "header_x"
+            end
+            if @classifide.type? and @classifide.more_words_than?(10)
+              @classifide.type = "bullet"
+            end
+        end
+    end
+    def reset_header_x_start
+        @header_x_start = true
+    end
+    def build_resume
+        reset_header_x_start
+        @length.times do |n|
+            set_classifide(n)
+            unless @classifide.type?
+                unless @classifide.type == "name" or @classifide.type == "email" or @classifide.type == "phone" or @classifide.type == "address"
+                    send(@classifide.type + "_build")
+                end
+            end
+        end
+    end
+    def add_to_all_types(id)
+        if all_types[id].nil?
+            all_types[id] = [@all_type]
+        else
+            all_types[id] += [@all_type]
+        end
+    end
+    def section_build
+        @header_number = nil
+        @header_x_start = true
+        @section_number = @line_number
+        @all_type = @classifide
+        add_section_to_resume
+    end
+    def add_section_to_resume
+        sections.merge!({@line_number => @all_type})
+        add_to_all_types(@line_number)
+    end
+    def add_header_to_resume
+        headers.merge!({@line_number => @header})
+        add_to_all_types(@line_number)
+        add_to_all_types(@section_number)
+    end
+    def add_bullet_to_resume
+        bullets.merge!({@line_number => @bullet})
+        add_to_all_types(@line_number)
+        add_to_all_types(header_number?)
+    end
+    def section_number?
+        if @section_number.nil?
+            @section_number = -1
+        else
+            @section_number
+        end
+    end
+    def previous_section_headers?
+        !headers[@section_number].nil?
+    end
+    def header_build
+        @bullet = nil
+        @header_number = @line_number
+        @header = Header.new(@classifide)
+        @header_x_start = true
+        @all_type = @header
+        add_header_to_resume
+    end
+    def create_blank_classifide
+        @blank_classifide = Classifide.new(id: -1)
+    end
+    def bullet_parent
+        if all_types[header_number?].nil?
+            @all_type = create_blank_classifide
+            add_to_all_types(-1)
+            all_types[-1][0]
+        else
+            all_types[header_number?][0]
+        end
+    end
+    def bullet_build
+        @header_x_start = true
+        @bullet = Bullet.new(@classifide, bullet_parent)
+        @all_type = @bullet
+        add_bullet_to_resume
+    end
+    def header_number?
+        if @header_number.nil?
+            section_number?
+        else
+            @header_number
+        end
+    end
+    def check_for_gaps
+        header_classifications.each do |classification|
+                if @classifide.send(classification).nil?
+                    if !classifide_after_after.send(classification).nil?
+                        @classifide.set_new_value(classification, classifide_after_after.send(classification))
+                    @header_x_start = "almost"
+                    end
+                end
+            end
+    end
+    def combine_text()
+    end
+    def header_x_build
+        @header_number = @line_number
+        if @header_x_start == true
+            if classifide_after.type == "header_x"
+                header_classifications.each do |classification|
+                    if @classifide.send(classification).nil?
+                        @classifide.set_new_value(classification, classifide_after.send(classification))
+                    end
+                end
+                @classifide.set_new_value("text", @classifide.text + ", " + classifide_after.text)
+                if classifide_after_after.type == "header_x"
+                    check_for_gaps
+                    if @header_x_start == 'almost'
+                        @classifide.set_new_value("text", @classifide.text + ", " + classifide_after_after.text)
+                    end
+                    @header_x_start = false unless @header_x_start == "almost"
+                else
+                    @header_x_start = false
+                end
+            end
+            @header = Header.new(@classifide)
+            @all_type = @header
+            add_header_to_resume
+        else
+            if @header_x_start == "almost"
+                @header_x_start == "almost_closer"
+            else
+                @header_x_start = true
+            end
+        end
+    end
+    def resume
+        resume = {sections: sections, headers: headers, bullets: bullets, all_types: all_types}
+    end
+    def sections
+        @sections ||= {}
+    end
+    def headers
+        @headers ||= {}
+    end
+    def bullets
+        @bullets ||= {}
+    end
+    def all_types
+       @all_types ||= {}
+    end
+=begin
+        @length.times do |n|
+            set_classifide(n)
+            if type?
+            #check following types
+                if n < @n - 2 and n > 1
+                    if !many_words? and @p_hash[n+1][:type] == "resume_post"  and @p[:type].nil?
+                        @p[:type] = "resume_group"
+                    end
+                    if @p[:word_length] == false and @p_hash[n+1][:type] == "resume_post_x" and @p_hash[n-1][:type] != "resume_post_x"  and @p[:type].nil?
+                        @p[:type] = "resume_group"
+                    end
+                    if @p[:word_length] == false and @p_hash[n+1][:type] == "resume_line" and /resume_post/.match(@p_hash[n-1][:type]).nil? and @p[:type].nil?
+                        @p[:type] = "resume_group"
+                    end
+                end
+            end
+        end
+    #pass 4
+        (@n -1).times do |n|
+            @p = @p_hash[n]
+            if @p[:type].nil?
+                #check following types
+                if n < @n - 2 and n > 1
+                    if (@p_hash[n+1][:type] == "resume_post" or @p_hash[n+1][:type] == "resume_group") and @p_hash[n-1][:type] == "resume_post"  and @p[:type].nil?
+                        @p[:type] = "resume_line"
+                    end
+                    if @p_hash[n-1][:type] == "resume_post" and @p_hash[n+1][:type] == "resume_line"  and @p[:type].nil?
+                        @p[:type] = "resume_post_x"
+                    end
+                end
+            end
+        end
+=end
+=begin
+        @current_user_2 = current_user
+        #@current_user_2 = User.find(2)
+        @resume_line_shoot = 0
+        @resume_line_build = 0
+        (@n -1).times do |n|
+            @p = @p_hash[n]
+            puts @p[:type]
+            unless /resume/.match(@p[:type]).nil?
+                puts @p[:type]
+                construct_resume_object(args = {n: n, p_hash: @p_hash, resume_group: @resume_group, resume_post: @resume_post, resume_line: @resume_line})
+            end
+        end
+        redirect_to current_user
+=end
+end