RubyGems - lyrics - Versions diffs - 0.0.2 - Mend

lyrics 0.0.2

Files changed (50) hide show

data/.document +5 -0
data/.gitignore +21 -0
data/LICENSE +20 -0
data/README.rdoc +17 -0
data/Rakefile +45 -0
data/VERSION +1 -0
data/bin/lyrics +66 -0
data/lib/lyrics.rb +4 -0
data/lib/lyrics/cli/application.rb +99 -0
data/lib/lyrics/cli/optionsparser.rb +228 -0
data/lib/lyrics/cli/pluginadapter.rb +56 -0
data/lib/lyrics/cli/plugins.rb +79 -0
data/lib/lyrics/cli/wikipluginadapter.rb +139 -0
data/lib/lyrics/i18n/README +1 -0
data/lib/lyrics/i18n/en.rb +181 -0
data/lib/lyrics/i18n/es.rb +181 -0
data/lib/lyrics/i18n/i18n.rb +126 -0
data/lib/lyrics/i18n/sk.rb +174 -0
data/lib/lyrics/itrans/COPYRIGHT +31 -0
data/lib/lyrics/itrans/itrans +0 -0
data/lib/lyrics/itrans/itrans.txt +8 -0
data/lib/lyrics/itrans/lyric.txt +23 -0
data/lib/lyrics/itrans/udvng.ifm +206 -0
data/lib/lyrics/lyrics.rb +567 -0
data/lib/lyrics/lyrics_AZLyrics.rb +113 -0
data/lib/lyrics/lyrics_DarkLyrics.rb +124 -0
data/lib/lyrics/lyrics_Giitaayan.rb +124 -0
data/lib/lyrics/lyrics_Jamendo.rb +166 -0
data/lib/lyrics/lyrics_LeosLyrics.rb +142 -0
data/lib/lyrics/lyrics_LoudSongs.rb +135 -0
data/lib/lyrics/lyrics_LyricWiki.rb +328 -0
data/lib/lyrics/lyrics_LyricsDownload.rb +118 -0
data/lib/lyrics/lyrics_LyricsMania.rb +141 -0
data/lib/lyrics/lyrics_Lyriki.rb +286 -0
data/lib/lyrics/lyrics_SeekLyrics.rb +108 -0
data/lib/lyrics/lyrics_Sing365.rb +103 -0
data/lib/lyrics/lyrics_TerraLetras.rb +126 -0
data/lib/lyrics/mediawikilyrics.rb +1417 -0
data/lib/lyrics/utils/formdata.rb +56 -0
data/lib/lyrics/utils/htmlentities.rb +291 -0
data/lib/lyrics/utils/http.rb +198 -0
data/lib/lyrics/utils/itrans.rb +160 -0
data/lib/lyrics/utils/logger.rb +123 -0
data/lib/lyrics/utils/strings.rb +378 -0
data/lib/lyrics/utils/xmlhash.rb +111 -0
data/lyrics.gemspec +98 -0
data/spec/lyrics_spec.rb +7 -0
data/spec/spec.opts +1 -0
data/spec/spec_helper.rb +9 -0
metadata +137 -0

@@ -0,0 +1,160 @@
+# Copyright (C) 2006-2008 by Sergio Pistone
+# sergio_pistone@yahoo.com.ar
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the
+# Free Software Foundation, Inc.,
+# 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+require File.expand_path( File.dirname( __FILE__ ) + "/strings" )
# Conversion helpers between ITRANS romanization and Devanagari text.
#
# ITRANS -> Devanagari is delegated to the +itrans+ executable expected in
# the sibling "itrans" directory; Devanagari -> ITRANS is done in Ruby with
# the lookup tables defined at the bottom of this module.
module ITRANS

	# Directory holding the +itrans+ executable and the udvng.ifm file it loads.
	@@itrans_dir = File.dirname( File.expand_path(__FILE__) ) + "/../itrans"

	# Where the converter's standard error output is discarded.
	@@null_dev = "/dev/null"

	# Returns +text+ converted to Devanagari and back, i.e. rewritten with the
	# romanization produced by ITRANS.from_devanagari!.
	def ITRANS.normalize( text )
		return ITRANS.from_devanagari!( ITRANS.to_devanagari( text ) )
	end

	# In-place variant of ITRANS.to_devanagari. Returns +text+.
	def ITRANS.to_devanagari!( text )
		text.replace( to_devanagari( text ) )
	end

	# Pipes +text+ (wrapped in the #indian / #endindian markers) through the
	# external +itrans+ program and returns its output with '%' comments
	# removed and surrounding whitespace stripped.
	#
	# The program is run from @@itrans_dir. The block form of Dir.chdir is
	# used so the previous working directory is restored even if running the
	# command raises.
	def ITRANS.to_devanagari( text )
		input = "#indianifm=udvng.ifm\n #indian\n#{text}\n#endindian"
		trans = Dir.chdir( @@itrans_dir ) do
			`echo #{Strings.shell_quote( input )} | #{@@itrans_dir}/itrans -U 2>#{@@null_dev}`
		end
		trans.gsub!( /%[^\n]*/, "" ) # TODO search line
		trans.strip!()
		return trans
	end

	# Replaces, in place, the Devanagari characters of +text+ with their ITRANS
	# romanization and returns +text+.
	#
	# Vowels, vowel signs and the irregular conjuncts are substituted first.
	# Consonants are substituted afterwards, appending an 'a' where the
	# consonant stands alone as a word or is not followed by a vowel.
	def ITRANS.from_devanagari!( text )
		@@devanagari2itrans.each() do |devana, itrans|
			text.gsub!( devana, itrans )
		end
		# Keys made of several code points (consonant + nukta) must be handled
		# before the plain consonants, otherwise the base consonant is replaced
		# first and the longer sequence can never match.
		multi, single = @@devanagari2itrans_consonants.partition() do |devana, _itrans|
			devana.unpack( "U*" ).size() > 1
		end
		(multi + single).each() do |devana, itrans|
			# is the only symbol in the 'word' --> add an 'a' at the end:
			text.gsub!( /(^|[ ""\.:;\(\[])#{devana}([,;:?!\)\]\s]|$)/, "\\1#{itrans}a\\2" )
			# is not followed by a vowel --> add an 'a' at the end:
			text.gsub!( /#{devana}([^aeiouAEIOU,;:?!\)\]\s])/, "#{itrans}a\\1" )
			text.gsub!( devana, itrans )
		end
		return text
	end

	# Non-destructive variant of ITRANS.from_devanagari!: works on a copy.
	def ITRANS.from_devanagari( text )
		return ITRANS.from_devanagari!( String.new( text ) )
	end

	# Returns the UTF-8 encoded string for a single Unicode +codepoint+.
	def ITRANS.unicode( codepoint )
		[codepoint].pack( "U*" )
	end

	# Devanagari vowels, vowel signs and irregular conjuncts => ITRANS.
	@@devanagari2itrans = {
		ITRANS.unicode( 0x0901 ) => "",
		# vowels:
		ITRANS.unicode( 0x0905 ) => "a",
		ITRANS.unicode( 0x0906 ) => "aa", # /A
		ITRANS.unicode( 0x093E ) => "aa", # /A
		ITRANS.unicode( 0x0907 ) => "i",
		ITRANS.unicode( 0x093F ) => "i",
		ITRANS.unicode( 0x0908 ) => "ii", # /I
		ITRANS.unicode( 0x0940 ) => "ii", # /I
		ITRANS.unicode( 0x0909 ) => "u",
		ITRANS.unicode( 0x0941 ) => "u",
		ITRANS.unicode( 0x090A ) => "uu", # /U
		ITRANS.unicode( 0x0942 ) => "uu", # /U
		ITRANS.unicode( 0x090B ) => "RRi", # R^i
		ITRANS.unicode( 0x0943 ) => "RRi", # R^i
		ITRANS.unicode( 0x090C ) => "LLi", # L^i
		ITRANS.unicode( 0x0944 ) => "LLi", # L^i
		ITRANS.unicode( 0x090F ) => "e",
		ITRANS.unicode( 0x0947 ) => "e",
		ITRANS.unicode( 0x0910 ) => "ai",
		ITRANS.unicode( 0x0948 ) => "ai",
		ITRANS.unicode( 0x0913 ) => "o",
		ITRANS.unicode( 0x094B ) => "o",
		ITRANS.unicode( 0x0914 ) => "au",
		ITRANS.unicode( 0x094C ) => "au",
		# itrans irregular
		"क्ष"=> "kSh", # x / kS
		"त्र"=> "tr",
		"ज्ञ"=> "j~n", # GY / dny
		"श्र"=> "shr",
	}

	# Devanagari consonants => ITRANS (without the inherent 'a').
	@@devanagari2itrans_consonants = {
		# gutturals:
		ITRANS.unicode( 0x0915 ) => "k",
		ITRANS.unicode( 0x0916 ) => "kh",
#		ITRANS.unicode( 0x0916 ) => ".Nkh",
		ITRANS.unicode( 0x0917 ) => "g",
		ITRANS.unicode( 0x0918 ) => "gh",
		# U+0919 is the velar nasal; it was keyed as 0x0918, which silently
		# replaced the "gh" entry above.
		ITRANS.unicode( 0x0919 ) => "~N",
		# palatals:
		ITRANS.unicode( 0x091A ) => "ch",
		ITRANS.unicode( 0x091B ) => "Ch",
		ITRANS.unicode( 0x091C ) => "j",
		ITRANS.unicode( 0x091D ) => "jh",
		ITRANS.unicode( 0x091E ) => "~n", # JN
		# retroflexes:
		ITRANS.unicode( 0x091F ) => "T",
		ITRANS.unicode( 0x0920 ) => "Th",
		ITRANS.unicode( 0x0921 ) => "D",
		ITRANS.unicode( 0x0922 ) => "Dh",
#		ITRANS.unicode( 0x0922 ) => ".Dh", # Rh (valid?)
		ITRANS.unicode( 0x0923 ) => "N",
		# dentals:
		ITRANS.unicode( 0x0924 ) => "t",
		ITRANS.unicode( 0x0925 ) => "th",
		ITRANS.unicode( 0x0926 ) => "d",
		ITRANS.unicode( 0x0927 ) => "dh",
		ITRANS.unicode( 0x0928 ) => "n",
		# labials:
		ITRANS.unicode( 0x092A ) => "p",
		ITRANS.unicode( 0x092B ) => "ph",
		ITRANS.unicode( 0x092C ) => "b",
		ITRANS.unicode( 0x092D ) => "bh",
		ITRANS.unicode( 0x092E ) => "m",
		# semi-vowels:
		ITRANS.unicode( 0x092F ) => "y",
		ITRANS.unicode( 0x0930 ) => "r",
		ITRANS.unicode( 0x0932 ) => "l",
		ITRANS.unicode( 0x0935 ) => "v", # w
		# sibilants:
		ITRANS.unicode( 0x0936 ) => "sh",
		ITRANS.unicode( 0x0937 ) => "Sh", # shh
		ITRANS.unicode( 0x0938 ) => "s",
		# miscellaneous:
		ITRANS.unicode( 0x0939 ) => "h",
		ITRANS.unicode( 0x0902 ) => ".n", # M / .m
		ITRANS.unicode( 0x0903 ) => "H", # .h
		ITRANS.unicode( 0x0950 ) => "OM", # AUM
		# other consonants:
		"क़" => "q",
		ITRANS.unicode( 0x0958 ) => "q",
		"ख़" => "Kh",
		"ग़" => "G",
		"ज़" => "z",
		ITRANS.unicode( 0x095B ) => "z",
		"फ़" => "f",
		"ड़" => ".D", # R
		ITRANS.unicode( 0x095C ) => ".D", # R (valid?)
		"ढ़" => ".Dh", # Rh
	}

end

data/lib/lyrics/utils/logger.rb ADDED

@@ -0,0 +1,123 @@
+# Copyright (C) 2006-2008 by Sergio Pistone
+# sergio_pistone@yahoo.com.ar
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the
+# Free Software Foundation, Inc.,
+# 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
# Minimal file logger with optional per-line indentation ("tabulation").
#
# Every call opens the log file, appends to it and closes it again, so no
# file handle is kept between calls.
class Logger

	# file_path::         path of the log file.
	# truncate_to_lines:: when >= 0, the existing log is immediately cut down
	#                     to (at most) its last +truncate_to_lines+ lines.
	def initialize( file_path, truncate_to_lines=-1 )
		@file_path = file_path
		@tabulation = nil
		@tabulation_base = "   ".freeze()
		@tabulation_level = 0
		@skip_first_line_tabulation = false
		truncate( truncate_to_lines ) if truncate_to_lines >= 0
	end

	def finalize() # TODO revise implementation
	end

	# Returns the path of the log file.
	def get_file_path()
		return @file_path
	end

	# Switches logging to +file_path+. When the path actually changes, the
	# previous log file is deleted (unless that path is a directory).
	def set_file_path( file_path )
		return if @file_path == file_path
		File.delete( @file_path ) if File.exist?( @file_path ) && ! File.directory?( @file_path )
		@file_path = file_path.clone().freeze()
	end

	# Keeps only the last +max_lines+ lines of the log file. A missing file is
	# created empty; a file that already has +max_lines+ lines or fewer is
	# left untouched.
	def truncate( max_lines )
		begin
			lines = File.open( @file_path, File::RDONLY ) { |file| file.read().split( "\n" ) }
		rescue Errno::ENOENT
			# nothing to truncate yet: just create the (empty) log file
			File.open( @file_path, File::CREAT|File::WRONLY ) { }
			lines = []
		end
		offset = lines.size() - max_lines
		return if offset <= 0
		kept = max_lines > 0 ? lines[offset..-1] : []
		File.open( @file_path, File::CREAT|File::TRUNC|File::WRONLY ) do |file|
			kept.each() do |line|
				file.write( line )
				file.write( "\n" )
			end
		end
		return nil
	end

	# Empties the log file, creating it if needed.
	def reset()
		File.open( @file_path, File::CREAT|File::TRUNC|File::WRONLY ) { }
		return nil
	end

	# Appends +msg+ followed by +new_lines+ line breaks to the log file.
	#
	# While a tabulation is active, every line of +msg+ is prefixed with it.
	# The prefix of the first line is skipped when the previous tabulated call
	# ended without a line break (+new_lines+ <= 0), so the text continues on
	# the same output line.
	def log( msg, new_lines=1 )
		File.open( @file_path, File::CREAT|File::APPEND|File::WRONLY ) do |output|
			if @tabulation
				output.write( @tabulation ) if ! @skip_first_line_tabulation
				output.write( msg.gsub( "\n", "\n#{@tabulation}" ) )
				@skip_first_line_tabulation = new_lines <= 0
			else
				output.write( msg )
			end
			new_lines.times() { output.write( "\n" ) }
		end
		return nil
	end

	# Returns the string that is repeated once per tabulation level.
	def get_tabulation_base()
		return @tabulation_base
	end

	# Sets the string repeated once per tabulation level and rebuilds the
	# current indentation from it.
	def set_tabulation_base( tabulation_base )
		if @tabulation_base != tabulation_base
			@tabulation_base = tabulation_base.clone().freeze()
			rebuild_tabulation()
		end
	end

	# Returns the current tabulation level.
	def get_tabulation_level()
		return @tabulation_level
	end

	# Sets the tabulation level; a level <= 0 disables indentation.
	def set_tabulation_level( level )
		if @tabulation_level != level
			@tabulation_level = level
			rebuild_tabulation()
		end
	end

	# Indents subsequent messages one level deeper.
	def increase_tabulation_level()
		set_tabulation_level( @tabulation_level + 1 )
	end

	# Indents subsequent messages one level less.
	def decrease_tabulation_level()
		set_tabulation_level( @tabulation_level - 1 )
	end

	private

	# Recomputes the indentation prefix from the current base and level.
	def rebuild_tabulation()
		@tabulation = @tabulation_level > 0 ? @tabulation_base * @tabulation_level : nil
	end

end

data/lib/lyrics/utils/strings.rb ADDED

@@ -0,0 +1,378 @@
+# Copyright (C) 2006-2008 by Sergio Pistone
+# sergio_pistone@yahoo.com.ar
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the
+# Free Software Foundation, Inc.,
+# 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+require File.expand_path( File.dirname( __FILE__ ) + "/htmlentities" )
+require "cgi"
+$KCODE="u" # unicode support
# Assorted string helpers: shell/SQL quoting, case conversion that also
# handles Latin-1 accented letters, title casing, token normalization and
# lyrics/artist/title cleanup.
module Strings

	# Characters that end a word for Strings.titlecase.
	@@word_separators = " \t\n()[],.;:-¿?¡!\"/\\"

	# Characters Strings.capitalize may pick as the one to upcase.
	@@capitalizable_chars = "0-9a-zA-Zàáâãäåæçèéêëìíîïðñòóôõö×øùúûüýþÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞ"
	@@first_capitalizable = /([#{@@capitalizable_chars}])/
	@@leading_capitalizable = /^([#{@@capitalizable_chars}])/

	# Trailing "feat. Somebody" / "(ft. Somebody)" style credit.
	@@featuring_suffix = /[ \(\[](ft\.|ft |feat\.|feat |featuring ) *([^\)\]]+)[\)\]]? *$/i

	# Quote look-alikes normalized by Strings.cleanup_lyrics.
	# NOTE(review): the patterns as received ended in empty alternatives,
	# which would match the empty string. They are assumed to have been the
	# C1 control characters U+0091..U+0094 (Windows-1252 curly quotes read as
	# Latin-1) and are spelled as explicit code points here -- confirm.
	@@single_quote_variants = Regexp.union(
		"`", "´", "’", "‘", [0x91].pack( "U*" ), [0x92].pack( "U*" )
	)
	@@double_quote_variants = Regexp.union(
		"''", "&quot;", "«", "»", "„", "“", "”", [0x93].pack( "U*" ), [0x94].pack( "U*" )
	)

	# Accented vowels and the plain vowel each group is replaced with.
	@@vocal_accents = [
		[/á|à|ä|â|å|ã/, "a"], [/Á|À|Ä|Â|Å|Ã/, "A"],
		[/é|è|ë|ê/, "e"], [/É|È|Ë|Ê/, "E"],
		[/í|ì|ï|î/, "i"], [/Í|Ì|Ï|Î/, "I"],
		[/ó|ò|ö|ô/, "o"], [/Ó|Ò|Ö|Ô/, "O"],
		[/ú|ù|ü|û/, "u"], [/Ú|Ù|Ü|Û/, "U"],
	]

	# True when +text+ (converted with to_s) is empty or only whitespace.
	def Strings.empty?( text )
		return text.to_s().strip().empty?()
	end

	# Wraps +text+ in double quotes for use in a shell command line, escaping
	# backslashes, double quotes, backticks and dollar signs (all of which are
	# still interpreted by the shell inside double quotes).
	def Strings.shell_quote( text )
		return "\"" + text.gsub( /[\\"`\$]/ ) { |c| "\\" + c } + "\""
	end

	# Reverses Strings.shell_quote. Text that does not start with a double
	# quote is assumed to be single quoted: only its delimiters are removed.
	def Strings.shell_unquote( text )
		inner = text.slice( 1..-2 )
		return inner if text.slice( 0, 1 ) != "\""
		# single pass, so that an escaped backslash is never re-read as the
		# start of another escape sequence
		return inner.gsub( /\\([\\"`\$])/ ) { $1 }
	end

	# Backslash-escapes backslashes, both kinds of quotes, backticks and
	# spaces so +text+ can be used unquoted as one shell word.
	# NOTE(review): other shell metacharacters ($, &, ;, |, ...) are not
	# escaped -- do not use with untrusted input.
	def Strings.shell_escape( text )
		return text.gsub( /[\\"`' ]/ ) { |c| "\\" + c }
	end

	# Removes the backslash in front of spaces, quotes and backticks.
	def Strings.shell_unescape( text )
		return text.gsub( "\\ ", " " ).gsub( "\\'", "'" ).gsub( "\\`", "`" ).gsub( "\\\"", "\"" )
	end

	# Returns +text+ as an SQL string literal (single quoted, quotes doubled).
	def Strings.sql_quote( text )
		return "'" + Strings.sql_escape( text ) + "'"
	end

	# Reverses Strings.sql_quote.
	def Strings.sql_unquote( text )
		return Strings.sql_unescape( text.slice( 1..-2 ) )
	end

	# Doubles every single quote in +text+.
	def Strings.sql_escape( text )
		return text.gsub( "'", "''" )
	end

	# Collapses doubled single quotes in +text+.
	def Strings.sql_unescape( text )
		return text.gsub( "''", "'" )
	end

	# Returns a random token of +length+ characters taken from a-z and 0-9.
	def Strings.random_token( length=10 )
		chars = ( "a".."z" ).to_a() + ( "0".."9" ).to_a()
		token = ""
		# rand( n ) already excludes n; the former rand( size - 1 ) could
		# never produce the last character
		length.times() { token << chars[rand( chars.size() )] }
		return token
	end

	# Returns a copy of +filename+ without the characters * ? : | / \ < >.
	def Strings.remove_invalid_filename_chars( filename )
		return Strings.remove_invalid_filename_chars!( String.new( filename ) )
	end

	# In-place variant of Strings.remove_invalid_filename_chars.
	def Strings.remove_invalid_filename_chars!( filename )
		# a regexp is used instead of String#tr_s!, whose character set
		# syntax treats the backslash as an escape and so never removed it
		filename.gsub!( /[*?:|\/\\<>]/, "" )
		return filename
	end

	# Returns a copy of +text+ with accented vowels replaced by plain ones.
	def Strings.remove_vocal_accents( text )
		return Strings.remove_vocal_accents!( String.new( text ) )
	end

	# In-place variant of Strings.remove_vocal_accents.
	def Strings.remove_vocal_accents!( text )
		@@vocal_accents.each() { |accented, plain| text.gsub!( accented, plain ) }
		return text
	end

	# Returns +text+ as a quoted search phrase: double quotes are removed, a
	# leading article "the" is dropped and the rest is wrapped in double
	# quotes. Returns "" when nothing is left.
	def Strings.google_search_quote( text )
		text = text.gsub( "\"", "" )
		# \b keeps words that merely start with "the" (e.g. "Theory") intact
		text.gsub!( /^\ *the\b\ */i, "" )
		return Strings.empty?( text ) ? "" : "\"#{text}\""
	end

	# Builds the "I'm feeling lucky" search URL for +query+, optionally
	# restricted to +site+.
	def Strings.build_google_feeling_lucky_url( query, site=nil )
		url = "http://www.google.com/search?q=#{CGI.escape( query )}"
		url += "+site%3A#{site}" if site
		return url + "&btnI"
	end

	# Lowercases ASCII and Latin-1 letters of the UTF-8 string +text+. Falls
	# back to String#downcase when +text+ cannot be decoded as UTF-8.
	def Strings.downcase( text )
		begin
			codes = text.to_s().unpack( "U*" ).collect() do |c|
				if c >= 65 && c <= 90 # ABCDEFGHIJKLMNOPQRSTUVWXYZ
					c + 32
				elsif c >= 192 && c <= 222 && c != 215 # ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞ (215 is the × sign)
					c + 32
				else
					c
				end
			end
			return codes.pack( "U*" )
		rescue StandardError # fallback to normal operation on error
			return text.to_s().downcase()
		end
	end

	# In-place variant of Strings.downcase.
	def Strings.downcase!( text )
		return text.replace( Strings.downcase( text ) )
	end

	# Uppercases ASCII and Latin-1 letters of the UTF-8 string +text+. Falls
	# back to String#upcase when +text+ cannot be decoded as UTF-8.
	def Strings.upcase( text )
		begin
			codes = text.to_s().unpack( "U*" ).collect() do |c|
				if c >= 97 && c <= 122 # abcdefghijklmnopqrstuvwxyz
					c - 32
				elsif c >= 224 && c <= 254 && c != 247 # àáâãäåæçèéêëìíîïðñòóôõöøùúûüýþ (247 is the ÷ sign)
					c - 32
				else
					c
				end
			end
			return codes.pack( "U*" )
		rescue StandardError # fallback to normal operation on error
			return text.to_s().upcase()
		end
	end

	# In-place variant of Strings.upcase.
	def Strings.upcase!( text )
		return text.replace( Strings.upcase( text ) )
	end

	# Returns a copy of +text+ with one character upcased.
	#
	# downcase::   lowercase the whole text first.
	# first_only:: only upcase when the very first character of a line is a
	#              letter or digit; otherwise the first letter or digit found
	#              anywhere in the text is the one upcased.
	def Strings.capitalize( text, downcase=false, first_only=false )
		# always work on a copy: to_s returns the receiver itself for strings,
		# which made this non-bang method modify the caller's object
		text = downcase ? Strings.downcase( text ) : String.new( text.to_s() )
		pattern = first_only ? @@leading_capitalizable : @@first_capitalizable
		text.sub!( pattern ) { |c| Strings.upcase( c ) }
		return text
	end

	# In-place variant of Strings.capitalize.
	def Strings.capitalize!( text, downcase=false, first_only=false )
		return text.replace( Strings.capitalize( text, downcase, first_only ) )
	end

	# Returns +text+ with the first character of every word upcased.
	#
	# correct_case:: put articles, conjunctions and short prepositions that
	#                follow a space back in lowercase.
	# downcase::     lowercase the whole text first.
	def Strings.titlecase( text, correct_case=true, downcase=false )
		text = Strings.capitalize( text, downcase )
		word_start = true
		codes = text.unpack( "U*" ).collect() do |c|
			# always build a UTF-8 string: Integer#chr returns a binary string
			# for 128..255, which cannot be compared with the separators
			chr = [c].pack( "U*" )
			if @@word_separators.include?( chr )
				word_start = true
			elsif word_start
				word_start = false
				c = Strings.upcase( chr ).unpack( "U*" )[0]
			end
			c
		end
		text = codes.pack( "U*" )
		if correct_case
			lc_words = [
				"the", "a", "an", # articles
				"and", "but", "or", "nor", # conjunctions
				"'n'", "'n", "n'", # and contractions
				"as", "at", "by", "for", "in", "of", "on", "to", # short prepositions
				#"from", "into", "onto", "with", "over" # not so short prepositions
				"feat", "vs", # special words
			]
			lc_words.each() do |lc_word|
				# "-" is escaped: unescaped, ".-?" was a range covering digits
				text.gsub!( /\ #{lc_word}([ ,;:\.\-?!\"\/\\\)])/i, " #{lc_word}\\1" )
			end
		end
		return text
	end

	# In-place variant of Strings.titlecase.
	def Strings.titlecase!( text, correct_case=true, downcase=false )
		return text.replace( Strings.titlecase( text, correct_case, downcase ) )
	end

	# Returns a simplified, lowercase form of +token+ suited for comparisons:
	# punctuation and whitespace runs become single spaces, quote variants are
	# unified, "&", "+" and "'n'" become "and", and a leading "the " or
	# trailing ", the" is dropped.
	def Strings.normalize( token )
		token = Strings.downcase( token )
		token.tr_s!( " \n\r\t.;:()[]", " " )
		token.strip!()
		token.gsub!( /`|´|’/, "'" )
		token.gsub!( /''|«|»/, "\"" )
		token.gsub!( /[&+]/, "and" )
		token.gsub!( /\ ('n'|'n|n') /, " and " )
		token.gsub!( /^the /, "" )
		token.gsub!( /, the$/, "" )
		return token
	end

	# In-place variant of Strings.normalize.
	def Strings.normalize!( token )
		return token.replace( Strings.normalize( token ) )
	end

	# Decodes HTML entities in place: directly for a String, on every value
	# for a Hash. Other objects are returned untouched.
	def Strings.decode_htmlentities!( var )
		if var.is_a?( String )
			HTMLEntities.decode!( var )
		elsif var.is_a?( Hash )
			var.each() { |_key, value| decode_htmlentities!( value ) }
		end
		return var
	end

	# Non-destructive variant of Strings.decode_htmlentities!: returns a
	# decoded String or a new Hash with decoded values.
	def Strings.decode_htmlentities( var )
		if var.is_a?( String )
			return HTMLEntities.decode( var )
		elsif var.is_a?( Hash )
			ret = {}
			var.each() do |key, value|
				ret[key] = decode_htmlentities( value )
			end
			return ret
		else
			return var
		end
	end

	# Returns a tidied copy of +lyrics+: HTML entities decoded, quotes and
	# ellipses unified, spacing around punctuation fixed, each line
	# capitalized and runs of blank lines collapsed into one.
	def Strings.cleanup_lyrics( lyrics )
		lyrics = HTMLEntities.decode( lyrics )
		lines = []
		lyrics.split( /\r\n|\n|\r/ ).each() do |line|
			# remove unnecessary spaces
			line.tr_s!( "\t ", " " )
			line.strip!()
			# quotes and double quotes
			line.gsub!( @@single_quote_variants, "'" )
			line.gsub!( @@double_quote_variants, "\"" )
			# suspensive points
			line.gsub!( /…+/, "..." )
			line.gsub!( /[,;]?\.{2,}/, "..." )
			# add space after "?", "!", ",", ";", ":", ".", ")" and "]" if not present
			line.gsub!( /([^\.]?[\?!,;:\.\)\]])([^ "'<])/, "\\1 \\2" )
			# remove spaces after "¿", "¡", "(" and "["
			line.gsub!( /([¿¡\(\[]) /, "\\1" )
			# remove spaces before "?", "!", ",", ";", ":", ".", ")" and "]"
			line.gsub!( /\ ([\?!,;:\.\)\]])/, "\\1" )
			# remove space after ... at the beginning of sentence
			line.gsub!( /^\.\.\. /, "..." )
			# remove single points at end of sentence
			line.gsub!( /([^\.])\.$/, "\\1" )
			# remove commas and semicolons at end of sentence
			line.gsub!( /[,;]$/, "" )
			# fix english I pronoun capitalization
			line.gsub!( /([ "'\(\[])i([\ '",;:\.\?!\]\)]|$)/, "\\1I\\2" )
			# remove the space after an opening or before a closing quote
			line.sub!( /^(["']) /, "\\1" )
			line.sub!( /\ (["'])$/, "\\1" )
			# capitalize first alphabetic character of the line
			Strings.capitalize!( line )
			# no more than one empty line at a time (and none at the start)
			next if line.empty?() && ( lines.empty?() || lines.last().empty?() )
			lines << line
		end
		lines.pop() if ! lines.empty?() && lines.last().empty?()
		return lines.join( "\n" )
	end

	# In-place variant of Strings.cleanup_lyrics.
	def Strings.cleanup_lyrics!( lyrics )
		return lyrics.replace( Strings.cleanup_lyrics( lyrics ) )
	end

	# Returns the stripped +artist+ with a normalized " feat. X" credit. The
	# credit is taken from the end of +title+ when present there, otherwise a
	# credit already at the end of +artist+ is rewritten. An empty artist is
	# returned as is.
	def Strings.cleanup_artist( artist, title )
		artist = artist.strip()
		if artist != ""
			if (md = @@featuring_suffix.match( title.to_s() ))
				artist << " feat. " << md[2]
			else
				artist.gsub!( @@featuring_suffix, " feat. \\2" )
			end
		end
		return artist
	end

	# Returns +title+ without a trailing "feat. X" credit and stripped.
	def Strings.cleanup_title( title )
		title = title.gsub( @@featuring_suffix, "" )
		title.strip!()
		return title
	end

	# Re-encodes the UTF-8 string +text+ with one byte per code point. On
	# failure a warning is written to $stderr and +text+ is returned as is.
	def Strings.utf82latin1( text )
		begin
			return text.unpack( "U*" ).pack( "C*" )
		rescue StandardError
			$stderr << "warning: conversion from UTF-8 to Latin1 failed\n"
			return text
		end
	end

	# Re-encodes +text+, read one byte per character, as UTF-8. On failure a
	# warning is written to $stderr and +text+ is returned as is.
	def Strings.latin12utf8( text )
		begin
			return text.unpack( "C*" ).pack( "U*" )
		rescue StandardError
			$stderr << "warning: conversion from Latin1 to UTF-8 failed\n"
			return text
		end
	end

	# Obfuscates +text+ (this is not encryption). Two rounds of: reverse the
	# code points, add position + 1 to each, join them with ":".
	def Strings.scramble( text )
		text = text.to_s()
		2.times() do
			chars = text.unpack( "U*" ).reverse()
			chars.size().times() { |idx| chars[idx] = (chars[idx] + idx + 1) }
			text = chars.collect() { |c| c.to_s() }.join( ":" )
		end
		return text
	end

	# In-place variant of Strings.scramble.
	def Strings.scramble!( text )
		return text.replace( Strings.scramble( text ) )
	end

	# Reverses Strings.scramble.
	def Strings.descramble( text )
		text = text.to_s()
		2.times() do
			chars = text.split( ":" ).collect() { |c| c.to_i() }
			chars.size().times() { |idx| chars[idx] = (chars[idx] - idx - 1) }
			text = chars.reverse().pack( "U*" )
		end
		return text
	end

	# In-place variant of Strings.descramble.
	def Strings.descramble!( text )
		return text.replace( Strings.descramble( text ) )
	end

end