RubyGems - linguistics - Versions diffs - 1.0.9 → 2.0.0 - Mend

linguistics 1.0.9 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (69) hide show

data.tar.gz.sig +0 -0
data/.gemtest +0 -0
data/ChangeLog +849 -342
data/History.rdoc +11 -0
data/LICENSE +9 -9
data/Manifest.txt +44 -0
data/README.rdoc +226 -0
data/Rakefile +32 -349
data/examples/endocs.rb +272 -0
data/examples/generalize_sentence.rb +2 -1
data/examples/klingon.rb +22 -0
data/lib/linguistics.rb +130 -292
data/lib/linguistics/en.rb +337 -1628
data/lib/linguistics/en/articles.rb +138 -0
data/lib/linguistics/en/conjugation.rb +2245 -0
data/lib/linguistics/en/conjunctions.rb +202 -0
data/lib/linguistics/en/{infinitive.rb → infinitives.rb} +41 -55
data/lib/linguistics/en/linkparser.rb +41 -49
data/lib/linguistics/en/numbers.rb +483 -0
data/lib/linguistics/en/participles.rb +33 -0
data/lib/linguistics/en/pluralization.rb +810 -0
data/lib/linguistics/en/stemmer.rb +75 -0
data/lib/linguistics/en/titlecase.rb +121 -0
data/lib/linguistics/en/wordnet.rb +63 -97
data/lib/linguistics/inflector.rb +89 -0
data/lib/linguistics/iso639.rb +534 -448
data/lib/linguistics/languagebehavior.rb +36 -0
data/lib/linguistics/monkeypatches.rb +42 -0
data/spec/lib/constants.rb +15 -0
data/spec/lib/helpers.rb +38 -0
data/spec/linguistics/en/articles_spec.rb +797 -0
data/spec/linguistics/en/conjugation_spec.rb +2083 -0
data/spec/linguistics/en/conjunctions_spec.rb +154 -0
data/spec/linguistics/en/infinitives_spec.rb +518 -0
data/spec/linguistics/en/linkparser_spec.rb +66 -0
data/spec/linguistics/en/numbers_spec.rb +1295 -0
data/spec/linguistics/en/participles_spec.rb +55 -0
data/spec/linguistics/en/pluralization_spec.rb +4636 -0
data/spec/linguistics/en/stemmer_spec.rb +72 -0
data/spec/linguistics/en/titlecase_spec.rb +841 -0
data/spec/linguistics/en/wordnet_spec.rb +85 -0
data/spec/linguistics/en_spec.rb +45 -167
data/spec/linguistics/inflector_spec.rb +40 -0
data/spec/linguistics/iso639_spec.rb +49 -53
data/spec/linguistics/monkeypatches_spec.rb +40 -0
data/spec/linguistics_spec.rb +46 -76
metadata +241 -113
metadata.gz.sig +0 -0
data/README +0 -166
data/README.english +0 -245
data/rake/191_compat.rb +0 -26
data/rake/dependencies.rb +0 -76
data/rake/documentation.rb +0 -123
data/rake/helpers.rb +0 -502
data/rake/hg.rb +0 -318
data/rake/manual.rb +0 -787
data/rake/packaging.rb +0 -129
data/rake/publishing.rb +0 -341
data/rake/style.rb +0 -62
data/rake/svn.rb +0 -668
data/rake/testing.rb +0 -152
data/rake/verifytask.rb +0 -64
data/tests/en/infinitive.tests.rb +0 -207
data/tests/en/inflect.tests.rb +0 -1389
data/tests/en/lafcadio.tests.rb +0 -77
data/tests/en/linkparser.tests.rb +0 -42
data/tests/en/lprintf.tests.rb +0 -77
data/tests/en/titlecase.tests.rb +0 -73
data/tests/en/wordnet.tests.rb +0 -95

data/lib/linguistics/en/participles.rb ADDED Viewed

@@ -0,0 +1,33 @@
+#!/usr/bin/ruby
+require 'linguistics/en' unless defined?( Linguistics::EN )
+# Methods for deriving present participles for the English-language
+# Linguistics module.
+module Linguistics::EN::Participles
+	# Register this module to the list of modules to include
+	Linguistics::EN.register_extension( self )
+	### Attempt to return the inflected string in its present participle
+	### form (e.g., talked -> talking).
+	def present_participle
+        plural = self.to_s.en.plural_verb
+		plural.sub!( /ie$/, 'y' ) or
+			plural.sub!( /ue$/, 'u' ) or
+			plural.sub!( /([auy])e$/, '$1' ) or
+			plural.sub!( /i$/, '' ) or
+			plural.sub!( /([^e])e$/, "\\1" ) or
+			/er$/.match( plural ) or
+			plural.sub!( /([^aeiou][aeiouy]([bdgmnprst]))$/, "\\1\\2" )
+        return "#{plural}ing"
+	end
+	alias_method :part_pres, :present_participle
+	Linguistics::EN.register_lprintf_formatter :PART_PRES, :present_participle
+end # module Linguistics::EN::Participles

data/lib/linguistics/en/pluralization.rb ADDED Viewed

@@ -0,0 +1,810 @@
+#!/usr/bin/env ruby
+require 'linguistics/en' unless defined?( Linguistics )
+# Plural inflection methods for the English-language Linguistics module.
+#
+# It provides conversion of plural forms of all nouns, most verbs,
+# and some adjectives. It also provides "classical" variants (for
+# example: "brother" -> "brethren", "dogma" -> "dogmata", etc.) where
+# appropriate.
+module Linguistics::EN::Pluralization
+	# Register this module to the list of modules to include
+	Linguistics::EN.register_extension( self )
+	### Utility function for creating Regexp unions
+	def self::matchgroup( *parts )
+		return Regexp.union( *(parts.flatten) )
+	end
+	private_class_method :matchgroup
+	#
+	# Plurals
+	#
+	PL_sb_irregular_s = {
+		"ephemeris"	=> "ephemerides",
+		"iris"		=> "irises|irides",
+		"clitoris"	=> "clitorises|clitorides",
+		"corpus"	=> "corpuses|corpora",
+		"opus"		=> "opuses|opera",
+		"genus"		=> "genera",
+		"mythos"	=> "mythoi",
+		"penis"		=> "penises|penes",
+		"testis"	=> "testes",
+	}
+	PL_sb_irregular_h = {
+		"child"		=> "children",
+		"brother"	=> "brothers|brethren",
+		"loaf"		=> "loaves",
+		"hoof"		=> "hoofs|hooves",
+		"beef"		=> "beefs|beeves",
+		"money"		=> "monies",
+		"mongoose"	=> "mongooses",
+		"ox"		=> "oxen",
+		"cow"		=> "cows|kine",
+		"soliloquy"	=> "soliloquies",
+		"graffito"	=> "graffiti",
+		"prima donna"	=> "prima donnas|prime donne",
+		"octopus"	=> "octopuses|octopodes",
+		"genie"		=> "genies|genii",
+		"ganglion"	=> "ganglions|ganglia",
+		"trilby"	=> "trilbys",
+		"turf"		=> "turfs|turves",
+	}.update( PL_sb_irregular_s )
+	PL_sb_irregular = matchgroup PL_sb_irregular_h.keys
+	# Classical "..a" -> "..ata"
+	PL_sb_C_a_ata = matchgroup %w[
+		anathema bema carcinoma charisma diploma
+		dogma drama edema enema enigma lemma
+		lymphoma magma melisma miasma oedema
+		sarcoma schema soma stigma stoma trauma
+		gumma pragma
+	].collect {|word| word[0...-1]}
+	# Unconditional "..a" -> "..ae"
+	PL_sb_U_a_ae = matchgroup %w[
+		alumna alga vertebra persona
+	]
+	# Classical "..a" -> "..ae"
+	PL_sb_C_a_ae = matchgroup [/.*umbra/ ] + %w[
+		amoeba antenna formula hyperbola
+		medusa nebula parabola abscissa
+		hydra nova lacuna aurora
+		flora fauna
+	]
+	# Classical "..en" -> "..ina"
+	PL_sb_C_en_ina = matchgroup %w[
+		stamen	foramen	lumen
+	].collect {|word| word[0...-2] }
+	# Unconditional "..um" -> "..a"
+	PL_sb_U_um_a = matchgroup %w[
+		bacterium agendum desideratum erratum
+		stratum datum ovum extremum candelabrum
+	].collect {|word| word[0...-2] }
+	# Classical "..um" -> "..a"
+	# Each word has its final "um" chopped off so that only the stem goes into
+	# the match group. The misspelled entries "enconium" and "millenium" are
+	# kept for backward compatibility next to the correct "encomium" and
+	# "millennium".
+	PL_sb_C_um_a = matchgroup %w[
+		maximum	minimum	momentum	optimum
+		quantum	cranium	curriculum	dictum
+		phylum	aquarium	compendium	emporium
+		encomium	enconium	gymnasium	honorarium
+		interregnum	lustrum 	memorandum	millennium
+		millenium 	rostrum	spectrum	speculum
+		stadium	trapezium	ultimatum	medium
+		vacuum	velum	consortium
+	].collect {|word| word[0...-2]}
+	# Unconditional "..us" -> "i"
+	PL_sb_U_us_i = matchgroup %w[
+		alumnus	alveolus	bacillus	bronchus
+		locus	nucleus	stimulus	meniscus
+	].collect {|word| word[0...-2]}
+	# Classical "..us" -> "..i"
+	PL_sb_C_us_i = matchgroup %w[
+		focus	radius	genius
+		incubus	succubus	nimbus
+		fungus	nucleolus	stylus
+		torus	umbilicus	uterus
+		hippopotamus
+	].collect {|word| word[0...-2]}
+	# Classical "..us" -> "..us"  (assimilated 4th declension latin nouns)
+	PL_sb_C_us_us = matchgroup %w[
+		status apparatus prospectus sinus
+		hiatus impetus plexus
+	]
+	# Unconditional "..on" -> "a"
+	PL_sb_U_on_a = matchgroup %w[
+		criterion	perihelion	aphelion
+		phenomenon	prolegomenon	noumenon
+		organon	asyndeton	hyperbaton
+	].collect {|word| word[0...-2]}
+	# Classical "..on" -> "..a"
+	PL_sb_C_on_a = matchgroup %w[
+		oxymoron
+	].collect {|word| word[0...-2]}
+	# Classical "..o" -> "..i"  (but normally -> "..os")
+	PL_sb_C_o_i_a = %w[
+		solo		soprano	basso	alto
+		contralto	tempo	piano
+	]
+	PL_sb_C_o_i = matchgroup PL_sb_C_o_i_a.collect{|word| word[0...-1]}
+	# Always "..o" -> "..os"
+	PL_sb_U_o_os = matchgroup( %w[
+		albino	archipelago	armadillo
+		commando	crescendo	fiasco
+		ditto	dynamo	embryo
+		ghetto	guano	inferno
+		jumbo	lumbago	magneto
+		manifesto	medico	octavo
+		photo	pro		quarto
+		canto	lingo	generalissimo
+		stylo	rhino
+	] | PL_sb_C_o_i_a )
+	# Unconditional "..[ei]x" -> "..ices"
+	PL_sb_U_ex_ices = matchgroup %w[
+		codex	murex	silex
+	].collect {|word| word[0...-2]}
+	PL_sb_U_ix_ices = matchgroup %w[
+		radix	helix
+	].collect {|word| word[0...-2]}
+	# Classical "..[ei]x" -> "..ices"
+	PL_sb_C_ex_ices = matchgroup %w[
+		vortex	vertex	cortex	latex
+		pontifex	apex		index	simplex
+	].collect {|word| word[0...-2]}
+	PL_sb_C_ix_ices = matchgroup %w[
+		appendix
+	].collect {|word| word[0...-2]}
+	# Arabic: ".." -> "..i"
+	PL_sb_C_i = matchgroup %w[
+		afrit	afreet	efreet
+	]
+	# Hebrew: ".." -> "..im"
+	PL_sb_C_im = matchgroup %w[
+		goy		seraph	cherub
+	]
+	# Unconditional "..man" -> "..mans"
+	PL_sb_U_man_mans = matchgroup %w[
+		human
+		Alabaman Bahaman Burman German
+		Hiroshiman Liman Nakayaman Oklahoman
+		Panaman Selman Sonaman Tacoman Yakiman
+		Yokohaman Yuman
+	]
+	PL_sb_uninflected_s = [
+		# Pairs or groups subsumed to a singular...
+		"breeches", "britches", "clippers", "gallows", "hijinks",
+		"headquarters", "pliers", "scissors", "testes", "herpes",
+		"pincers", "shears", "proceedings", "trousers",
+		# Unassimilated Latin 4th declension
+		"cantus", "coitus", "nexus",
+		# Recent imports...
+		"contretemps", "corps", "debris",
+		/.*ois/,
+		# Diseases
+		/.*measles/, "mumps",
+		# Miscellaneous others...
+		"diabetes", "jackanapes", "series", "species", "rabies",
+		"chassis", "innings", "news", "mews",
+	]
+	# Don't inflect in classical mode, otherwise normal inflection
+	PL_sb_uninflected_herd = matchgroup %w[
+		wildebeest swine eland bison buffalo
+		elk moose rhinoceros
+	]
+	PL_sb_uninflected = matchgroup(
+		# Some fish and herd animals
+		/.*fish/, "tuna", "salmon", "mackerel", "trout",
+		"bream", /sea[- ]bass/, "carp", "cod", "flounder", "whiting",
+		/.*deer/, /.*sheep/,
+		# All nationals ending in -ese
+		"Portuguese", "Amoyese", "Borghese", "Congoese", "Faroese",
+		"Foochowese", "Genevese", "Genoese", "Gilbertese", "Hottentotese",
+		"Kiplingese", "Kongoese", "Lucchese", "Maltese", "Nankingese",
+		"Niasese", "Pekingese", "Piedmontese", "Pistoiese", "Sarawakese",
+		"Shavese", "Vermontese", "Wenchowese", "Yengeese",
+		/.*[nrlm]ese/,
+		# Some words ending in ...s (often pairs taken as a whole)
+		PL_sb_uninflected_s,
+		# Diseases
+		/.*pox/,
+		# Other oddities
+		"graffiti", "djinn"
+	)
+	# Singular words ending in ...s (all inflect with ...es)
+	PL_sb_singular_s = matchgroup [ /.*ss/, /.*us/ ] +
+		%w[
+			acropolis aegis alias arthritis asbestos atlas
+			bathos bias bronchitis bursitis caddis cannabis
+			canvas chaos cosmos dais digitalis encephalitis
+			epidermis ethos eyas gas glottis hepatitis
+			hubris ibis lens mantis marquis metropolis
+			neuritis pathos pelvis polis rhinoceros
+			sassafras tonsillitis trellis
+		]
+	PL_v_special_s = matchgroup [
+		PL_sb_singular_s,
+		PL_sb_uninflected_s,
+		PL_sb_irregular_s.keys,
+		/(.*[csx])is/,
+		/(.*)ceps/,
+		/[A-Z].*s/,
+	]
+	PL_sb_postfix_adj = '(' + {
+		'general' => '(?!major|lieutenant|brigadier|adjutant)\S+',
+		'martial' => "court",
+	}.collect {|key,val|
+		"(?:#{val})(?=(?:-|\\s+)#{key})"
+	}.join("|") + ")(.*)"
+	PL_sb_military = %r'major|lieutenant|brigadier|adjutant|quartermaster'
+	PL_sb_general = %r'((?!#{PL_sb_military.source}).*?)((-|\s+)general)'
+	PL_prep = matchgroup %w[
+		about above across after among around at athwart before behind
+		below beneath beside besides between betwixt beyond but by
+		during except for from in into near of off on onto out over
+		since till to under until unto upon with
+	]
+	PL_sb_prep_dual_compound = %r'(.*?)((?:-|\s+)(?:#{PL_prep}|d[eu])(?:-|\s+))a(?:-|\s+)(.*)'
+	PL_sb_prep_compound = %r'(.*?)((-|\s+)(#{PL_prep}|d[eu])((-|\s+)(.*))?)'
+	PL_pron_nom_h = {
+		#	Nominative		Reflexive
+		"i"		=> "we",	"myself"   =>	"ourselves",
+		"you"	=> "you",	"yourself" =>	"yourselves",
+		"she"	=> "they",	"herself"  =>	"themselves",
+		"he"	=> "they",	"himself"  =>	"themselves",
+		"it"	=> "they",	"itself"   =>	"themselves",
+		"they"	=> "they",	"themself" =>	"themselves",
+		#	Possessive
+		"mine"	 => "ours",
+		"yours"	 => "yours",
+		"hers"	 => "theirs",
+		"his"	 => "theirs",
+		"its"	 => "theirs",
+		"theirs" => "theirs",
+	}
+	PL_pron_nom = Regexp.new( PL_pron_nom_h.keys.join('|'), Regexp::IGNORECASE )
+	PL_pron_acc_h = {
+		#	Accusative		Reflexive
+		"me"	=> "us",	"myself"   =>	"ourselves",
+		"you"	=> "you",	"yourself" =>	"yourselves",
+		"her"	=> "them",	"herself"  =>	"themselves",
+		"him"	=> "them",	"himself"  =>	"themselves",
+		"it"	=> "them",	"itself"   =>	"themselves",
+		"them"	=> "them",	"themself" =>	"themselves",
+	}
+	PL_pron_acc = matchgroup PL_pron_acc_h.keys
+	PL_v_irregular_pres_h = {
+		#	1St pers. sing.		2nd pers. sing.		3rd pers. singular
+		#				3rd pers. (indet.)
+		"am"	=> "are",	"are"	=> "are",	"is"	 => "are",
+		"was"	=> "were",	"were"	=> "were",	"was"	 => "were",
+		"have"  => "have",	"have"  => "have",	"has"	 => "have",
+	}
+	PL_v_irregular_pres = matchgroup PL_v_irregular_pres_h.keys
+	PL_v_ambiguous_pres_h = {
+		#	1st pers. sing.		2nd pers. sing.		3rd pers. singular
+		#				3rd pers. (indet.)
+		"act"	=> "act",	"act"	=> "act",	"acts"	  => "act",
+		"blame"	=> "blame",	"blame"	=> "blame",	"blames"  => "blame",
+		"can"	=> "can",	"can"	=> "can",	"can"	  => "can",
+		"must"	=> "must",	"must"	=> "must",	"must"	  => "must",
+		"fly"	=> "fly",	"fly"	=> "fly",	"flies"	  => "fly",
+		"copy"	=> "copy",	"copy"	=> "copy",	"copies"  => "copy",
+		"drink"	=> "drink",	"drink"	=> "drink",	"drinks"  => "drink",
+		"fight"	=> "fight",	"fight"	=> "fight",	"fights"  => "fight",
+		"fire"	=> "fire",	"fire"	=> "fire",	"fires"   => "fire",
+		"like"	=> "like",	"like"	=> "like",	"likes"   => "like",
+		"look"	=> "look",	"look"	=> "look",	"looks"   => "look",
+		"make"	=> "make",	"make"	=> "make",	"makes"   => "make",
+		"reach"	=> "reach",	"reach"	=> "reach",	"reaches" => "reach",
+		"run"	=> "run",	"run"	=> "run",	"runs"    => "run",
+		"sink"	=> "sink",	"sink"	=> "sink",	"sinks"   => "sink",
+		"sleep"	=> "sleep",	"sleep"	=> "sleep",	"sleeps"  => "sleep",
+		"view"	=> "view",	"view"	=> "view",	"views"   => "view",
+	}
+	PL_v_ambiguous_pres = matchgroup PL_v_ambiguous_pres_h.keys
+	PL_v_irregular_non_pres = matchgroup %w[
+		did had ate made put
+		spent fought sank gave sought
+		shall could ought should
+	]
+	PL_v_ambiguous_non_pres = matchgroup %w[
+		thought saw bent will might cut
+	]
+	PL_count_zero = matchgroup %w[
+		0 no zero nil
+	]
+	PL_count_one = matchgroup %w[
+		1 a an one each every this that
+	]
+	PL_adj_special_h = {
+		"a"    => "some",	"an"   =>  "some",
+		"this" => "these",	"that" => "those",
+	}
+	PL_adj_special = matchgroup PL_adj_special_h.keys
+	PL_adj_poss_h = {
+		"my"    => "our",
+		"your"	=> "your",
+		"its"	=> "their",
+		"her"	=> "their",
+		"his"	=> "their",
+		"their"	=> "their",
+	}
+	PL_adj_poss = matchgroup PL_adj_poss_h.keys
+	#################################################################
+	###	P U B L I C   F U N C T I O N S
+	#################################################################
+	### Return the plural of the given +phrase+ if +count+ indicates it should
+	### be plural.
+	def plural( count=2 )
+		phrase = if self.respond_to?( :to_int )
+				self.numwords
+			else
+				self.to_s
+			end
+		self.log.debug "Pluralizing %p" % [ phrase ]
+		pre = text = post = nil
+		# If the string has whitespace, only pluralize the middle bit, but
+		# preserve the whitespace to add back to the result.
+		if md = /\A(\s*)(.+?)(\s*)\Z/.match( phrase.to_s )
+			pre, text, post = md.captures
+		else
+			return phrase
+		end
+		plural = postprocess( text,
+			pluralize_special_adjective(text, count) ||
+			pluralize_special_verb(text, count) ||
+			pluralize_noun(text, count) )
+		return pre + plural + post
+	end
+	Linguistics::EN.register_lprintf_formatter :PL, :plural
+	### Return the plural of the given noun +phrase+ if +count+ indicates it
+	### should be plural.
+	def plural_noun( count=2 )
+		phrase = self.to_s
+		md = /\A(\s*)(.+?)(\s*)\Z/.match( phrase )
+		pre, word, post = md.captures
+		return phrase if word.nil? or word.empty?
+		plural = postprocess( word, pluralize_noun(word, count) )
+		return pre + plural + post
+	end
+	### Return the plural of the given verb +phrase+ if +count+ indicates it
+	### should be plural.
+	def plural_verb( count=2 )
+		phrase = self.to_s
+		md = /\A(\s*)(.+?)(\s*)\Z/.match( phrase )
+		pre, word, post = md.captures
+		return phrase if word.nil? or word.empty?
+		plural = postprocess( word,
+			pluralize_special_verb(word, count) ||
+			pluralize_general_verb(word, count) )
+		return pre + plural + post
+	end
+	### Return the plural of the given adjectival +phrase+ if +count+ indicates
+	### it should be plural.
+	def plural_adjective( count=2 )
+		phrase = self.to_s
+		md = /\A(\s*)(.+?)(\s*)\Z/.match( phrase )
+		pre, word, post = md.captures
+		return phrase if word.nil? or word.empty?
+		plural = postprocess( word, pluralize_special_adjective(word, count) || word )
+		return pre + plural + post
+	end
+	alias_method :plural_adj, :plural_adjective
+	#################################################################
+	###	P R I V A T E   F U N C T I O N S
+	#################################################################
+	#######
+	private
+	#######
+	### Do normal/classical switching and match capitalization in +inflected+ by
+	### examining the +original+ input.
+	def postprocess( original, inflected )
+		# If there's a classical variant, use it instead of the modern one if
+		# classical mode is on.
+		inflected.sub!( /([^|]+)\|(.+)/ ) do
+			Linguistics::EN.classical? ? $2 : $1
+		end
+		# Try to duplicate the case of the original string
+		case original
+		when "I"
+			return inflected
+		when /^[A-Z]+$/
+			return inflected.upcase
+		when /^[A-Z]/
+			# Can't use #capitalize, as it will downcase the rest of the string,
+			# too.
+			inflected[0,1] = inflected[0,1].upcase
+			return inflected
+		else
+			return inflected
+		end
+	end
+	### Normalize a count to either 1 or 2 (singular or plural)
+	def normalize_count( count, default=2 )
+		return default if count.nil? # Default to plural
+		if /^(#{PL_count_one})$/i =~ count.to_s ||
+		   ( Linguistics::EN.classical? && /^(#{PL_count_zero})$/ =~ count.to_s )
+			return 1
+		else
+			return default
+		end
+	end
+	### Pluralize nouns
+	def pluralize_noun( word, count=2 )
+		self.log.debug "Trying to pluralize %p as a noun" % [ word ]
+		value = nil
+		count = normalize_count( count )
+		return word if count == 1
+		# Handle user-defined nouns
+		#if value = ud_match( word, PL_sb_user_defined )
+		#	return value
+		#end
+		# Handle empty word, singular count and uninflected plurals
+		case word
+		when ''
+			self.log.debug "  empty string"
+			return word
+		when /^(#{PL_sb_uninflected})$/i
+			self.log.debug "  uninflected plural"
+			return word
+		else
+			if Linguistics::EN.classical? && /^(#{PL_sb_uninflected_herd})$/i =~ word
+				self.log.debug "  uninflected classical herd word"
+				return word
+			end
+		end
+		# Handle compounds ("Governor General", "mother-in-law", "aide-de-camp", etc.)
+		case word
+		when /^(?:#{PL_sb_postfix_adj})$/i
+			value = $2
+			noun = $1
+			self.log.debug "  postfixed adjectival compound noun phrase (#{value} -> #{noun})"
+			return pluralize_noun( noun, 2 ) + value
+		when /^(?:#{PL_sb_prep_dual_compound})$/i
+			noun = $1
+			value = [ $2, $3 ]
+			self.log.debug "  prepositional dual compound noun phrase (%s -> %s %s)" %
+				[ noun, *value ]
+			return pluralize_noun( noun, 2 ) + value[0] + pluralize_noun( value[1] )
+		when /^(?:#{PL_sb_prep_compound})$/i
+			noun = $1
+			value = $2
+			self.log.debug "  prepositional singular compound noun phrase (%s -> %s)" %
+				[ noun, value ]
+			return pluralize_noun( noun, 2 ) + value
+		# Handle pronouns
+		when /^((?:#{PL_prep})\s+)(#{PL_pron_acc})$/i
+			prep, pron = $1, $2
+			self.log.debug "  prepositional pronoun phrase (%p + %p)" % [ prep, pron ]
+			return prep + PL_pron_acc_h[ pron.downcase ]
+		when /^(#{PL_pron_nom})$/i
+			pron = $1
+			self.log.debug "  nominative pronoun; using PL_pron_nom table"
+			return PL_pron_nom_h[ word.downcase ]
+		when /^(#{PL_pron_acc})$/i
+			self.log.debug "  accusative pronoun; using PL_pron_acc table"
+			return PL_pron_acc_h[ word.downcase ]
+		# Handle isolated irregular plurals
+		when /(.*)\b(#{PL_sb_irregular})$/i
+			prefix, word = $1, $2
+			self.log.debug "  isolated irregular; using PL_sb_irregular_h table"
+			return prefix + PL_sb_irregular_h[ word.downcase ]
+		# Unconditional ...man -> ...mans
+		when /(#{PL_sb_U_man_mans})$/i
+			word = $1
+			self.log.debug "  unconditional man -> mans (%p)" % [ word ]
+			return "#{word}s"
+		# Handle families of irregular plurals
+		when /(.*)man$/i then                  return "#{$1}men"
+		when /(.*[ml])ouse$/i then             return "#{$1}ice"
+		when /(.*)goose$/i then                return "#{$1}geese"
+		when /(.*)tooth$/i then                return "#{$1}teeth"
+		when /(.*)foot$/i then                 return "#{$1}feet"
+		# Handle unassimilated imports
+		when /(.*)ceps$/i then                 return word
+		when /(.*)zoon$/i then                 return "#{$1}zoa"
+		when /(.*[csx])is$/i then              return "#{$1}es"
+		when /(#{PL_sb_U_ex_ices})ex$/i then   return "#{$1}ices"
+		when /(#{PL_sb_U_ix_ices})ix$/i then   return "#{$1}ices"
+		when /(#{PL_sb_U_um_a})um$/i then      return "#{$1}a"
+		when /(#{PL_sb_U_us_i})us$/i then      return "#{$1}i"
+		when /(#{PL_sb_U_on_a})on$/i then      return "#{$1}a"
+		when /(#{PL_sb_U_a_ae})$/i then        return "#{$1}e"
+		end
+		# Handle incompletely assimilated imports in classical mode
+		if Linguistics::EN.classical?
+			self.log.debug "  checking for classical incompletely assimilated imports"
+			case word
+			when /(.*)trix$/i then               return "#{$1}trices"
+			when /(.*)eau$/i then                return "#{$1}eaux"
+			when /(.*)ieu$/i then                return "#{$1}ieux"
+			when /(.{2,}[yia])nx$/i then         return "#{$1}nges"
+			when /(#{PL_sb_C_en_ina})en$/i then  return "#{$1}ina"
+			when /(#{PL_sb_C_ex_ices})ex$/i then return "#{$1}ices"
+			when /(#{PL_sb_C_ix_ices})ix$/i then return "#{$1}ices"
+			when /(#{PL_sb_C_um_a})um$/i then    return "#{$1}a"
+			when /(#{PL_sb_C_us_i})us$/i then    return "#{$1}i"
+			when /(#{PL_sb_C_us_us})$/i then     return "#{$1}"
+			when /(#{PL_sb_C_a_ae})$/i then      return "#{$1}e"
+			when /(#{PL_sb_C_a_ata})a$/i then    return "#{$1}ata"
+			when /(#{PL_sb_C_o_i})o$/i then      return "#{$1}i"
+			when /(#{PL_sb_C_on_a})on$/i then    return "#{$1}a"
+			when /#{PL_sb_C_im}$/i then          return "#{word}im"
+			when /#{PL_sb_C_i}$/i then           return "#{word}i"
+			end
+		end
+		# Handle singular nouns ending in ...s or other silibants
+		case word
+		when /^(#{PL_sb_singular_s})$/i then    return "#{$1}es"
+		when /^([A-Z].*s)$/ then                return "#{$1}es"
+		when /(.*)([cs]h|[zx])$/i then          return "#{$1}#{$2}es"
+		# when /(.*)(us)$/i then                return "#{$1}#{$2}es"
+		# Handle ...f -> ...ves
+		when /(.*[eao])lf$/i then              return "#{$1}lves"
+		when /(.*[^d])eaf$/i then              return "#{$1}eaves"
+		when /(.*[nlw])ife$/i then             return "#{$1}ives"
+		when /(.*)arf$/i then                  return "#{$1}arves"
+		# Handle ...y
+		when /(.*[aeiou])y$/i then             return "#{$1}ys"
+		when /([A-Z].*y)$/ then                return "#{$1}s"
+		when /(.*)y$/i then                    return "#{$1}ies"
+		# Handle ...o
+		when /#{PL_sb_U_o_os}$/i then          return "#{word}s"
+		when /[aeiou]o$/i then                 return "#{word}s"
+		when /o$/i then                        return "#{word}es"
+		# Otherwise just add ...s
+		else
+			self.log.debug "  appears to be regular; adding +s"
+			return "#{word}s"
+		end
+	end # def pluralize_noun
+	### Pluralize special verbs
+	def pluralize_special_verb( word, count )
+		self.log.debug "Trying to pluralize %p as a special verb..." % [ word ]
+		count ||= 1
+		count = normalize_count( count )
+		if /^(#{PL_count_one})$/i =~ count.to_s
+			self.log.debug "  it's a single-count word, returning it unchanged."
+			return word # :FIXME: should this return nil instead?
+			# return nil
+		end
+		# Handle user-defined verbs
+		#if value = ud_match( word, PL_v_user_defined )
+		#	return value
+		#end
+		case word
+		# Handle irregular present tense (simple and compound)
+		when /^(#{PL_v_irregular_pres})((\s.*)?)$/i
+			key = $1.downcase
+			self.log.debug "  yep, it's an irregular present tense verb (%p)" % [ key ]
+			return PL_v_irregular_pres_h[ $1.downcase ] + $2
+		# Handle irregular future, preterite and perfect tenses
+		when /^(#{PL_v_irregular_non_pres})((\s.*)?)$/i
+			self.log.debug "  yep, it's an irregular non-present tense verb (%p)" % [ key ]
+			return word
+		# Handle special cases
+		when /^(#{PL_v_special_s})$/
+			self.log.debug "  it's a not special-case verb; aborting."
+			return nil
+		# Handle standard 3rd person (chop the ...(e)s off single words)
+		when /^(.*)([cs]h|[x]|zz|ss)es$/i
+			base, suffix = $1, $2
+			self.log.debug "  it's a standard third-person verb (%p + %p)" % [ base, suffix ]
+			return base + suffix
+		when /^(..+)ies$/i
+			verb = $1
+			self.log.debug "  it's a standard third-person verb (%p + ies -> +y)" % [ verb ]
+			return "#{verb}y"
+		when /^(.+)oes$/i
+			verb = $1
+			self.log.debug "  it's a standard third-person verb (%p + oes -> +o)" % [ verb ]
+			return "#{verb}o"
+		when /^(.*[^s])s$/i
+			verb = $1
+			self.log.debug "  it's a standard third-person verb (%p + (^s)s -> -s)" % [ verb ]
+			return verb
+		# Otherwise, a regular verb (handle elsewhere)
+		else
+			self.log.debug "  nope. Either a regular verb or not a verb."
+			return nil
+		end
+	end
+	### Pluralize regular verbs
+	def pluralize_general_verb( word, count )
+		count = normalize_count( count )
+		return word if /^(#{PL_count_one})$/i =~ count.to_s
+		case word
+		# Handle ambiguous present tenses  (simple and compound)
+		when /^(#{PL_v_ambiguous_pres})((\s.*)?)$/i
+			return PL_v_ambiguous_pres_h[ $1.downcase ] + $2
+		# Handle ambiguous preterite and perfect tenses
+		when /^(#{PL_v_ambiguous_non_pres})((\s.*)?)$/i
+			return word
+		# Otherwise, 1st or 2nd person is uninflected
+		else
+			return word
+		end
+	end
+	### Handle special adjectives
+	def pluralize_special_adjective( word, count )
+		self.log.debug "Trying to pluralize %p as a special adjective..." % [ word ]
+		count ||= 1
+		count = normalize_count( count )
+		if /^(#{PL_count_one})$/i =~ count.to_s
+			self.log.debug "  it's a single-count word; aborting"
+			return nil
+		end
+		# Handle user-defined verbs
+		#if value = ud_match( word, PL_adj_user_defined )
+		#	return value
+		#end
+		case word
+		# Handle known cases
+		when /^(#{PL_adj_special})$/i
+			key = $1.downcase
+			self.log.debug "  yep, it's a special plural adjective (%p)" % [ key ]
+			return PL_adj_special_h[ key ]
+		# Handle possessives
+		when /^(#{PL_adj_poss})$/i
+			key = $1.downcase
+			self.log.debug "  it's a special possessive adjective (%p)" % [ key ]
+			return PL_adj_poss_h[ $1.downcase ]
+		when /^(.*)'s?$/
+			pl = $1.en.plural_noun( count )
+			self.log.debug "  it has an apostrophe (%p); using generic possessive rules" % [ pl ]
+			if /s$/ =~ pl
+				return "#{pl}'"
+			else
+				return "#{pl}'s"
+			end
+		# Otherwise, no idea
+		else
+			self.log.debug "  nope."
+			return nil
+		end
+	end
+end # module Linguistics::EN::Pluralization