RubyGems - lbp - Versions diffs - 0.0.2 → 0.1.0 - Mend

lbp 0.0.2 → 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (34)

checksums.yaml +4 -4
data/.gitignore +4 -0
data/.ruby-gemset +1 -1
data/.ruby-version +1 -1
data/bin/lbp +33 -2
data/lbp.gemspec +3 -4
data/lib/lbp.rb +15 -5
data/lib/lbp/expression.rb +163 -0
data/lib/lbp/file.rb +173 -0
data/lib/lbp/file_part.rb +120 -0
data/lib/lbp/functions.rb +11 -2
data/lib/lbp/manifestation.rb +36 -0
data/lib/lbp/paragraph_image.rb +39 -0
data/lib/lbp/query.rb +181 -0
data/lib/lbp/resource.rb +72 -0
data/lib/lbp/transcription.rb +27 -243
data/lib/lbp/version.rb +1 -1
data/spec/config_globals.rb +28 -13
data/spec/expression_spec.rb +96 -0
data/spec/file_part_spec.rb +55 -0
data/spec/file_spec.rb +130 -0
data/spec/paragraph_image_spec.rb +46 -0
data/spec/query_spec.rb +27 -0
data/spec/resource_spec.rb +78 -0
data/spec/transcription_spec.rb +21 -111
metadata +40 -19
data/lib/lbp/collection.rb +0 -131
data/lib/lbp/item.rb +0 -153
data/lib/lbp/item_group.rb +0 -52
data/lib/lbp/paragraph.rb +0 -87
data/spec/collection_spec.rb +0 -60
data/spec/item_group_spec.rb +0 -39
data/spec/item_spec.rb +0 -74
data/spec/paragraph_spec.rb +0 -37

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: d49f877ac5360958e5c62b4701c97b2a897112be
-  data.tar.gz: 3fc110f62a9545f20785e8b8b01d609c7ab12e68
+  metadata.gz: be83290049ce0d3c203adf4e3ff2139a709ab72c
+  data.tar.gz: cfdfe9478a8f86ddd3e381c391cfc97142241f45
 SHA512:
-  metadata.gz: 4113fffbc328ab020d952eb88dfaf2ebe01bd12abdc929473052f3b2d307b606f00536702b87c45a68b2d1f36c98df5c5c20d268cd5bb54178079b2ba23f740a
-  data.tar.gz: d2d3535865aaf51cfd8abd3af442bc2d6b830a2f2c97419ad5416c6ed1fe0e9acd4ae10be71140197eed348cd00f30d956b6a4f18177ec89ea7d2abcc44010f8
+  metadata.gz: cc21ee397365f89a2194178c533d36fe42d91bebf472561234002a8a9e9e84ca3b61553daa12baf4a5aad9f55f78edbaadf5950e1ffd58cae52e8b1a253d6fe9
+  data.tar.gz: 0eb62da1320ecb9377ff83a5ce4fa3369117fa510af19c5160580823dcf0e00940b8f39750c5d2eddbddf28c9b9dd377143fad7e6ed2b31a9946f9b507b3ad31

data/.gitignore CHANGED

@@ -12,4 +12,8 @@
 *.o
 *.a
 mkmf.log
+/projectfiles/
+/pp-projectfiles/
+/pg-projectfiles/
+/aw-projectfiles/

data/.ruby-gemset CHANGED

@@ -1 +1 @@
-lbp
+default

data/.ruby-version CHANGED

@@ -1 +1 @@
-ruby-2.2.0
+ruby-2.2.1

data/bin/lbp CHANGED

@@ -65,7 +65,7 @@ class LbpCli < Thor
     itemarray << headerdata
-    data.query(:predicate => RDF::DC.hasPart).each do |part|
+    data.query(:predicate => RDF::URI.new("http://scta.info/property/hasItem")).each do |part|
       newresource = RDF::Resource.new(part.object)
       newgraph = RDF::Graph.load(newresource)
@@ -78,13 +78,44 @@ class LbpCli < Thor
       unless status == 'Not Started'
         title = newdata.query(:predicate => RDF::DC11.title).first.object
+        if newdata.query(:predicate => RDF::URI.new("http://scta.info/property/questionTitle")).count == 0
+          question_title = "unknown"
+        else
+          question_title = newdata.query(:predicate => RDF::URI.new("http://scta.info/property/questionTitle")).first.object
+        end
         id = URI(part.object.to_s).path.split('/').last
         itemunit = "
         <item live='#{status}'>
           <fileName filestem='#{id}'>#{id}.xml</fileName>
           <title>#{title}</title>
-        </item>\n"
+          <questionTitle>#{question_title}</questionTitle>"
         itemarray << itemunit
+        #eventually hasPart property should be sctap:hasTranscription
+          hastranscriptions = newdata.query(:predicate => RDF::DC.hasPart)
+          if hastranscriptions.count > 0
+            partunitopen = "\n<hasParts>"
+            itemarray << partunitopen
+            hastranscriptions.each do |transcription|
+              transcription_resource = RDF::Resource.new(transcription.object)
+              transcription_graph = RDF::Graph.load(transcription_resource)
+              transcription_data = transcription_graph.data
+              transcription_title = transcription_data.query(:predicate => RDF::DC11.title).first.object
+              transcription_id = URI(transcription.object.to_s).path.split('/').last
+              transcription_slug = transcription_id.split("_").first
+              transcription_initial = transcription_slug.each_char.first.upcase # not ideal, some initials will be two letters
+              partunit = "\n<part>
+                <slug>#{transcription_slug}</slug>
+                <title>#{transcription_title}</title>
+                <initial>#{transcription_initial}</initial>
+              </part>"
+              itemarray << partunit
+            end
+            partunitclose = "\n</hasParts>"
+            itemarray << partunitclose
+          end
+         #end
+        close_item_unit = "\n</item>\n"
+        itemarray << close_item_unit
       end
     end

data/lbp.gemspec CHANGED

@@ -23,14 +23,13 @@ Gem::Specification.new do |spec|
   spec.add_development_dependency "rspec"
   spec.add_development_dependency "pry"
   spec.add_runtime_dependency "nokogiri"
-  spec.add_runtime_dependency "rugged"
+  #spec.add_runtime_dependency "rugged"
   spec.add_runtime_dependency "thor"
   spec.add_runtime_dependency "rdf"
   spec.add_runtime_dependency "rdf-rdfxml"
+  spec.add_runtime_dependency "rdf-vocab"
   spec.add_runtime_dependency "rest-client"
+  spec.add_runtime_dependency "sparql"
 end

data/lib/lbp.rb CHANGED

@@ -1,11 +1,21 @@
 require "lbp/version"
+  require 'lbp/functions'
+#still need review
+  require 'lbp/query'
+  require 'lbp/paragraph_image'
-	require 'lbp/functions'
-  require 'lbp/item'
-  require 'lbp/paragraph'
+#new files
+  require 'lbp/resource'
+  require 'lbp/expression'
+  require 'lbp/manifestation'
   require 'lbp/transcription'
-	require 'lbp/item_group'
-  require 'lbp/collection'
+  require 'lbp/file'
+  require 'lbp/file_part'

data/lib/lbp/expression.rb ADDED

@@ -0,0 +1,163 @@
+require 'openssl'
+require 'rdf'
+require 'rdf/rdfxml'
+require 'rdf/ntriples'
+require 'rdf/vocab'
+require 'lbp'
+module Lbp
+	class Expression < Resource
+		#inherits initialization from Resource
+		def manifestationUrls
+			results = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/hasManifestation"))
+			manifestations = results.map {|m| m[:o].to_s}
+			return manifestations
+		end
+		def canonicalManifestationUrl
+			manifestation = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/hasCanonicalManifestation")).first[:o].to_s
+			return manifestation
+		end
+		def canonicalManifestation
+			url = self.canonicalManifestationUrl
+			manifestationObj = Manifestation.new(url)
+			return manifestationObj
+		end
+		def canonicalManifestation?
+			if self.canonicalManifestationUrl == nil
+				return false
+			else
+				return true
+			end
+		end
+		# cannonical transcriptions refers to the canonical trancription
+		# of the canonical manifestation
+		def canonicalTranscriptionUrl
+			manifestationObj = self.canonicalManifestation
+			url = manifestationObj.canonicalTranscriptionUrl
+			return url
+		end
+		def canonicalTranscription
+			url = self.canonicalTranscriptionUrl
+			transcriptionObj = Transcription.new(url)
+			return transcriptionObj
+		end
+		def canonicalTranscription?
+			if self.canonicalManifestation? == false
+				return false
+			else
+				if self.canonicalTranscriptionUrl == nil
+					return false
+				else
+					return true
+				end
+			end
+		end
+		def transcriptionUrl(manifestationUrl)
+			manifestationObj = Manifestation.new(manifestationUrl)
+			transcriptionObj = manifestationObj.canonicalTranscriptionUrl
+			return transcriptionObj
+		end
+		def transcription(manifestationUrl)
+			manifestationObj = Manifestation.new(manifestationUrl)
+			transcriptionObj = manifestationObj.canonicalTranscription
+			return transcriptionObj
+		end
+		def next
+			unless self.results.dup.filter(:p => RDF::URI("http://scta.info/property/next")).count == 0
+				next_expression = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/next")).first[:o].to_s
+			else
+				next_expression = nil
+			end
+			return next_expression
+		end
+		def previous
+			unless self.results.dup.filter(:p => RDF::URI("http://scta.info/property/previous")).count == 0
+				previous_expression = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/previous")).first[:o].to_s
+			else
+				previous_expression = nil
+			end
+			return previous_expression
+		end
+		def order_number
+			## TODO: consider changing property so that there is more symmetry here
+			if self.structureType_shortId == "structureBlock"
+				ordernumber = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/paragraphNumber")).first[:o].to_s.to_i
+			else
+				ordernumber = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/totalOrderNumber")).first[:o].to_s.to_i
+			end
+			return ordernumber
+		end
+		def status
+			status = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/status")).first[:o].to_s
+		end
+		def top_level_expression_url
+			#TODO make sure this can handle different structure types
+			status = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/isPartOfTopLevelExpression")).first[:o].to_s
+		end
+		def top_level_expression_shortId
+			self.top_level_expression_url.split("/").last
+		end
+		def top_level_expression
+			expression = Expression.new(self.top_level_expression_url)
+		end
+		def item_level_expression_url
+			#TODO make sure this can handle different structure types
+			status = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/isPartOfStructureItem")).first[:o].to_s
+		end
+		def item_level_expression_shortId
+			self.item_level_expression_url.split("/").last
+		end
+		def item_level_expression
+			expression = Expression.new(self.item_level_expression_url)
+		end
+		def level
+			result = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/level")).first[:o]
+			unless self.results.count == 0
+				level = result.to_s.to_i
+			else
+				level = nil
+			end
+			return level
+		end
+		# connection properties
+		#TODO: notice how all these return RDF::Solutions (or some RDF:: object)
+		# rather already performing the conversion to strings as is done in all the above methods
+		# this should be standardized
+		def abbreviates
+    	abbreviates = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/abbreviates"))
+    end
+    def abbreviatedBy
+    	abbreviatedBy = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/abbreviatedBy"))
+    end
+    def references
+    	references = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/references"))
+    end
+    def referencedBy
+    	references = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/referencedBy"))
+    end
+    def copies
+    	copies = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/copies"))
+    end
+    def copiedBy
+    	copies = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/copiedBy"))
+    end
+    def mentions
+    	mentions = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/mentions"))
+    end
+    def quotes
+    	quotes = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/quotes"))
+    end
+    def quotedBy
+    	quotedBy = self.results.dup.filter(:p => RDF::URI("http://scta.info/property/quotedBy"))
+    end
+	end
+end

data/lib/lbp/file.rb ADDED

@@ -0,0 +1,173 @@
+require 'nokogiri'
+#require 'lbp/functions'
+#require 'lbp/item'
+require 'open-uri'
+require 'lbp'
+module Lbp
+	# class should be renamed to Transcription
+	class File
+		attr_reader :xslt_dir, :file_path
+		def initialize(filepath, transcription_type, confighash)
+			@file_path = filepath
+			@confighash = confighash
+			@xslthash = @confighash[:xslt_dirs]
+		  @type = transcription_type # critical or documentary
+		  #xslt version needs to gathered from a method
+		  xslt_version = nil
+		  #for now its being set to nil because no documents currently declare it
+	    if xslt_version == nil
+	    	@schema = @xslthash["default"]
+	   	else
+	    	@schema = @xslthash[xslt_version]
+	    end
+	    if @type == 'critical' || @type == 'Critical'
+	    	@xslt_dir = @schema[:critical]
+	    elsif @type == 'documentary' || @type == 'Documentary' || @type == 'diplomatic'
+	    	@xslt_dir = @schema[:documentary]
+	  	end
+	  end
+		def file
+			#TODO: needs to be written so auth is only need after request without
+			#auth is rejected
+			#file = open(self.file_path)
+			file = open(self.file_path, {:http_basic_authentication => [@confighash[:git_username], @confighash[:git_password]]})
+			return file
+		end
+		def nokogiri
+			xmldoc = Nokogiri::XML(self.file)
+		end
+		## End File Path Methods
+		### Item Header Extraction and Metadata Methods
+		def title
+			xmldoc = self.nokogiri
+			title = xmldoc.xpath("/tei:TEI/tei:teiHeader[1]/tei:fileDesc[1]/tei:titleStmt[1]/tei:title[1]", 'tei' => 'http://www.tei-c.org/ns/1.0')
+			return title.text
+		end
+		def author
+			xmldoc = self.nokogiri
+			author = xmldoc.xpath("/tei:TEI/tei:teiHeader[1]/tei:fileDesc/tei:titleStmt[1]/tei:author", 'tei' => 'http://www.tei-c.org/ns/1.0')
+			return author.text
+		end
+		def editor
+			xmldoc = self.nokogiri
+			editor = xmldoc.xpath("/tei:TEI/tei:teiHeader[1]/tei:fileDesc/tei:titleStmt[1]/tei:editor", 'tei' => 'http://www.tei-c.org/ns/1.0')
+			return editor.text
+		end
+		def ed_no
+			xmldoc = self.nokogiri
+			ed_no = xmldoc.at_xpath("/tei:TEI/tei:teiHeader[1]/tei:fileDesc[1]/tei:editionStmt[1]/tei:edition[1]/@n", 'tei' => 'http://www.tei-c.org/ns/1.0')
+			return ed_no.value
+		end
+		def ed_date
+			xmldoc = self.nokogiri
+			ed_date = xmldoc.at_xpath("/tei:TEI/tei:teiHeader[1]/tei:fileDesc[1]/tei:editionStmt[1]/tei:edition[1]/tei:date[1]/@when", 'tei' => 'http://www.tei-c.org/ns/1.0')
+			return ed_date.value
+		end
+		def pub_date
+			xmldoc = self.nokogiri
+			pub_date = xmldoc.at_xpath("/tei:TEI/tei:teiHeader[1]/tei:fileDesc[1]/tei:publicationStmt[1]/tei:date[1]/@when", 'tei' => 'http://www.tei-c.org/ns/1.0')
+			return pub_date.value
+		end
+		def encoding_method
+			xmldoc = self.nokogiri
+			encoding_method = xmldoc.at_xpath("/tei:TEI/tei:teiHeader[1]/tei:encodingDesc[1]/tei:variantEncoding[1]/@method", 'tei' => 'http://www.tei-c.org/ns/1.0')
+			return encoding_method.value
+		end
+		def encoding_location
+			xmldoc = self.nokogiri
+			encoding_location = xmldoc.at_xpath("/tei:TEI/tei:teiHeader[1]/tei:encodingDesc[1]/tei:variantEncoding[1]/@location", 'tei' => 'http://www.tei-c.org/ns/1.0')
+			return encoding_location.value
+		end
+		def number_of_columns
+			xmldoc = self.nokogiri
+			test = xmldoc.xpath("//tei:pb", 'tei' => 'http://www.tei-c.org/ns/1.0')
+			if @type == "critical"
+				number_of_columns = nil
+			elsif xmldoc.xpath("//tei:pb", 'tei' => 'http://www.tei-c.org/ns/1.0').count != 0
+            number_of_columns = 1
+      elsif xmldoc.xpath("//tei:cb", 'tei' => 'http://www.tei-c.org/ns/1.0').count != 0
+           	number_of_columns = 2
+      end
+      return number_of_columns
+    end
+		### Begin transform (XSLT) methocs ###
+		def transform(xsltfile, xslt_param_array=[])
+			doc = xslt_transform(self.nokogiri, xsltfile, xslt_param_array)
+    end
+		def transform_apply(xsltfile, xslt_param_array=[])
+			doc = xslt_apply_to(self.nokogiri, xsltfile, xslt_param_array)
+    end
+    def transform_main_view(xslt_param_array=[])
+			xsltfile=@xslt_dir + @schema[:main_view] # "text_display.xsl"
+			doc = self.transform_apply(xsltfile, xslt_param_array)
+		end
+		def transform_index_view(xslt_param_array=[])
+			xsltfile=@xslt_dir + @schema[:index_view] # "text_display_index.xsl"
+			doc = self.transform_apply(xsltfile, xslt_param_array)
+		end
+		def transform_clean(xslt_param_array=[])
+    	xsltfile=@xslt_dir + @schema[:clean_view] # "clean_forStatistics.xsl"
+    	doc = self.transform_apply(xsltfile, xslt_param_array)
+    end
+    def transform_clean_nokogiri(xslt_param_array=[])
+    	xsltfile=@xslt_dir + @schema[:clean_view] # "clean_forStatistics.xsl"
+    	doc = self.transform(xsltfile, xslt_param_array)
+    end
+		def transform_plain_text(xslt_param_array=[])
+    	xsltfile=@xslt_dir + @schema[:plain_text] # "plaintext.xsl"
+    	doc = self.transform_apply(xsltfile, xslt_param_array)
+    end
+    def transform_plain_text_nokogiri(xslt_param_array=[])
+    	xsltfile=@xslt_dir + @schema[:plain_text] # "plaintext.xsl"
+    	doc = self.transform(xsltfile, xslt_param_array)
+    end
+    def transform_json(xslt_param_array=[])
+    	xsltfile=@xslt_dir + @schema[:json] # "plaintext.xsl"
+    	doc = self.transform_apply(xsltfile, xslt_param_array)
+    end
+    def transform_toc(xslt_param_array=[])
+    	xsltfile=@xslt_dir + @schema[:toc] # "lectio_outline.xsl"
+    	doc = self.transform_apply(xsltfile, xslt_param_array)
+    end
+    ### End of Transformation Methods ###
+    ### Begin Statistics Methods ###
+    def word_count
+    	plaintext = self.transform_plain_text
+    	size = plaintext.split.size
+    end
+    def word_array
+    	plaintext = self.transform_plain_text
+    	word_array = plaintext.split
+    	word_array.map!{ |word| word.downcase}
+    end
+    def word_frequency(sort, order)
+    	word_array = self.word_array
+    	wf = Hash.new(0)
+			word_array.each { |word| wf[word] += 1 }
+			if sort == "frequency"
+				if order == "descending" # high to low
+					wf = wf.sort_by{|k,v| v}.reverse
+				elsif order == "ascending" # low to high
+					wf = wf.sort_by{|k,v| v}
+				end
+			elsif sort == "word"
+				if order == "descending" # z - a
+						wf = wf.sort_by{|k,v| k}.reverse
+				elsif order == "ascending" #a - z
+						wf = wf.sort_by{|k,v| k}
+				end
+			end
+			return wf.to_h
+    end
+  end
+end