RubyGems - markitdown - Versions diffs - 0.0.9 → 0.0.10 - Mend

markitdown 0.0.9 → 0.0.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10) hide show

data/.gitignore CHANGED Viewed

@@ -15,3 +15,5 @@ spec/reports
 test/tmp
 test/version_tmp
 tmp
+.ruby-version

data/README.md CHANGED Viewed

@@ -8,6 +8,8 @@ Markitdown is a Ruby library that converts HTML to Markdown. It's powered by Nok
  * Lists (and nested list) inside of block quotes
  * Images
  * Links
+ * Code (inline and blocks)
+ * Definition lists
 As well as other tags.

data/lib/markitdown/version.rb CHANGED Viewed

@@ -1,3 +1,3 @@
 module Markitdown
-  VERSION = "0.0.9"
+  VERSION = "0.0.10"
 end

data/lib/markitdown.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# encoding=utf-8
 require "markitdown/version"
 require "nokogiri"
@@ -11,7 +13,7 @@ module Markitdown
     # gsub(/\n{2,}/,"\n\n") - collapse any series of more than 2 new lines down to 2
     # gsub(/\t+/," ") - collapse consecutive tabs down to a single space. I use tabs to pad divs and span, this causes multiple nested spans and divs to ultimately be surrounded by a single space.
     # gsub(/ ([\.\?])/,'\1') - removes a space before a period or question mark. Things like links get surrounded by spaces. If they appear at the end of a sentence, this makes sure the punctuation isn't off.
-    self.parse_node(node).flatten.compact.join.gsub(/\n\s+\n/,"\n\n").gsub(/\n{2,}/,"\n\n").gsub(/( > \n){2,}/,"\n > \n > ").gsub(/\t+/," ").gsub(/ ([\.\?])/,'\1')
+    self.parse_node(node).flatten.compact.join.gsub(/\n\s+\n/,"\n\n").gsub(/\n{2,}/,"\n\n").gsub(/( > \n){2,}/,"\n > \n > ").gsub(/\t+/," ").gsub(/ ([\.\?])/,'\1').gsub(/\s*END_TAG\((.{1,3})\)/, "\\1")
   end
   private
@@ -69,17 +71,17 @@ module Markitdown
     when "br"
       results << self.newline(pre, nil,  2)
     when "em"
-      results << " *"
-      after = "* "
+      results << " _"
+      after = "END_TAG(_) "
     when "i"
-      results << " *"
-      after = "* "
+      results << " _"
+      after = "END_TAG(_) "
     when "strong"
       results << " **"
-      after = "** "
+      after = "END_TAG(**) "
     when "b"
       results << " **"
-      after = "** "
+      after = "END_TAG(**) "
     when "blockquote"
       results << "\n\n"
       results << pre
@@ -136,7 +138,14 @@ module Markitdown
         results << contents
       end
     end
-    results << after
+    if strip_content
+      last_tags = results.pop
+      after = after.flatten.compact.join if after.is_a?(Array)
+      last_tags = "#{last_tags}#{after}"
+      results << last_tags
+    else
+      results << after
+    end
     states.shift
     results
   end

data/spec/asmartbear.html ADDED Viewed

@@ -0,0 +1,23 @@
+<div>
+  A <a href="http://blog.smartbear.com/careers/how-to-speak-to-a-technical-person/">smart bear writes about how to talk to a technical person</a>. Some of these points really hit home for me. When I'm with my friends, I get sarcasm, but in interactions where I don't expect it, it often goes over my head. Also ambiguous pronouns are one of my biggest pet peeves both in technical and casual conversation. For instance, &quot;My friend was talking to her boss, she said X&quot;. Did your friend say X, or her boss?
+  <blockquote>
+    <br clear="none"/>
+    <div style="position: relative">
+      <div style="font-size: 16px">
+        <div style="text-decoration:none;background-color:rgb(255, 255, 255);color:rgb(51, 51, 51);font-size:16px;font-family:Arial, sans-serif;line-height:1.5625;">
+          <div style="background-color:rgb(255, 255, 255);">
+            <div style="background-color:rgb(255, 255, 255);overflow:hidden;">
+              <div style="background-color:rgb(255, 255, 255);">
+                <div style="overflow:hidden;">
+                    <span style="line-height: 1.5625;">Try to avoid using vague words like "one" or "it" to describe an issue. For example:<i style="line-height: 1.5625;">"When I opened the document, the content was askew. When I tried to print the document, the printer jammed up.<b>It</b>cannot blow up like that!"</i><span style="line-height: 1.5625;">In the last sentence of this example, are you complaining about the document or the printer? It's not really clear. So I would repeat myself even at the risk of sounding redundant. It's better to be redundant and clear than to leave the other person wondering.</span><br/>
+                </div>
+              </div>
+            </div>
+          </div>
+        </div>
+      </div>
+    </div>
+    <br clear="none"/>
+  </blockquote>
+</div>

data/spec/asmartbear.markdown ADDED Viewed

@@ -0,0 +1,10 @@
+ A [smart bear writes about how to talk to a technical person](http://blog.smartbear.com/careers/how-to-speak-to-a-technical-person/). Some of these points really hit home for me. When I'm with my friends, I get sarcasm, but in interactions where I don't expect it, it often goes over my head. Also ambiguous pronouns are one of my biggest pet peeves both in technical and casual conversation. For instance, "My friend was talking to her boss, she said X". Did your friend say X, or her boss?
+ >
+ >
+ >  Try to avoid using vague words like "one" or "it" to describe an issue. For example: _"When I opened the document, the content was askew. When I tried to print the document, the printer jammed up. **It** cannot blow up like that!"_  In the last sentence of this example, are you complaining about the document or the printer? It's not really clear. So I would repeat myself even at the risk of sounding redundant. It's better to be redundant and clear than to leave the other person wondering.
+ >
+ >
+ >
+ >

data/spec/doc.markdown CHANGED Viewed

@@ -2,7 +2,7 @@
 # Main Header
-This *is* a **test**. It includes a [link](http://www.google.com) as well as an image ![Google Logo](https://www.google.com/images/srpr/logo3w.png)
+This _is_ a **test**. It includes a [link](http://www.google.com) as well as an image ![Google Logo](https://www.google.com/images/srpr/logo3w.png)
  * bullet 1
  * bullet 2

data/spec/doc_spec.rb CHANGED Viewed

@@ -9,6 +9,14 @@ describe Markitdown do
     end
   end
+  context "When parsing the document 'asmartbear'" do
+    let(:html) { File.read("spec/asmartbear.html") }
+    it "should produce valid markdown" do
+      Markitdown.from_html(html).should == File.read("spec/asmartbear.markdown")
+    end
+  end
   context "When parsing an evernote document" do
     let(:xml) { File.read("spec/evernote.xml") }

data/spec/tag_spec.rb CHANGED Viewed

@@ -77,7 +77,7 @@ describe Markitdown do
     let(:html) { "<em>emphasis added</em>" }
     it "should return valid markdown" do
-      Markitdown.from_html(html).should == " *emphasis added* "
+      Markitdown.from_html(html).should == " _emphasis added_ "
     end
   end
@@ -85,7 +85,7 @@ describe Markitdown do
     let(:html) { "<i>italics added</i>" }
     it "should return valid markdown" do
-      Markitdown.from_html(html).should == " *italics added* "
+      Markitdown.from_html(html).should == " _italics added_ "
     end
   end
@@ -117,7 +117,7 @@ describe Markitdown do
     let(:html) { "<html><em>emphasis added</em>?</html>" }
     it "should return valid markdown without a space" do
-      Markitdown.from_html(html).should == " *emphasis added*?"
+      Markitdown.from_html(html).should == " _emphasis added_?"
     end
   end

metadata CHANGED Viewed

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: markitdown
 version: !ruby/object:Gem::Version
-  version: 0.0.9
+  version: 0.0.10
   prerelease:
 platform: ruby
 authors:
@@ -9,7 +9,7 @@ authors:
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2013-05-29 00:00:00.000000000 Z
+date: 2013-07-05 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: nokogiri
@@ -75,6 +75,8 @@ files:
 - lib/markitdown.rb
 - lib/markitdown/version.rb
 - markitdown.gemspec
+- spec/asmartbear.html
+- spec/asmartbear.markdown
 - spec/doc.html
 - spec/doc.markdown
 - spec/doc_spec.rb
@@ -96,7 +98,7 @@ required_ruby_version: !ruby/object:Gem::Requirement
       version: '0'
       segments:
       - 0
-      hash: -2154247864884821099
+      hash: 73152326707210871
 required_rubygems_version: !ruby/object:Gem::Requirement
   none: false
   requirements:
@@ -105,14 +107,16 @@ required_rubygems_version: !ruby/object:Gem::Requirement
       version: '0'
       segments:
       - 0
-      hash: -2154247864884821099
+      hash: 73152326707210871
 requirements: []
 rubyforge_project:
-rubygems_version: 1.8.24
+rubygems_version: 1.8.23
 signing_key:
 specification_version: 3
 summary: Converts HTML to Markdown
 test_files:
+- spec/asmartbear.html
+- spec/asmartbear.markdown
 - spec/doc.html
 - spec/doc.markdown
 - spec/doc_spec.rb