RubyGems - rbpdf-fruitcake0525 - Versions diffs - 1.19.0 - Mend

rbpdf-fruitcake0525 1.19.0

Files changed (51) hide show

checksums.yaml +7 -0
data/CHANGELOG +96 -0
data/Gemfile +7 -0
data/LICENSE.TXT +504 -0
data/README.md +64 -0
data/Rakefile +12 -0
data/lib/core/rmagick.rb +93 -0
data/lib/htmlcolors.rb +207 -0
data/lib/rbpdf.rb +15138 -0
data/lib/rbpdf/version.rb +3 -0
data/lib/unicode_data.rb +18315 -0
data/logo_example.png +0 -0
data/rbpdf.gemspec +37 -0
data/test/err_font1.rb +3 -0
data/test/err_font2.rb +4 -0
data/test/logo_rbpdf_8bit.gif +0 -0
data/test/logo_rbpdf_8bit.jpg +0 -0
data/test/logo_rbpdf_8bit.png +0 -0
data/test/logo_rbpdf_8bit_alpha.gif +0 -0
data/test/logo_rbpdf_mono_gray.jpg +0 -0
data/test/logo_rbpdf_mono_gray.png +0 -0
data/test/logo_rbpdf_mono_rgb.jpg +0 -0
data/test/logo_rbpdf_mono_rgb.png +0 -0
data/test/png_test_alpha.png +0 -0
data/test/png_test_msk_alpha.png +0 -0
data/test/png_test_non_alpha.png +0 -0
data/test/rbpdf_bidi_test.rb +438 -0
data/test/rbpdf_bookmark_test.rb +56 -0
data/test/rbpdf_cell_test.rb +266 -0
data/test/rbpdf_content_test.rb +196 -0
data/test/rbpdf_css_test.rb +636 -0
data/test/rbpdf_dom_test.rb +338 -0
data/test/rbpdf_font_func_test.rb +41 -0
data/test/rbpdf_font_style_test.rb +33 -0
data/test/rbpdf_font_test.rb +291 -0
data/test/rbpdf_format_test.rb +26 -0
data/test/rbpdf_func_test.rb +135 -0
data/test/rbpdf_html_anchor_test.rb +107 -0
data/test/rbpdf_html_func_test.rb +166 -0
data/test/rbpdf_html_test.rb +580 -0
data/test/rbpdf_htmlcell_test.rb +64 -0
data/test/rbpdf_image_rmagick_test.rb +294 -0
data/test/rbpdf_image_test.rb +107 -0
data/test/rbpdf_test.rb +377 -0
data/test/rbpdf_transaction_test.rb +199 -0
data/test/rbpdf_viewerpreferences_test.rb +37 -0
data/test/rbpdf_write_test.rb +225 -0
data/test/test_helper.rb +4 -0
data/test_unicode.rbpdf +115 -0
data/utf8test.txt +120 -0
metadata +205 -0

data/test/rbpdf_format_test.rb ADDED Viewed

@@ -0,0 +1,26 @@
+require 'test_helper'
+class RbpdfFormatTest < Test::Unit::TestCase
+  test "set_page_orientation" do
+    pdf = RBPDF.new
+    pagedim = pdf.set_page_orientation('')
+    assert_equal pagedim['or'], 'P'
+    assert_equal pagedim['pb'], true
+    assert_equal pagedim['olm'], nil
+    assert_equal pagedim['orm'], nil
+    assert_in_delta pagedim['bm'], 20, 0.1
+    pagedim = pdf.set_page_orientation('P')
+    assert_equal pagedim['or'], 'P'
+    pagedim = pdf.set_page_orientation('L', false)
+    assert_equal pagedim['or'], 'L'
+    assert_equal pagedim['pb'], false
+    pagedim = pdf.set_page_orientation('P', true, 5)
+    assert_equal pagedim['or'], 'P'
+    assert_equal pagedim['pb'], true
+    assert_equal pagedim['bm'], 5
+  end
+end

data/test/rbpdf_func_test.rb ADDED Viewed

@@ -0,0 +1,135 @@
+require 'test_helper'
+class RbpdfTest < Test::Unit::TestCase
+  class MYPDF < RBPDF
+    def getSpaceString
+      super
+    end
+  end
+  test "get_html_unit_to_units test" do
+    pdf = RBPDF.new
+    unit = pdf.get_html_unit_to_units("100", 1)
+    assert_in_delta unit, 35.27, 0.01
+    unit = pdf.get_html_unit_to_units("100px", 1, 'px', false)
+    assert_in_delta unit, 35.27, 0.01
+    unit = pdf.get_html_unit_to_units(100, 1, 'pt', false)
+    assert_in_delta unit, 35.27, 0.01
+    unit = pdf.get_html_unit_to_units(100.0, 1, 'pt', false)
+    assert_in_delta unit, 35.27, 0.01
+    unit = pdf.get_html_unit_to_units("100.0", 1, 'pt', false)
+    assert_in_delta unit, 35.27, 0.01
+    unit = pdf.get_html_unit_to_units("200", 1, '%', false)
+    assert_equal unit, 2.0
+    unit = pdf.get_html_unit_to_units("400%", 1, '%', false)
+    assert_equal unit, 4.0
+    unit = pdf.get_html_unit_to_units("10", 1, '%', false)
+    assert_equal unit, 0.1
+    unit = pdf.get_html_unit_to_units("10mm", 1, '%', false)
+    assert_in_delta unit, 10, 0.01
+    unit = pdf.get_html_unit_to_units("10", 1, 'mm', false)
+    assert_in_delta unit, 10, 0.01
+    unit = pdf.get_html_unit_to_units(10, 1, 'mm', false)
+    assert_in_delta unit, 10, 0.01
+    unit = pdf.get_html_unit_to_units("1", 1, 'cm', false)
+    assert_in_delta unit, 10, 0.01
+    unit = pdf.get_html_unit_to_units(10, 1, 'em', false)
+    assert_equal unit, 10
+    unit = pdf.get_html_unit_to_units(10, 2, 'em', false)
+    assert_equal unit, 20
+  end
+  test "getSpaceString test" do
+    pdf = MYPDF.new
+    spacestr = pdf.getSpaceString()
+    assert_equal spacestr, 32.chr
+    pdf.set_font('freesans', '', 18)
+    spacestr = pdf.getSpaceString()
+    assert_equal spacestr, 0.chr + 32.chr
+  end
+  test "revstrpos test" do
+    pdf = RBPDF.new
+    pos = pdf.revstrpos('abcd efgh ', 'cd')
+    assert_equal pos, 2
+    pos = pdf.revstrpos('abcd efgh ', 'cd ')
+    assert_equal pos, 2
+    pos = pdf.revstrpos('abcd efgh abcd efg', 'cd')
+    assert_equal pos, 12
+    pos = pdf.revstrpos('abcd efgh abcd efg', 'zy')
+    assert_equal pos, nil
+  end
+  test "revstrpos offset test 1" do
+    pdf = RBPDF.new
+    pos = pdf.revstrpos('abcd efgh ', 'cd', 3)          # 'abc'
+    assert_equal pos, nil
+    pos = pdf.revstrpos('abcd efgh ', 'cd', 4)          # 'abcd'
+    assert_equal pos, 2
+    pos = pdf.revstrpos('abcd efgh abcd efg', 'cd', 3)  # 'abc'
+    assert_equal pos, nil
+    pos = pdf.revstrpos('abcd efgh abcd efg', 'cd', 4)  # 'abcd'
+    assert_equal pos, 2
+    pos = pdf.revstrpos('abcd efgh abcd efg', 'cd', 13) # 'abcd efgh abc'
+    assert_equal pos, 2
+    pos = pdf.revstrpos('abcd efgh abcd efg', 'cd', 14) # 'abcd efgh abcd'
+    assert_equal pos, 12
+  end
+  test "revstrpos offset test 2" do
+    pdf = RBPDF.new
+    pos = pdf.revstrpos('abcd efgh ', 'cd', -6)         # 'abcd'
+    assert_equal pos, 2
+    pos = pdf.revstrpos('abcd efgh ', 'cd', -7)         # 'abc'
+    assert_equal pos, nil
+    pos = pdf.revstrpos('abcd efgh abcd efg', 'cd', -4) # 'abcd efgh abcd'
+    assert_equal pos, 12
+    pos = pdf.revstrpos('abcd efgh abcd efg', 'cd', -5) # 'abcd efgh abc'
+    assert_equal pos, 2
+  end
+  test "set_line_style Basic test" do
+    pdf = RBPDF.new
+    pdf.set_line_style({'width' => 0.1, 'cap' => 'butt', 'join' => 'miter', 'dash' => 0, 'color' => [0, 0, 0]})
+    pdf.set_line_style({'width' => 0.1, 'cap' => 'butt', 'join' => 'miter', 'dash' => '', 'phase' => 0, 'color' => [255, 0, 0]})
+    pdf.set_line_style({'width' => 0.1, 'cap' => 'butt', 'join' => 'miter', 'dash' => '1,2,3,4', 'phase' => 0, 'color' => [255, 0, 0]})
+    pdf.set_line_style({'width' => 0.1, 'cap' => 'butt', 'join' => 'miter', 'dash' => 'a', 'phase' => 0, 'color' => [255, 0, 0]}) # Invalid
+  end
+  test "get_string_width encoding test" do
+    return unless 'test'.respond_to?(:force_encoding)
+    pdf = RBPDF.new
+    str = 'test'.force_encoding('UTF-8')
+    width = pdf.get_string_width(str)
+    assert_equal str.encoding.to_s, 'UTF-8'
+  end
+end

data/test/rbpdf_html_anchor_test.rb ADDED Viewed

@@ -0,0 +1,107 @@
+require 'test_helper'
+class RbpdfTest < Test::Unit::TestCase
+  class MYPDF < RBPDF
+    def getPageBuffer(page)
+      super
+    end
+  end
+  test "anchor with text inside" do
+    pdf = RBPDF.new
+    pdf.add_page()
+    htmlcontent = '<a name="foo">HTML Example</a>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    position = pdf.get_html_anchor_position('foo')
+    assert_equal position, [1, 10.001249999999999]
+  end
+  test "anchor with id" do
+    pdf = RBPDF.new
+    pdf.add_page()
+    htmlcontent = '<a id="foo">HTML Example</a>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    position = pdf.get_html_anchor_position('foo')
+    assert_equal position, [1, 10.001249999999999]
+  end
+  test "empty anchor" do
+    pdf = RBPDF.new
+    pdf.add_page()
+    htmlcontent = '<a id="foo"></a>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    position = pdf.get_html_anchor_position('foo')
+    assert_equal position, [1, 10.001249999999999]
+  end
+  test "anchor with overtical offset" do
+    pdf = RBPDF.new
+    pdf.add_page()
+    htmlcontent = '<br><br><br><br><br><br><br><br><br><br><a id="foo"></a>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    position = pdf.get_html_anchor_position('foo')
+    assert_equal position, [1, 57.626249999999985]
+  end
+  test "on the second page" do
+    pdf = RBPDF.new
+    pdf.add_page()
+    htmlcontent = '1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br><br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br><br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br><br><br><br><br><br><br><br><br>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    htmlcontent = '<a id="foo"></a>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    position = pdf.get_html_anchor_position('foo')
+    assert_equal position, [3, 68.20958333333331]
+  end
+  test "maps when anchor after link" do
+    pdf = RBPDF.new
+    pdf.add_page()
+    htmlcontent = '<a href="#foo">FooLink</a>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    htmlcontent = '1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br><br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br><br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br><br><br><br><br><br><br><br><br>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    htmlcontent = '<a id="foo"></a>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    pdf.send(:mapLinksToHtmlAnchors)
+    link_position = pdf.instance_variable_get(:@links)[1]
+    assert_equal link_position,  [3, 73.50124999999998]
+  end
+  test "maps when anchor before link" do
+    pdf = RBPDF.new
+    pdf.add_page()
+    htmlcontent = '<a id="foo"></a>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    htmlcontent = '1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br><br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br><br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br><br><br><br><br><br><br><br><br>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    htmlcontent = '<a href="#foo">FooLink</a>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    pdf.send(:mapLinksToHtmlAnchors)
+    link_position = pdf.instance_variable_get(:@links)[1]
+    assert_equal link_position, [1, 10.001249999999999]
+  end
+end

data/test/rbpdf_html_func_test.rb ADDED Viewed

@@ -0,0 +1,166 @@
+require 'test_helper'
+class RbpdfTest < Test::Unit::TestCase
+  class MYPDF < RBPDF
+    def addHTMLVertSpace(hbz, hb, cell, firstorlast)
+      super
+    end
+    def sanitize_html(html)
+      super
+    end
+  end
+  test "html func addHTMLVertSpace empty lines test" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    # same line, start position
+    x1 = pdf.get_x
+    pdf.set_x(x1 + 10)
+    y1 = pdf.get_y
+    pdf.addHTMLVertSpace(1, 0, false, true)
+    x2 = pdf.get_x
+    y2 = pdf.get_y
+    assert_equal x2, x1
+    assert_equal y2, y1
+    # same line, @c_margin position
+    margins = pdf.get_margins
+    x1 = pdf.get_x
+    y1 = pdf.get_y
+    pdf.addHTMLVertSpace(1, 0, true, true)
+    x2 = pdf.get_x
+    y2 = pdf.get_y
+    assert_equal x2, x1 + margins['cell']
+    assert_equal y2, y1
+  end
+  test "html func addHTMLVertSpace add line test" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    # next line, start position
+    x1 = pdf.get_x
+    pdf.set_x(x1 + 10)
+    y1 = pdf.get_y
+    pdf.addHTMLVertSpace(5, 0, false, false)
+    x2 = pdf.get_x
+    y2 = pdf.get_y
+    assert_equal x2, x1
+    assert_equal y2, y1 + 5
+    # next line, @c_margin position
+    margins = pdf.get_margins
+    x1 = pdf.get_x
+    y1 = pdf.get_y
+    pdf.addHTMLVertSpace(5, 0, true, false)
+    x2 = pdf.get_x
+    y2 = pdf.get_y
+    assert_equal x2, x1 + margins['cell']
+    assert_equal y2, y1 + 5
+  end
+  test "html func addHTMLVertSpace height of the break test 1" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    margins = pdf.get_margins
+    x1 = pdf.get_x
+    y1 = pdf.get_y
+    pdf.addHTMLVertSpace(0, 5, true, false) # height of the break : 5
+    x2 = pdf.get_x
+    y2 = pdf.get_y
+    assert_equal x2, x1 + margins['cell']
+    assert_equal y2, y1 + 5
+    pdf.addHTMLVertSpace(0, 5, true, false)  # height of the break : 5
+    x3 = pdf.get_x
+    y3 = pdf.get_y
+    assert_equal x3, x2
+    assert_equal y3, y2
+    pdf.addHTMLVertSpace(0, 5 + 2, true, false)  # height of the break : 7
+    x4 = pdf.get_x
+    y4 = pdf.get_y
+    assert_equal x4, x3
+    assert_equal y4, y3 + 2
+    pdf.addHTMLVertSpace(0, 5, true, false)  # height of the break : 7
+    x5 = pdf.get_x
+    y5 = pdf.get_y
+    assert_equal x5, x4
+    assert_equal y5, y4
+    pdf.addHTMLVertSpace(0, 5 + 2 + 1, true, false)  # height of the break : 8
+    x6 = pdf.get_x
+    y6 = pdf.get_y
+    assert_equal x6, x5
+    assert_equal y6, y5 + 1
+    pdf.addHTMLVertSpace(0, 10, true, true)  # height of the break : 0 (reset)
+    x7 = pdf.get_x
+    y7 = pdf.get_y
+    assert_equal x7, x6
+    assert_equal y7, y6
+    pdf.addHTMLVertSpace(0, 2, true, false)  # height of the break : 2
+    x8 = pdf.get_x
+    y8 = pdf.get_y
+    assert_equal x8, x7
+    assert_equal y8, y7 + 2
+  end
+  test "html func addHTMLVertSpace height of the break test 2" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    x1 = pdf.get_x
+    y1 = pdf.get_y
+    pdf.addHTMLVertSpace(10, 5, false, false) # height of the break : 5
+    x2 = pdf.get_x
+    y2 = pdf.get_y
+    assert_equal x2, x1
+    assert_equal y2, y1 + 10 + 5
+    pdf.addHTMLVertSpace(10, 5, false, false)  # height of the break : 5
+    x3 = pdf.get_x
+    y3 = pdf.get_y
+    assert_equal x3, x2
+    assert_equal y3, y2 + 10
+    pdf.addHTMLVertSpace(10, 5 + 2, false, false)  # height of the break : 7
+    x4 = pdf.get_x
+    y4 = pdf.get_y
+    assert_equal x4, x3
+    assert_equal y4, y3 + 10 + 2
+  end
+  test "html func sanitize test 1" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    html = '<table border="1"><thead><tr><td>ABCD</td><td>EFGH</td><td>IJKL</td></tr></thead><tr><td>abcd</td><td>efgh</td><td>ijkl</td></tr><tr><td>' + 'ABC' + '</td></tr></table>'
+    html = pdf.sanitize_html(html).gsub(/[\r\n]/,'')
+    assert_equal html, %{<table border="1"><thead><tr><td>ABCD</td><td>EFGH</td><td>IJKL</td></tr></thead><tr><td>abcd</td><td>efgh</td><td>ijkl</td></tr><tr><td>ABC</td></tr></table>}
+  end
+  test "html func sanitize test 2" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    htmlcontent = '1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br><br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br><br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br><br><br><br><br><br><br><br><br>'
+    html = '<table cellpadding="1"><thead><tr><td>ABCD</td><td>EFGH</td><td>IJKL</td></tr></thead><tr><td>abcd</td><td>efgh</td><td>ijkl</td></tr><tr><td>' + htmlcontent + '</td></tr></table>'
+    html = pdf.sanitize_html(html).gsub(/[\r\n]/,'')
+    assert_equal html, %{<table cellpadding="1"><thead><tr><td>ABCD</td><td>EFGH</td><td>IJKL</td></tr></thead><tr><td>abcd</td><td>efgh</td><td>ijkl</td></tr><tr><td>1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br><br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br><br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br><br><br><br><br><br><br><br><br></td></tr></table>}
+  end
+  test "html func sanitize open angled bracket '<' test" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    html = "<p>AAA '<'-BBB << <<< '</' '<//' '<///' <</ <<// CCC.</p>"
+    html = pdf.sanitize_html(html).gsub(/[\r\n]/,'')
+    assert_equal %{<p>AAA '&lt;'-BBB &lt;&lt; &lt;&lt;&lt; '&lt;/' '&lt;//' '&lt;///' &lt;&lt;/ &lt;&lt;// CCC.</p>}, html
+  end
+end

data/test/rbpdf_html_test.rb ADDED Viewed

@@ -0,0 +1,580 @@
+# coding: ASCII-8BIT
+require 'test_helper'
+class RbpdfHtmlTest < Test::Unit::TestCase
+  class MYPDF < RBPDF
+    def getPageBuffer(page)
+      super
+    end
+    # get text count and x_pos from pdf page
+    def get_html_text_position_x(page, regrep_text, x_pos_exp=nil)
+      count_line, count_text, x_pos, y_pos = get_html_text_position(page, regrep_text, x_pos_exp)
+      return count_line, count_text, x_pos
+    end
+    # get text count and y_pos from pdf page
+    def get_html_text_position_y(page, regrep_text)
+      count_line, count_text, x_pos, y_pos = get_html_text_position(page, regrep_text)
+      return count_line, count_text, y_pos
+    end
+    # get text count and pos from pdf page
+    def get_html_text_position(page, regrep_text, x_pos_exp=nil)
+      content = []
+      contents = getPageBuffer(page)
+      contents.each_line {|line| content.push line.chomp }
+      count_line = count_text = 0
+      x_pos = y_pos = -1
+      content.each do |line|
+        count_line += 1 if line =~ /TJ ET Q$/ # Text Line Count
+        if line =~ regrep_text
+          count_text += 1
+          line =~ /BT ([0-9.]+) ([0-9.]+) Td/
+          x_pos = $1
+          y_pos = $2 if y_pos == -1 # y first position only
+          if x_pos.nil? or y_pos.nil? # Error
+            return count_line, count_text, nil, nil
+          end
+          if !x_pos_exp.nil? and x_pos != x_pos_exp # Error
+            return count_line, count_text, x_pos, y_pos
+          end
+        end
+      end
+      return count_line, count_text, x_pos, y_pos
+    end
+    # get text from pdf page
+    def get_html_text(page)
+      content = []
+      contents = getPageBuffer(page)
+      contents.each_line {|line| content.push line.chomp }
+      pdf_text = ''
+      content.each do |line|
+        if line =~ /\[\((.*)\)\] TJ ET/
+          pdf_text << $1
+        end
+      end
+      return pdf_text
+    end
+  end
+  test "write_html Basic test" do
+    pdf = RBPDF.new
+    pdf.add_page()
+    htmlcontent = '<h1>HTML Example</h1>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    htmlcontent = 'abcdefghijklmnopgrstuvwxyz01234567890 abcdefghijklmnopgrstuvwxyz01234567890 abcdefghijklmnopgrstuvwxyz01234567890 abcdefghijklmnopgrstuvwxyz01234567890 abcdefghijklmnopgrstuvwxyz01234567890'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    htmlcontent = '1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br><br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br><br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br><br><br><br><br><br><br><br><br>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    pno = pdf.get_page
+    assert_equal pno, 3
+  end
+  test "write_html Table test 1" do
+    pdf = RBPDF.new
+    pdf.add_page()
+    tablehtml = '<table border="1" cellspacing="1" cellpadding="1"><tr><td>a</td><td>b</td></tr><tr><td>c</td><td>d</td></tr></table>'
+    pdf.write_html(tablehtml, true, 0, true, 0)
+    htmlcontent = '1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br><br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br><br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br><br><br><br><br><br><br><br><br>'
+    tablehtml = '<table border="1" cellspacing="1" cellpadding="1"><tr><td>a</td><td>b</td></tr><tr><td>c</td><td>' + htmlcontent + '</td></tr></table>'
+    pdf.write_html(tablehtml, true, 0, true, 0)
+    pno = pdf.get_page
+    assert_equal pno, 3
+  end
+  test "write_html Table test 2" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    htmlcontent = '1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br><br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br><br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br><br><br><br><br><br><br><br><br>'
+    tablehtml = '<table border="1"><tr><td>ABCD</td><td>EFGH</td><td>IJKL</td></tr>
+                 <tr><td>abcd</td><td>efgh</td><td>ijkl</td></tr>
+                 <tr><td>' + htmlcontent + '</td></tr></table>'
+    pdf.write_html(tablehtml, true, 0, true, 0)
+    pno = pdf.get_page
+    assert_equal pno, 3
+    # Page 1
+    count_line, count_text, xpos1 = pdf.get_html_text_position_x(1, /ABCD/) # Header
+    assert_not_nil xpos1
+    assert_equal 1, count_text
+    assert_equal 13, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(1, /abcd/)
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 13, count_line
+    # Page 2
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(2, /\([6-9]\)/, xpos1)
+    assert_not_nil xpos2
+    assert_equal xpos1, xpos2
+    assert_equal 7, count_line
+  end
+  test "write_html Table thead tag test 1" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    tablehtml = '<table border="1" cellpadding="1" cellspacing="1">
+    <thead><tr><td>ABCD</td><td>EFGH</td><td>IJKL</td></tr></thead>
+    <tr><td>abcd</td><td>efgh</td><td>ijkl</td></tr>
+    </table>'
+    pdf.write_html(tablehtml, true, 0, true, 0)
+    page = pdf.get_page
+    assert_equal 1, page
+    count_line, count_text, xpos = pdf.get_html_text_position_x(1, /ABCD/) # Header
+    assert_equal 1, count_text
+  end
+  test "write_html Table thead tag test 2" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    htmlcontent = '1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br><br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br><br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br><br><br><br><br><br><br><br><br>'
+    tablehtml = '<table><thead><tr><td>ABCD</td><td>EFGH</td><td>IJKL</td></tr></thead>
+                 <tr><td>abcd</td><td>efgh</td><td>ijkl</td></tr>
+                 <tr><td>' + htmlcontent + '</td></tr></table>'
+    pdf.write_html(tablehtml, true, 0, true, 0)
+    page = pdf.get_page
+    assert_equal 3, page
+    # Page 1
+    count_line, count_text, xpos1 = pdf.get_html_text_position_x(1, /ABCD/) # Header
+    assert_not_nil xpos1
+    assert_equal 1, count_text
+    assert_equal 13, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(1, /abcd/)
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 13, count_line
+    # Page 2
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(2, /ABCD/, xpos1) # Header
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 10, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(2, /abcd/)
+    assert_equal 0, count_text
+    assert_equal 10, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(2, /\([6-9]\)/, xpos1)
+    assert_not_nil xpos2
+    assert_equal xpos1, xpos2
+    assert_equal 10, count_line
+    # Page 3
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(3, /ABCD/, xpos1) # Header
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 5, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(3, /abcd/)
+    assert_equal 0, count_text
+    assert_equal 5, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(3, /\(11\)/, xpos1)
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 5, count_line
+  end
+  test "write_html_cell Table thead tag test" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    htmlcontent = '<br>1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br>
+<br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br>
+<br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br>
+<br><br><br><br><br><br><br><br>'
+    tablehtml ='<table><thead><tr>
+    <th style="text-align: left">Left align</th>
+    <th style="text-align: right">Right align</th>
+    <th style="text-align: center">Center align</th>
+    </tr> </thead><tbody> <tr>
+    <td style="text-align: left">left' + htmlcontent + '</td>
+    <td style="text-align: right">right</td>
+    <td style="text-align: center">center</td>
+    </tr> </tbody></table>'
+    pdf.write_html_cell(0, 0, '', '',tablehtml)
+    page = pdf.get_page
+    assert_equal 1, page
+    # Page 1
+    count_line, count_text, xpos1 = pdf.get_html_text_position_x(1, /Left align/) # Header
+    assert_not_nil xpos1
+    assert_equal 1, count_text
+    assert_equal 13, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(1, /left/)
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal 13, count_line
+    assert_equal xpos1, xpos2
+    # Page 2
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(2, /Left align/, xpos1) # Header
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 10, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(2, /\(6\)/, xpos1)
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 10, count_line
+    # Page 3
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(3, /Left align/, xpos1) # Header
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 5, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(3, /\(11\)/, xpos1)
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 5, count_line
+  end
+  test "write_html_cell Table thead tag  cellpadding x position test" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    htmlcontent = '<br>1<br><br><br><br><br><br><br><br><br><br> 2<br><br><br><br><br><br><br><br><br><br> 3<br><br><br><br><br><br><br><br><br><br> 4<br>
+<br><br><br><br><br><br><br><br><br> 5<br><br><br><br><br><br><br><br><br><br> 6<br><br><br><br><br><br><br><br><br><br> 7<br><br><br><br><br><br><br>
+<br><br><br> 8<br><br><br><br><br><br><br><br><br><br> 9<br><br><br><br><br><br><br><br><br><br> 10<br><br><br><br><br><br><br><br><br><br> 11<br><br>
+<br><br><br><br><br><br><br><br>'
+    tablehtml ='<table cellpadding="10"><thead><tr>
+    <th style="text-align: left">Left align</th>
+    <th style="text-align: right">Center align</th>
+    <th style="text-align: left">Right align</th>
+    </tr> </thead><tbody> <tr>
+    <td style="text-align: left">left</td>
+    <td style="text-align: right">center</td>
+    <td style="text-align: left">right' + htmlcontent + '</td>
+    </tr> </tbody></table>'
+    pdf.write_html_cell(0, 0, '', '',tablehtml)
+    page = pdf.get_page
+    assert_equal 1, page
+    # Page 1
+    count_line, count_text, xpos1 = pdf.get_html_text_position_x(1, /Right align/) # Header
+    assert_not_nil xpos1
+    assert_equal 1, count_text
+    assert_equal 13, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(1, /right/)
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 13, count_line
+    # Page 2
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(2, /Right align/, xpos1) # Header
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 10, count_line
+    count_line, count_text, xpos2 = pdf.get_html_text_position_x(2, /\(6\)/, xpos1)
+    assert_not_nil xpos2
+    assert_equal 1, count_text
+    assert_equal xpos1, xpos2
+    assert_equal 10, count_line
+  end
+  test "write_html_cell Table thead tag cellpadding y position test 1" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    table_start='<table cellpadding="10"><thead><tr>
+<th style="text-align: left">Left align</th><th style="text-align: center">Center align</th><th style="text-align: right">Right align</th>
+</tr></thead><tbody>'
+    table_col='<tr><td style="text-align: left">AAA</td><td style="text-align: center">BBB</td><td style="text-align: right">CCC</td></tr>'
+    table_end='</tbody></table>'
+    tablehtml= table_start + table_col * 30 + table_end
+    pdf.write_html_cell(0, 0, '', '',tablehtml)
+    # Page 1
+    count_line, count_text, ypos1 = pdf.get_html_text_position_y(1, /Left align/) # Header
+    assert_not_nil ypos1
+    assert_equal 1, count_text
+    assert_equal 65, count_line
+    count_line, count_text, ypos2 = pdf.get_html_text_position_y(1, /AAA/)
+    assert_not_nil ypos2
+    assert_equal 20, count_text
+    assert_equal 65, count_line
+    base_pos = ypos1.to_i - ypos2.to_i
+    # Page 2
+    count_line, count_text, ypos1 = pdf.get_html_text_position_y(2, /Left align/) # Header
+    assert_not_nil ypos2
+    assert_equal 1, count_text
+    assert_equal 34, count_line
+    count_line, count_text, ypos2 = pdf.get_html_text_position_y(2, /AAA/)
+    assert_not_nil ypos2
+    assert_equal 10, count_text
+    assert_equal 34, count_line
+    assert_equal base_pos, ypos1.to_i - ypos2.to_i
+  end
+  test "write_html_cell Table thead tag cellpadding y position test 2" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    table_start='abc<br><table cellpadding="10"><thead><tr>
+<th style="text-align: left">Left align</th><th style="text-align: center">Center align</th><th style="text-align: right">Right align</th>
+</tr></thead><tbody>'
+    table_col='<tr><td style="text-align: left">AAA</td><td style="text-align: center">BBB</td><td style="text-align: right">CCC</td></tr>'
+    table_end='</tbody></table>'
+    tablehtml= table_start + table_col * 30 + table_end
+    pdf.write_html_cell(0, 0, '', '',tablehtml)
+    # Page 1
+    count_line, count_text, ypos1 = pdf.get_html_text_position_y(1, /Left align/) # Header
+    assert_not_nil ypos1
+    assert_equal 1, count_text
+    assert_equal 66, count_line
+    count_line, count_text, ypos2 = pdf.get_html_text_position_y(1, /AAA/)
+    assert_not_nil ypos2
+    assert_equal 20, count_text
+    assert_equal 66, count_line
+    base_pos = ypos1.to_i - ypos2.to_i
+    # Page 2
+    count_line, count_text, ypos1 = pdf.get_html_text_position_y(2, /Left align/) # Header
+    assert_not_nil ypos2
+    assert_equal 1, count_text
+    assert_equal 34, count_line
+    count_line, count_text, ypos2 = pdf.get_html_text_position_y(2, /AAA/)
+    assert_not_nil ypos2
+    assert_equal 10, count_text
+    assert_equal 34, count_line
+    assert_equal base_pos, ypos1.to_i - ypos2.to_i
+  end
+  test "write_html ASCII text test" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    text = 'HTML Example'
+    htmlcontent = '<h1>' + text + '</h1>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    page = pdf.get_page
+    assert_equal 1, page
+    content = []
+    contents = pdf.getPageBuffer(1)
+    contents.each_line {|line| content.push line.chomp }
+    count_text = 0
+    content.each do |line|
+      count_text += 1 unless line.scan(text).empty?
+    end
+    assert_equal count_text, 1
+  end
+  test "write_html Non ASCII text test" do
+    pdf = MYPDF.new
+    pdf.add_page()
+    text = 'HTML Example ' + "\xc2\x83\xc2\x86"
+    htmlcontent = '<h1>' + text + '</h1>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    page = pdf.get_page
+    assert_equal 1, page
+    content = []
+    contents = pdf.getPageBuffer(1)
+    contents.each_line {|line| content.push line.chomp }
+    text = 'HTML Example ' + "\x83\x86"
+    text.force_encoding('ASCII-8BIT') if text.respond_to?(:force_encoding)
+    count_text = 0
+    content.each do |line|
+      line.force_encoding('ASCII-8BIT') if line.respond_to?(:force_encoding)
+      count_text += 1 unless line.scan(text).empty?
+    end
+    assert_equal count_text, 1
+  end
+  test "works internal links out of page range" do
+    pdf = RBPDF.new
+    pdf.add_page()
+    htmlcontent = '<a href="#100400_somelink">FooLink</a>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    assert_nothing_raised do
+      pdf.Close
+    end
+    assert_nothing_raised do
+      pdf.Output
+    end
+  end
+  test "write_html <b> tag test" do
+    pdf = MYPDF.new
+    pdf.set_print_header(false)
+    pdf.add_page()
+    text = ' ' + 'A' * 70
+    htmlcontent = '<b>' + text + '</b>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    pdf_text = pdf.get_html_text(1)
+    assert_equal 'A' * 70, pdf_text
+  end
+  test "write_html <i> tag test" do
+    pdf = MYPDF.new
+    pdf.set_print_header(false)
+    pdf.add_page()
+    text = ' ' + 'A' * 70
+    htmlcontent = '<i>' + text + '</i>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    pdf_text = pdf.get_html_text(1)
+    assert_equal 'A' * 70, pdf_text
+  end
+  test "write_html <u> tag test" do
+    pdf = MYPDF.new
+    pdf.set_print_header(false)
+    pdf.add_page()
+    text = ' ' + 'A' * 70
+    htmlcontent = '<u>' + text + '</u>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    pdf_text = pdf.get_html_text(1)
+    assert_equal 'A' * 70, pdf_text
+  end
+  test "write_html <pre> tag space 1 test" do
+    pdf = MYPDF.new
+    pdf.set_print_header(false)
+    pdf.add_page()
+    text = ' ' + 'A' * 70
+    htmlcontent = '<pre>' + text + '</pre>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    pdf_text = pdf.get_html_text(1)
+    assert_equal "\xa0" + 'A' * 70, pdf_text
+  end
+  test "write_html <pre> tag space 2 test" do
+    pdf = MYPDF.new
+    pdf.set_print_header(false)
+    pdf.add_page()
+    text = '  ' + 'A' * 70
+    htmlcontent = '<pre>' + text + '</pre>'
+    pdf.write_html(htmlcontent, true, 0, true, 0)
+    pdf_text = pdf.get_html_text(1)
+    assert_equal "\xa0" * 2 + 'A' * 70, pdf_text
+  end
+  test "write_html Character Entities test" do
+    pdf = MYPDF.new
+    pdf.set_print_header(false)
+    character_entities = {
+      '&lt;'    => '<',
+      '&gt;'    => '>',
+      '&amp;'   => '&',
+      '&quot;'  => '"',
+      '&nbsp;'  => "\xa0",
+      '&cent;'  => "\xa2",
+      '&pound;' => "\xa3",
+      '&yen;'   => "\xa5",
+      '&copy;'  => "\xa9",
+      '&reg;'   => "\xae",
+      '&euro;'  => "\x80",
+    }
+    character_entities.each {|ce, c|
+      pdf.add_page()
+      page = pdf.get_page
+      pdf.write_html(ce, true, 0, true, 0)
+      pdf_text = pdf.get_html_text(page)
+      assert_equal '[' + ce + ']:' + c, '[' + ce + ']:' + pdf_text
+    }
+  end
+  test "write_html Character Entities test pre mode" do
+    pdf = MYPDF.new
+    pdf.set_print_header(false)
+    character_entities = {
+      '&lt;'    => '<',
+      '&gt;'    => '>',
+      '&amp;'   => '&',
+      '&quot;'  => '"',
+      '&nbsp;'  => "\xa0",
+      '&cent;'  => "\xa2",
+      '&pound;' => "\xa3",
+      '&yen;'   => "\xa5",
+      '&copy;'  => "\xa9",
+      '&reg;'   => "\xae",
+      '&euro;'  => "\x80",
+    }
+    character_entities.each {|ce, c|
+      pdf.add_page()
+      page = pdf.get_page
+      pdf.write_html('<pre>' + ce + '</pre>', true, 0, true, 0)
+      pdf_text = pdf.get_html_text(page)
+      assert_equal '[' + ce + ']:' + c, '[' + ce + ']:' + pdf_text
+    }
+  end
+  test "unhtmlentities test" do
+    pdf = RBPDF.new
+    character_entities = {
+      '&lt;'    => '<',
+      '&gt;'    => '>',
+      '&amp;'   => '&',
+      '&quot;'  => '"',
+      '&nbsp;'  => "\xc2\xa0",
+      '&cent;'  => "\xc2\xa2",
+      '&pound;' => "\xc2\xa3",
+      '&yen;'   => "\xc2\xa5",
+      '&copy;'  => "\xc2\xa9",
+      '&reg;'   => "\xc2\xae",
+      '&euro;'  => "\xe2\x82\xac",
+    }
+    character_entities.each {|ce, c|
+      text = pdf.unhtmlentities(ce)
+      text.force_encoding('ASCII-8BIT') if text.respond_to?(:force_encoding)
+      assert_equal '[' + ce + ']:' + c, '[' + ce + ']:' + text
+    }
+  end
+end