RubyGems - cbeta - Versions diffs - 1.3.6 → 2.0.0 - Mend

cbeta 1.3.6 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

checksums.yaml +4 -4
data/lib/cbeta.rb +0 -1
data/lib/cbeta/p5a_to_html_for_every_edition.rb +46 -22
metadata +2 -3
data/lib/cbeta/p5a_to_epub.rb +0 -872

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 593f41e3ed434a6e6cecb82d6ab138060bdc411b
-  data.tar.gz: e66b25b39df32cf7dac8616742903865eb4dc1f3
+  metadata.gz: ff4869a9d67955fc89ddd9c5f6f8e88db19f598d
+  data.tar.gz: 716234a36f10298fa572d6c7fac10115316918ce
 SHA512:
-  metadata.gz: b346f87c1eddb9908eebd99c55c7c5a2d92acf6e131b88323a9905ea0159134a22ee446d15dbb0160228d990dc723dfca5be39bcefb793915484a845d8c64ebe
-  data.tar.gz: 657358264f56a387e2e80d84a1474b66f220e5cb4428e7995d6dfec867250777bd11f42045b9bdda20c1c01ed27322988e791c02560233a82b11f02ddd911c04
+  metadata.gz: 64cf5990e9579b23e70a861696862afaafb8738e30819cb3617e92b23a54753e33542a41a0473b7368a5cd1752ec517b9ab84a8bd9da3e017c9e901918825857
+  data.tar.gz: b42dadbd97ceb255e1300231b4f43148e1eebcce2c17a837ed91535ea6c9eed3e66021d3298770c698c1fe2520d3d9c5e723f39f301af7113fb119e71c94770f

data/lib/cbeta.rb CHANGED Viewed

@@ -121,7 +121,6 @@ require 'cbeta/bm_to_text'
 require 'cbeta/char_count'
 require 'cbeta/char_freq'
 require 'cbeta/html_to_pdf'
-require 'cbeta/p5a_to_epub'
 require 'cbeta/p5a_to_html'
 require 'cbeta/p5a_to_html_for_every_edition'
 require 'cbeta/p5a_to_html_for_pdf'

data/lib/cbeta/p5a_to_html_for_every_edition.rb CHANGED Viewed

@@ -64,6 +64,23 @@ class CBETA::P5aToHTMLForEveryEdition
   end
   private
+  def before_parse_xml(xml_fn)
+    @back = { 0 => '' }
+    @back_orig = { 0 => '' }
+    @char_count = 1
+    @dila_note = 0
+    @div_count = 0
+    @in_l = false
+    @juan = 0
+    @lg_row_open = false
+    @mod_notes = Set.new
+    @next_line_buf = ''
+    @notes_mod = {}
+    @notes_orig = {}
+    @open_divs = []
+    @sutra_no = File.basename(xml_fn, ".xml")
+  end
   def convert_all
     Dir.entries(@xml_root).sort.each do |c|
@@ -71,6 +88,15 @@ class CBETA::P5aToHTMLForEveryEdition
       handle_collection(c)
     end
   end
+  def get_editions(doc)
+    r = Set.new [@orig, "【CBETA】"] # 至少有底本及 CBETA 兩個版本
+    doc.xpath('//lem|//rdg').each do |e|
+      w = e['wit'].scan(/【.*?】/)
+      r.merge w
+    end
+    r
+  end
   def handle_anchor(e)
     id = e['id']
@@ -309,12 +335,17 @@ class CBETA::P5aToHTMLForEveryEdition
   end
   def handle_lem(e)
-    w = e['wit'].scan(/【.*?】/)
-    @editions.merge w
-    w = w.join(' ')
+    # 沒有 rdg 的版本，用字同 lem
+    editions = Set.new @editions
+    e.xpath('./following-sibling::rdg').each do |rdg|
+      rdg['wit'].scan(/【.*?】/).each do |w|
+        editions.delete w
+      end
+    end
+    w = editions.to_a.join(' ')
     r = traverse(e)
-    "<r w='#{w}' l='#{@lb}' w='#{@char_count}'>#{r}</r>"
+    "<r w='#{w}' l='#{@lb}'>#{r}</r>"
   end
   def handle_lg(e)
@@ -485,7 +516,6 @@ class CBETA::P5aToHTMLForEveryEdition
   def handle_rdg(e)
     r = traverse(e)
     w = e['wit'].scan(/【.*?】/)
-    @editions.merge w
     "<r w='#{e['wit']}' l='#{@lb}' w='#{@char_count}'>#{r}</r>"
   end
@@ -503,21 +533,8 @@ class CBETA::P5aToHTMLForEveryEdition
   def handle_sutra(xml_fn)
     puts "convert sutra #{xml_fn}"
-    @editions = Set.new [@orig, "【CBETA】"] # 至少有底本及 CBETA 兩個版本
-    @back = { 0 => '' }
-    @back_orig = { 0 => '' }
-    @char_count = 1
-    @dila_note = 0
-    @div_count = 0
-    @in_l = false
-    @juan = 0
-    @lg_row_open = false
-    @mod_notes = Set.new
-    @next_line_buf = ''
-    @notes_mod = {}
-    @notes_orig = {}
-    @open_divs = []
-    @sutra_no = File.basename(xml_fn, ".xml")
+    before_parse_xml(xml_fn)
     text = parse_xml(xml_fn)
@@ -600,6 +617,7 @@ class CBETA::P5aToHTMLForEveryEdition
     @orig = @cbeta.get_canon_symbol(vol[0])
     abort "未處理底本" if @orig.nil?
+    @orig_short = @orig.sub(/^【(.*)】$/, '\1')
     @vol = vol
     @series = vol[0]
@@ -693,6 +711,8 @@ class CBETA::P5aToHTMLForEveryEdition
     root = doc.root()
     body = root.xpath("text/body")[0]
     @pass = [true]
+    @editions = get_editions(doc)
     text = traverse(body)
     text
@@ -725,7 +745,7 @@ class CBETA::P5aToHTMLForEveryEdition
     @editions.each do |ed|
       frag = Nokogiri::HTML.fragment("<div id='body'>#{html}</div>")
       frag.search("r").each do |node|
-        if node['w'] == ed
+        if node['w'].include? ed
           node.add_previous_sibling node.inner_html
         end
         node.remove
@@ -734,7 +754,11 @@ class CBETA::P5aToHTMLForEveryEdition
       back = html_back(juan_no, ed)
-      fn = ed.sub(/^【(.*)】$/, '\1') + '.htm'
+      fn = ed.sub(/^【(.*)】$/, '\1')
+      if fn != 'CBETA' and fn != @orig_short
+        fn = @orig_short + '→' + fn
+      end
+      fn += '.htm'
       output_path = File.join(folder, fn)
       text = <<eos
 <html>

metadata CHANGED Viewed

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: cbeta
 version: !ruby/object:Gem::Version
-  version: 1.3.6
+  version: 2.0.0
 platform: ruby
 authors:
 - Ray Chou
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2015-12-14 00:00:00.000000000 Z
+date: 2015-12-16 00:00:00.000000000 Z
 dependencies: []
 description: Ruby gem for use Chinese Buddhist Text resources made by CBETA (http://www.cbeta.org).
 email: zhoubx@gmail.com
@@ -23,7 +23,6 @@ files:
 - lib/cbeta/gaiji.rb
 - lib/cbeta/html_to_pdf.rb
 - lib/cbeta/html_to_text.rb
-- lib/cbeta/p5a_to_epub.rb
 - lib/cbeta/p5a_to_html.rb
 - lib/cbeta/p5a_to_html_for_every_edition.rb
 - lib/cbeta/p5a_to_html_for_pdf.rb

data/lib/cbeta/p5a_to_epub.rb DELETED Viewed

@@ -1,872 +0,0 @@
-require 'cgi'
-require 'date'
-require 'fileutils'
-require 'json'
-require 'nokogiri'
-require 'set'
-require 'gepub'
-require 'pp'
-# Convert CBETA XML P5a to EPUB
-#
-# CBETA XML P5a 可由此取得: https://github.com/cbeta-git/xml-p5a
-class CBETA::P5aToEPUB
-  # 內容不輸出的元素
-  PASS=['back', 'teiHeader']
-  # 某版用字缺的符號
-  MISSING = '－'
-  SCRIPT_FOLDER = File.dirname(__FILE__)
-  NAV_TEMPLATE = File.read(File.join(SCRIPT_FOLDER, '../data/epub-nav.xhtml'))
-  MAIN = 'main.xhtml'
-  DATA = File.join(SCRIPT_FOLDER, '../data')
-  private_constant :PASS, :MISSING, :SCRIPT_FOLDER, :NAV_TEMPLATE, :MAIN, :DATA
-  # @param temp_folder [String] 供 EPUB 暫存工作檔案的路徑
-  # @option opts [Integer] :epub_version (3) EPUB 版本
-  # @option opts [String] :graphic_base 圖檔路徑
-  #   * graphic_base/covers: 封面圖檔位置
-  #   * graphic_base/figures: 插圖圖檔位置
-  #   * graphic_base/sd-gif: 悉曇字圖檔位置
-  #   * graphic_base/rj-gif: 蘭札體圖檔位置
-  # @option opts [String] :front_page 內文前可以加一份 HTML 檔，例如「編輯說明」
-  # @option opts [String] :front_page_title 加在目錄的 front_page 標題
-  # @option opts [String] :back_page 內文後可以加一份 HTML 檔，例如「版權聲明」
-  # @option opts [String] :back_page_title 加在目錄的 back_page 標題
-  # @option opts [Boolean] :juan_toc 目次中是否要有卷目次，預設為 true
-  #
-  # @example
-  #   options = {
-  #     epub_version: 3,
-  #     front_page: '/path/to/front_page.xhtml',
-  #     front_page_title: '編輯說明',
-  #     back_page: '/path/to/back_page.xhtml',
-  #     back_page_title: '贊助資訊',
-  #     graphic_base: '/path/to/grphic/files/root'
-  #   }
-  #   c = CBETA::P5aToEPUB.new('/path/to/temp/working/folder', options)
-  #   c.convert_folder('/path/to/xml/roo', '/path/for/output/epubs')
-  def initialize(temp_folder, opts={})
-    @temp_folder = temp_folder
-    @settings = {
-      epub_version: 3,
-      juan_toc: true
-    }
-    @settings.merge!(opts)
-    @cbeta = CBETA.new
-    @gaijis = CBETA::Gaiji.new
-    # 載入 unicode 1.1 字集列表
-    fn = File.join(DATA, 'unicode-1.1.json')
-    json = File.read(fn)
-    @unicode1 = JSON.parse(json)
-  end
-  # 將某個 xml 轉為一個 EPUB
-  # @param input_path [String] 輸入 XML 檔路徑
-  # @param output_paath [String] 輸出 EPUB 檔路徑
-  def convert_file(input_path, output_path)
-    return false unless input_path.end_with? '.xml'
-    @book_id = File.basename(input_path, ".xml")
-    sutra_init
-    handle_file(input_path)
-    create_epub(output_path)
-  end
-  # 將某個資料夾下的每部作品都轉為一個對應的 EPUB。
-  # 跨冊的作品也會合成一個 EPUB。
-  #
-  # @example
-  #   require 'cbeta'
-  #
-  #   TEMP = '/temp/epub-work'
-  #   IMG = '/Users/ray/Documents/Projects/D道安/figures'
-  #
-  #   c = CBETA::P5aToEPUB.new(TEMP, IMG)
-  #   c.convert_folder('/Users/ray/Documents/Projects/D道安/xml-p5a/DA', '/temp/cbeta-epub/DA')
-  def convert_folder(input_folder, output_folder)
-    puts "convert folder: #{input_folder} to #{output_folder}"
-    @todo = {}
-    # 先檢視整個資料夾，哪些是要多檔合一
-    prepare_todo_list(input_folder, output_folder)
-    @todo.each_pair do |k, v|
-      convert_sutra(k, v[:xml_files], v[:epub])
-    end
-  end
-  # 將多個 xml 檔案合成一個 EPUB
-  #
-  # @example 大般若經 跨三冊 合成一個 EPUB
-  #   require 'cbeta'
-  #
-  #   TEMP = '/temp/epub-work'
-  #
-  #   xml_files = [
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/05/T05n0220a.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/06/T06n0220b.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220c.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220d.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220e.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220f.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220g.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220h.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220i.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220j.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220k.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220l.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220m.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220n.xml',
-  #     '/Users/ray/git-repos/cbeta-xml-p5a/T/07/T07n0220o.xml',
-  #   ]
-  #
-  #   c = CBETA::P5aToEPUB.new(TEMP)
-  #   c.convert_sutra('T0220', xml_files, '/temp/cbeta-epub/T0220.epub')
-  def convert_sutra(book_id, xml_files, out)
-    @book_id = book_id
-    sutra_init
-    xml_files.each { |f| handle_file(f) }
-    if xml_files.size > 1
-      @title.sub!(/^(.*)\(.*?\)$/, '\1')
-      @title.sub!(/^(.*?)(（.*?）)+$/, '\1')
-    end
-    create_epub(out)
-  end
-  private
-  def clear_temp_folder
-    FileUtils.remove_dir(@temp_folder, force=true)
-    FileUtils::mkdir_p @temp_folder
-  end
-  def copy_static_files(src, dest)
-    dest = File.join(@temp_folder, dest)
-    FileUtils.copy(src, dest)
-  end
-  def create_epub(output_path)
-    if @settings[:front_page]
-      copy_static_files(@settings[:front_page], 'front.xhtml')
-    end
-    if @settings[:back_page]
-      copy_static_files(@settings[:back_page], 'back.xhtml')
-    end
-    src = File.join(DATA, 'epub.css')
-    copy_static_files(src, 'cbeta.css')
-    create_html_by_juan
-    create_nav_html
-    title = @title
-    book_id = @book_id
-    creator = @author
-    builder = GEPUB::Builder.new {
-      language 'zh-TW'
-      unique_identifier "http://www.cbeta.org/#{book_id}", 'BookID', 'URL'
-      title title
-      creator creator
-      contributors 'DILA'
-      date Date.today.to_s
-    }
-    juan_dir = File.join(@temp_folder, 'juans')
-    settings = @settings
-    # in resources block, you can define resources by its relative path and datasource.
-    # item creator methods are: files, file.
-    builder.resources(:workdir => @temp_folder) {
-      glob 'img/*'
-      file 'cbeta.css'
-      # this is navigation document.
-      nav 'nav.xhtml'
-      # ordered item. will be added to spine.
-      ordered {
-        file 'front.xhtml' if settings[:front_page]
-        Dir.entries(juan_dir).sort.each do |f|
-          next if f.start_with? '.'
-          file "juans/#{f}"
-        end
-        file 'back.xhtml' if settings[:back_page]
-      }
-    }
-    builder.book.version = @settings[:epub_version]
-    canon = book_id.sub(/^([A-Z]{1,2}).*$/, '\1')
-    cover = File.join(settings[:graphic_base], 'covers', canon, "#{book_id}.jpg")
-    if File.exist? cover
-      File.open(cover) do |io|
-        builder.book.add_item(cover, io).cover_image
-      end
-    end
-    builder.generate_epub(output_path)
-    puts "output: #{output_path}\n\n"
-  end
-  def create_html_by_juan
-    juans = @main_text.split(/(<juan \d+>)/)
-    open = false
-    fo = nil
-    juan_no = nil
-    fn = ''
-    buf = ''
-    # 一卷一檔
-    juans.each do |j|
-      if j =~ /<juan (\d+)>$/
-        juan_no = $1.to_i
-        fn = "%03d.xhtml" % juan_no
-        output_path = File.join(@temp_folder, 'juans', fn)
-        fo = File.open(output_path, 'w')
-        open = true
-        s = <<eos
-<html xmlns="http://www.w3.org/1999/xhtml">
-<head>
-  <meta charset="utf-8" />
-  <title>#{@title}</title>
-  <link rel="stylesheet" type="text/css" href="../cbeta.css" />
-</head>
-<body>
-<div id='body'>
-eos
-        fo.write(s)
-        fo.write(buf)
-        buf = ''
-      elsif open
-        fo.write(j + "\n</div><!-- end of div[@id='body'] -->\n")
-        fo.write('</body></html>')
-        fo.close
-      else
-        buf = j
-      end
-    end
-  end
-  def create_nav_html
-    if @settings[:back_page_title]
-      s = @settings[:back_page_title]
-      @nav_root_ol.add_child("<li><a href='back.xhtml'>#{s}</a></li>")
-    end
-    #s = @nav_root_ol.to_xml(indent: 2, encoding: 'UTF-8', pertty: true, :save_with => Nokogiri::XML::Node::SaveOptions::AS_XML)
-    s = @nav_root_ol.to_xml
-    #s += "" % @toc_juan
-    fn = File.join(@temp_folder, 'nav.xhtml')
-    s = NAV_TEMPLATE % s
-    File.write(fn, s)
-  end
-  def handle_anchor(e)
-    if e.has_attribute?('type')
-      if e['type'] == 'circle'
-        return '◎'
-      end
-    end
-    ''
-  end
-  def handle_app(e)
-    traverse(e)
-  end
-  def handle_byline(e)
-    r = '<p class="byline">'
-    r += traverse(e)
-    r + '</p>'
-  end
-  def handle_cell(e)
-    doc = Nokogiri::XML::Document.new
-    cell = doc.create_element('td')
-    cell['rowspan'] = e['rows'] if e.key? 'rows'
-    cell['colspan'] = e['cols'] if e.key? 'cols'
-    cell.inner_html = traverse(e)
-    to_html(cell) + "\n"
-  end
-  def handle_corr(e)
-    "<span class='corr'>" + traverse(e) + "</span>"
-  end
-  def handle_div(e)
-    if e.has_attribute? 'type'
-      @open_divs << e
-      r = traverse(e)
-      @open_divs.pop
-      return "<div class='div-#{e['type']}'>#{r}</div>"
-    else
-      return traverse(e)
-    end
-  end
-  def handle_figure(e)
-    "<div class='figure'>%s</div>" % traverse(e)
-  end
-  def handle_g(e, mode)
-    # if 有 <mapping type="unicode">
-    #   if 不在 Unicode Extension C, D, E 範圍裡
-    #     直接採用
-    #   else
-    #     預設呈現 unicode, 但仍包缺字資訊，供點選開 popup
-    # else if 有 <mapping type="normal_unicode">
-    #   預設呈現 normal_unicode, 但仍包缺字資訊，供點選開 popup
-    # else if 有 normalized form
-    #   預設呈現 normalized form, 但仍包缺字資訊，供點選開 popup
-    # else
-    #   預設呈現組字式, 但仍包缺字資訊，供點選開 popup
-    gid = e['ref'][1..-1]
-    g = @gaijis[gid]
-    abort "Line:#{__LINE__} 無缺字資料:#{gid}" if g.nil?
-    zzs = g['zzs']
-    if gid.start_with?('SD')
-      case gid
-      when 'SD-E35A'
-        return '（'
-      when 'SD-E35B'
-        return '）'
-      else
-        return g['roman'] if g.key? 'roman'
-        if mode == 'txt'
-          puts "警告：純文字模式出現悉曇字：#{gid}"
-          return gid
-        else
-          # 如果沒有羅馬轉寫就顯示圖檔
-          src = File.join(@settings[:graphic_base], 'sd-gif', gid[3..4], gid+'.gif')
-          basename = File.basename(src)
-          dest = File.join(@temp_folder, 'img', basename)
-          FileUtils.copy(src, dest)
-          return "<img src='../img/#{basename}' />"
-        end
-      end
-    end
-    if gid.start_with?('RJ')
-      return g['roman'] if g.key? 'roman'
-      if mode == 'txt'
-        puts "警告：純文字模式出現蘭札體：#{gid}"
-        return gid
-      else
-        # 如果沒有羅馬轉寫就顯示圖檔
-        src = File.join(@settings[:graphic_base], 'rj-gif', gid[3..4], gid+'.gif')
-        basename = File.basename(src)
-        dest = File.join(@temp_folder, 'img', basename)
-        FileUtils.copy(src, dest)
-        return "<img src='../img/#{basename}' />"
-      end
-    end
-    if mode == 'txt'
-      abort "缺組字式：#{g}" if zzs.nil?
-      return zzs
-    end
-    default = ''
-    if g.has_key?('unicode')
-      if @unicode1.include?(g['unicode'])
-        return g['unicode-char'] # unicode 1.1 直接用
-      end
-    end
-    zzs
-  end
-  def handle_graphic(e)
-    url = e['url']
-    url.sub!(/^.*(figures\/.*)$/, '\1')
-    src = File.join(@settings[:graphic_base], url)
-    basename = File.basename(src)
-    dest = File.join(@temp_folder, 'img', basename)
-    FileUtils.copy(src, dest)
-    "<img src='../img/#{basename}' />"
-  end
-  def handle_head(e)
-    r = ''
-    unless e['type'] == 'added'
-      i = @open_divs.size
-      r = "<p class='h#{i}'>%s</p>" % traverse(e)
-    end
-    r
-  end
-  def handle_item(e)
-    "<li>%s</li>\n" % traverse(e)
-  end
-  def handle_juan(e)
-    "<p class='juan'>%s</p>" % traverse(e)
-  end
-  def handle_l(e)
-    if @lg_type == 'abnormal'
-      return traverse(e)
-    end
-    @in_l = true
-    doc = Nokogiri::XML::Document.new
-    cell = doc.create_element('div')
-    cell['class'] = 'lg-cell'
-    cell.inner_html = traverse(e)
-    if @first_l
-      parent = e.parent()
-      if parent.has_attribute?('rend')
-        indent = parent['rend'].scan(/text-indent:[^:]*/)
-        unless indent.empty?
-          cell['style'] = indent[0]
-        end
-      end
-      @first_l = false
-    end
-    r = to_html(cell)
-    unless @lg_row_open
-      r = "\n<div class='lg-row'>" + r
-      @lg_row_open = true
-    end
-    @in_l = false
-    r
-  end
-  def handle_lb(e)
-    # 卍續藏有 X 跟 R 兩種 lb, 只處理 X
-    return '' if e['ed'] != @series
-    @lb = e['n']
-    r = ''
-    #if e.parent.name == 'lg' and $lg_row_open
-    if @lg_row_open && !@in_l
-      # 每行偈頌放在一個 lg-row 裡面
-      # T46n1937, p. 914a01, l 包雙行夾註跨行
-      # T20n1092, 337c16, lb 在 l 中間，不結束 lg-row
-      r += "</div><!-- end of lg-row -->"
-      @lg_row_open = false
-    end
-    unless @next_line_buf.empty?
-      r += @next_line_buf
-      @next_line_buf = ''
-    end
-    r
-  end
-  def handle_lem(e)
-    r = ''
-    w = e['wit']
-    if w.include? 'CBETA' and not w.include? @orig
-      r = "<span class='corr'>%s</span>" % traverse(e)
-    else
-      r = traverse(e)
-    end
-    r
-  end
-  def handle_lg(e)
-    r = ''
-    @lg_type = e['type']
-    if @lg_type == 'abnormal'
-      r = "<p class='lg-abnormal'>" + traverse(e) + "</p>"
-    else
-      @first_l = true
-      doc = Nokogiri::XML::Document.new
-      node = doc.create_element('div')
-      node['class'] = 'lg'
-      if e.has_attribute?('rend')
-        rend = e['rend'].gsub(/text-indent:[^:]*/, '')
-        node['style'] = rend
-      end
-      @lg_row_open = false
-      node.inner_html = traverse(e)
-      if @lg_row_open
-        node.inner_html += '</div><!-- end of lg -->'
-        @lg_row_open = false
-      end
-      r = "\n" + to_html(node)
-    end
-    r
-  end
-  def handle_list(e)
-    doc = Nokogiri::XML::Document.new
-    node = doc.create_element('ul')
-    node.inner_html = traverse(e)
-    if e.key? 'rendition'
-      node['class'] = e['rendition']
-    end
-    to_html(node)
-  end
-  def handle_milestone(e)
-    r = ''
-    if e['unit'] == 'juan'
-      r += "</div>" * @open_divs.size  # 如果有 div 跨卷，要先結束, ex: T55n2154, p. 680a29, 跨 19, 20 兩卷
-      @juan += 1
-      r += "<juan #{@juan}>"
-      @open_divs.each { |d|
-        r += "<div class='#{d['type']}'>"
-      }
-    end
-    r
-  end
-  def handle_mulu(e)
-    @mulu_count += 1
-    fn = "juans/%03d.xhtml" % @juan
-    if e['type'] == '卷'
-      if @settings[:juan_toc]
-        label = e['n']
-        @juan_nav.add_child("<li><a href='#{fn}#mulu#{@mulu_count}'>#{label}</a></li>")
-      end
-    else
-      level = e['level'].to_i
-      while @current_nav.size > (level+1)
-        @current_nav.pop
-      end
-      label = traverse(e, 'txt')
-      li = @current_nav.last.add_child("<li><a href='#{fn}#mulu#{@mulu_count}'>#{label}</a></li>").first
-      ol = li.add_child('<ol></ol>').first
-      @current_nav << ol
-    end
-    "<a id='mulu#{@mulu_count}' />"
-  end
-  def handle_node(e, mode)
-    return '' if e.comment?
-    return handle_text(e, mode) if e.text?
-    return '' if PASS.include?(e.name)
-    r = case e.name
-    when 'anchor'    then handle_anchor(e)
-    when 'app'       then handle_app(e)
-    when 'byline'    then handle_byline(e)
-    when 'cell'      then handle_cell(e)
-    when 'corr'      then handle_corr(e)
-    when 'div'       then handle_div(e)
-    when 'figure'    then handle_figure(e)
-    when 'foreign'   then ''
-    when 'g'         then handle_g(e, mode)
-    when 'graphic'   then handle_graphic(e)
-    when 'head'      then handle_head(e)
-    when 'item'      then handle_item(e)
-    when 'juan'      then handle_juan(e)
-    when 'l'         then handle_l(e)
-    when 'lb'        then handle_lb(e)
-    when 'lem'       then handle_lem(e)
-    when 'lg'        then handle_lg(e)
-    when 'list'      then handle_list(e)
-    when 'mulu'      then handle_mulu(e)
-    when 'note'      then handle_note(e)
-    when 'milestone' then handle_milestone(e)
-    when 'p'         then handle_p(e)
-    when 'rdg'       then ''
-    when 'reg'       then ''
-    when 'row'       then handle_row(e)
-    when 'sic'       then ''
-    when 'sg'        then handle_sg(e)
-    when 't'         then handle_t(e)
-    when 'tt'        then handle_tt(e)
-    when 'table'     then handle_table(e)
-    else traverse(e)
-    end
-    r
-  end
-  def handle_note(e)
-    n = e['n']
-    if e.has_attribute?('type')
-      t = e['type']
-      case t
-      when 'equivalent'
-        return ''
-      when 'orig'
-        return ''
-      when 'orig_biao'
-        return ''
-      when 'orig_ke'
-        return ''
-      when 'mod'
-        return ""
-      when 'rest'
-        return ''
-      else
-        return '' if t.start_with?('cf')
-      end
-    end
-    if e.has_attribute?('resp')
-      return '' if e['resp'].start_with? 'CBETA'
-    end
-    if e.has_attribute?('place') && e['place']=='inline'
-      r = traverse(e)
-      return "(#{r})"
-    else
-      return traverse(e)
-    end
-  end
-  def handle_p(e)
-    r = "<div class='p'>\n"
-    r += traverse(e)
-    r + "</div>\n"
-  end
-  def handle_row(e)
-    "<tr>" + traverse(e) + "</tr>\n"
-  end
-  def handle_sg(e)
-    '(' + traverse(e) + ')'
-  end
-  def handle_file(xml_fn)
-    puts "read #{xml_fn}"
-    @in_l = false
-    @lg_row_open = false
-    @mod_notes = Set.new
-    @next_line_buf = ''
-    @open_divs = []
-    if @book_id.start_with? 'DA'
-      @orig = nil?
-    else
-      @orig = @cbeta.get_canon_abbr(@book_id[0])
-      abort "未處理底本: #{@book_id[0]}" if @orig.nil?
-    end
-    text = parse_xml(xml_fn)
-    # 註標移到 lg-cell 裡面，不然以 table 呈現 lg 會有問題
-    text.gsub!(/(<a class='noteAnchor'[^>]*><\/a>)(<div class="lg-cell"[^>]*>)/, '\2\1')
-    @main_text += text
-  end
-  def handle_t(e)
-    if e.has_attribute? 'place'
-      return '' if e['place'].include? 'foot'
-    end
-    r = traverse(e)
-    # <tt type="app"> 不是 悉漢雙行對照
-    return r if @tt_type == 'app'
-    # 處理雙行對照
-    i = e.xpath('../t').index(e)
-    case i
-    when 0
-      return r + '　'
-    when 1
-      @next_line_buf += r + '　'
-      return ''
-    else
-      return r
-    end
-  end
-  def handle_tt(e)
-    @tt_type = e['type']
-    traverse(e)
-  end
-  def handle_table(e)
-    "<table>" + traverse(e) + "</table>"
-  end
-  def handle_text(e, mode)
-    s = e.content().chomp
-    return '' if s.empty?
-    return '' if e.parent.name == 'app'
-    # cbeta xml 文字之間會有多餘的換行
-    r = s.gsub(/[\n\r]/, '')
-    # 把 & 轉為 &amp;
-    CGI.escapeHTML(r)
-  end
-  def lem_note_cf(e)
-    # ex: T32n1670A.xml, p. 703a16
-    # <note type="cf1">K30n1002_p0257a01-a23</note>
-    refs = []
-    e.xpath('./note').each { |n|
-      if n.key?('type') and n['type'].start_with? 'cf'
-        refs << n.content
-      end
-    }
-    if refs.empty?
-      ''
-    else
-      '修訂依據：' + refs.join('；') + '。'
-    end
-  end
-  def lem_note_rdg(lem)
-    r = ''
-    app = lem.parent
-    @pass << false
-    app.xpath('rdg').each { |rdg|
-      if rdg['wit'].include? @orig
-        s = traverse(rdg, 'back')
-        s = MISSING if s.empty?
-        r += @orig + s
-      end
-    }
-    @pass.pop
-    r += '。' unless r.empty?
-    r
-  end
-  def sutra_init
-    clear_temp_folder
-    s = NAV_TEMPLATE % '<ol></ol>'
-    @nav_doc = Nokogiri::XML(s)
-    @nav_doc.remove_namespaces!()
-    @nav_root_ol = @nav_doc.at_xpath('//ol')
-    @current_nav = [@nav_root_ol]
-    if @settings[:front_page_title]
-      @nav_root_ol.add_child("<li><a href='front.xhtml'>編輯說明</a></li>")
-    end
-    li = @nav_root_ol.add_child("<li><a href='#'>章節目次</a></li>").first
-    ol = li.add_child('<ol></ol>').first
-    @current_nav << ol
-    if @settings[:juan_toc]
-      li = @nav_root_ol.add_child("<li><a href='#'>卷目次</a></li>").first
-      @juan_nav = li.add_child('<ol></ol>').first
-    end
-    @mulu_count = 0
-    @main_text = ''
-    @dila_note = 0
-    @toc_juan = '' # 卷目次
-    @juan = 0
-    FileUtils::mkdir_p File.join(@temp_folder, 'img')
-    FileUtils::mkdir_p File.join(@temp_folder, 'juans')
-  end
-  def open_xml(fn)
-    s = File.read(fn)
-    if fn.include? 'T16n0657'
-      # 這個地方 雙行夾註 跨兩行偈頌
-      # 把 lb 移到 note 結束之前
-      # 讓 lg-row 先結束，再結束雙行夾註
-      s.sub!(/(<\/note>)(\n<lb n="0206b29" ed="T"\/>)/, '\2\1')
-    end
-    # <milestone unit="juan"> 前面的 lb 屬於新的這一卷
-    s.gsub!(%r{((?:<pb [^>]+>\n?)?(?:<lb [^>]+>\n?)+)(<milestone [^>]*unit="juan"[^/>]*/>)}, '\2\1')
-    doc = Nokogiri::XML(s)
-    doc.remove_namespaces!()
-    doc
-  end
-  def read_mod_notes(doc)
-    doc.xpath("//note[@type='mod']").each { |e|
-      @mod_notes << e['n']
-    }
-  end
-  def parse_xml(xml_fn)
-    @pass = [false]
-    doc = open_xml(xml_fn)
-    e = doc.xpath("//titleStmt/title")[0]
-    @title = traverse(e, 'txt')
-    @title = @title.split()[-1]
-    @author = doc.at_xpath("//titleStmt/author").text
-    read_mod_notes(doc)
-    root = doc.root()
-    body = root.xpath("text/body")[0]
-    @pass = [true]
-    text = traverse(body)
-    text
-  end
-  def prepare_todo_list(input_folder, output_folder)
-    Dir.foreach(input_folder) do |f|
-      next if f.start_with? '.'
-      p1 = File.join(input_folder, f)
-      if File.file?(p1)
-        work = f.sub(/^([A-Z]{1,2})\d{2,3}n(.*)\.xml$/, '\1\2')
-        work = 'T0220' if work.start_with? 'T0220'
-        unless @todo.key? work
-          @todo[work] = { xml_files: [] }
-        end
-        hash = @todo[work]
-        hash[:xml_files] << p1
-        folders = output_folder.split('/')
-        folders.pop if folders[-1].match(/^[A-Z]{1,2}\d{2,3}$/)
-        folder = folders.join('/')
-        FileUtils::mkdir_p folder
-        hash[:epub] = File.join(folder, "#{work}.epub")
-      else
-        p2 = File.join(output_folder, f)
-        prepare_todo_list(p1, p2)
-      end
-    end
-  end
-  def remove_empty_nav(node_list)
-    node_list.each do |n|
-      if n[:nav].empty?
-        n.delete(:nav)
-      else
-        remove_empty_nav(n[:nav])
-      end
-    end
-  end
-  def to_html(e)
-    e.to_xml(encoding: 'UTF-8', pertty: true, :save_with => Nokogiri::XML::Node::SaveOptions::AS_XML)
-  end
-  def traverse(e, mode='html')
-    r = ''
-    e.children.each { |c|
-      s = handle_node(c, mode)
-      r += s
-    }
-    r
-  end
-end