pdf2json 0.1.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (473) hide show
  1. data/README.markdown +9 -0
  2. data/bin/.gitkeep +0 -0
  3. data/ext/extconf.rb +30 -0
  4. data/lib/pdf2json.rb +8 -0
  5. data/pdf2json-0.52-source/AUTHORS +24 -0
  6. data/pdf2json-0.52-source/CHANGES +11 -0
  7. data/pdf2json-0.52-source/Makefile +84 -0
  8. data/pdf2json-0.52-source/Makefile.in +84 -0
  9. data/pdf2json-0.52-source/aclocal.m4 +274 -0
  10. data/pdf2json-0.52-source/aconf-win32.h +86 -0
  11. data/pdf2json-0.52-source/aconf.h +42 -0
  12. data/pdf2json-0.52-source/aconf.h.in +41 -0
  13. data/pdf2json-0.52-source/autom4te.cache/output.0 +6908 -0
  14. data/pdf2json-0.52-source/autom4te.cache/requests +76 -0
  15. data/pdf2json-0.52-source/autom4te.cache/traces.0 +466 -0
  16. data/pdf2json-0.52-source/config.log +1259 -0
  17. data/pdf2json-0.52-source/config.status +1050 -0
  18. data/pdf2json-0.52-source/configure +6908 -0
  19. data/pdf2json-0.52-source/configure.ac +93 -0
  20. data/pdf2json-0.52-source/doc/pdffonts.1 +130 -0
  21. data/pdf2json-0.52-source/doc/pdffonts.cat +107 -0
  22. data/pdf2json-0.52-source/doc/pdffonts.hlp +117 -0
  23. data/pdf2json-0.52-source/doc/pdfimages.1 +102 -0
  24. data/pdf2json-0.52-source/doc/pdfimages.cat +92 -0
  25. data/pdf2json-0.52-source/doc/pdfimages.hlp +101 -0
  26. data/pdf2json-0.52-source/doc/pdfinfo.1 +158 -0
  27. data/pdf2json-0.52-source/doc/pdfinfo.cat +119 -0
  28. data/pdf2json-0.52-source/doc/pdfinfo.hlp +129 -0
  29. data/pdf2json-0.52-source/doc/pdftoppm.1 +115 -0
  30. data/pdf2json-0.52-source/doc/pdftoppm.cat +105 -0
  31. data/pdf2json-0.52-source/doc/pdftoppm.hlp +114 -0
  32. data/pdf2json-0.52-source/doc/pdftops.1 +229 -0
  33. data/pdf2json-0.52-source/doc/pdftops.cat +221 -0
  34. data/pdf2json-0.52-source/doc/pdftops.hlp +231 -0
  35. data/pdf2json-0.52-source/doc/pdftotext.1 +137 -0
  36. data/pdf2json-0.52-source/doc/pdftotext.cat +120 -0
  37. data/pdf2json-0.52-source/doc/pdftotext.hlp +133 -0
  38. data/pdf2json-0.52-source/doc/sample-xpdfrc +91 -0
  39. data/pdf2json-0.52-source/doc/xpdf.1 +513 -0
  40. data/pdf2json-0.52-source/doc/xpdf.cat +476 -0
  41. data/pdf2json-0.52-source/doc/xpdf.hlp +489 -0
  42. data/pdf2json-0.52-source/doc/xpdfrc.5 +480 -0
  43. data/pdf2json-0.52-source/doc/xpdfrc.cat +474 -0
  44. data/pdf2json-0.52-source/doc/xpdfrc.hlp +479 -0
  45. data/pdf2json-0.52-source/fofi/.DS_Store +0 -0
  46. data/pdf2json-0.52-source/fofi/FoFiBase.cc +156 -0
  47. data/pdf2json-0.52-source/fofi/FoFiBase.h +57 -0
  48. data/pdf2json-0.52-source/fofi/FoFiBase.o +0 -0
  49. data/pdf2json-0.52-source/fofi/FoFiEncodings.cc +994 -0
  50. data/pdf2json-0.52-source/fofi/FoFiEncodings.h +36 -0
  51. data/pdf2json-0.52-source/fofi/FoFiEncodings.o +0 -0
  52. data/pdf2json-0.52-source/fofi/FoFiTrueType.cc +2027 -0
  53. data/pdf2json-0.52-source/fofi/FoFiTrueType.h +174 -0
  54. data/pdf2json-0.52-source/fofi/FoFiTrueType.o +0 -0
  55. data/pdf2json-0.52-source/fofi/FoFiType1.cc +252 -0
  56. data/pdf2json-0.52-source/fofi/FoFiType1.h +59 -0
  57. data/pdf2json-0.52-source/fofi/FoFiType1.o +0 -0
  58. data/pdf2json-0.52-source/fofi/FoFiType1C.cc +2603 -0
  59. data/pdf2json-0.52-source/fofi/FoFiType1C.h +233 -0
  60. data/pdf2json-0.52-source/fofi/FoFiType1C.o +0 -0
  61. data/pdf2json-0.52-source/fofi/Makefile +70 -0
  62. data/pdf2json-0.52-source/fofi/Makefile.dep +0 -0
  63. data/pdf2json-0.52-source/fofi/Makefile.in +70 -0
  64. data/pdf2json-0.52-source/fofi/libfofi.a +0 -0
  65. data/pdf2json-0.52-source/fofi/vms_make.com +0 -0
  66. data/pdf2json-0.52-source/freetype.win32/.DS_Store +0 -0
  67. data/pdf2json-0.52-source/freetype.win32/include/.DS_Store +0 -0
  68. data/pdf2json-0.52-source/freetype.win32/include/freetype/config/ftconfig.h +528 -0
  69. data/pdf2json-0.52-source/freetype.win32/include/freetype/config/ftheader.h +780 -0
  70. data/pdf2json-0.52-source/freetype.win32/include/freetype/config/ftmodule.h +32 -0
  71. data/pdf2json-0.52-source/freetype.win32/include/freetype/config/ftoption.h +733 -0
  72. data/pdf2json-0.52-source/freetype.win32/include/freetype/config/ftstdlib.h +173 -0
  73. data/pdf2json-0.52-source/freetype.win32/include/freetype/freetype.h +3919 -0
  74. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftadvanc.h +179 -0
  75. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftbbox.h +94 -0
  76. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftbdf.h +209 -0
  77. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftbitmap.h +227 -0
  78. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftcache.h +1128 -0
  79. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftchapters.h +103 -0
  80. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftcid.h +166 -0
  81. data/pdf2json-0.52-source/freetype.win32/include/freetype/fterrdef.h +244 -0
  82. data/pdf2json-0.52-source/freetype.win32/include/freetype/fterrors.h +206 -0
  83. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftgasp.h +120 -0
  84. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftglyph.h +613 -0
  85. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftgxval.h +358 -0
  86. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftgzip.h +102 -0
  87. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftimage.h +1313 -0
  88. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftincrem.h +353 -0
  89. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftlcdfil.h +213 -0
  90. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftlist.h +277 -0
  91. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftlzw.h +99 -0
  92. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftmac.h +274 -0
  93. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftmm.h +378 -0
  94. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftmodapi.h +483 -0
  95. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftmoderr.h +155 -0
  96. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftotval.h +203 -0
  97. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftoutln.h +537 -0
  98. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftpfr.h +172 -0
  99. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftrender.h +230 -0
  100. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftsizes.h +159 -0
  101. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftsnames.h +200 -0
  102. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftstroke.h +716 -0
  103. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftsynth.h +80 -0
  104. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftsystem.h +347 -0
  105. data/pdf2json-0.52-source/freetype.win32/include/freetype/fttrigon.h +350 -0
  106. data/pdf2json-0.52-source/freetype.win32/include/freetype/fttypes.h +588 -0
  107. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftwinfnt.h +274 -0
  108. data/pdf2json-0.52-source/freetype.win32/include/freetype/ftxf86.h +83 -0
  109. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/autohint.h +231 -0
  110. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftcalc.h +179 -0
  111. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftdebug.h +250 -0
  112. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftdriver.h +422 -0
  113. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftgloadr.h +168 -0
  114. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftmemory.h +380 -0
  115. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftobjs.h +1428 -0
  116. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftpic.h +67 -0
  117. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftrfork.h +196 -0
  118. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftserv.h +620 -0
  119. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftstream.h +539 -0
  120. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/fttrace.h +139 -0
  121. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftvalid.h +150 -0
  122. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/internal.h +51 -0
  123. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/pcftypes.h +56 -0
  124. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/psaux.h +873 -0
  125. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/pshints.h +712 -0
  126. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svbdf.h +77 -0
  127. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svcid.h +83 -0
  128. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svgldict.h +82 -0
  129. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svgxval.h +72 -0
  130. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svkern.h +51 -0
  131. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svmm.h +104 -0
  132. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svotval.h +55 -0
  133. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svpfr.h +66 -0
  134. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svpostnm.h +79 -0
  135. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svpscmap.h +164 -0
  136. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svpsinfo.h +92 -0
  137. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svsfnt.h +102 -0
  138. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svttcmap.h +106 -0
  139. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svtteng.h +53 -0
  140. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svttglyf.h +67 -0
  141. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svwinfnt.h +50 -0
  142. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svxf86nm.h +55 -0
  143. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/sfnt.h +897 -0
  144. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/t1types.h +270 -0
  145. data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/tttypes.h +1543 -0
  146. data/pdf2json-0.52-source/freetype.win32/include/freetype/t1tables.h +504 -0
  147. data/pdf2json-0.52-source/freetype.win32/include/freetype/ttnameid.h +1247 -0
  148. data/pdf2json-0.52-source/freetype.win32/include/freetype/tttables.h +759 -0
  149. data/pdf2json-0.52-source/freetype.win32/include/freetype/tttags.h +107 -0
  150. data/pdf2json-0.52-source/freetype.win32/include/freetype/ttunpat.h +59 -0
  151. data/pdf2json-0.52-source/freetype.win32/include/ft2build.h +39 -0
  152. data/pdf2json-0.52-source/freetype.win32/lib/freetype_a.lib +0 -0
  153. data/pdf2json-0.52-source/goo/.DS_Store +0 -0
  154. data/pdf2json-0.52-source/goo/FixedPoint.cc +118 -0
  155. data/pdf2json-0.52-source/goo/FixedPoint.h +155 -0
  156. data/pdf2json-0.52-source/goo/FixedPoint.o +0 -0
  157. data/pdf2json-0.52-source/goo/GHash.cc +380 -0
  158. data/pdf2json-0.52-source/goo/GHash.h +78 -0
  159. data/pdf2json-0.52-source/goo/GHash.o +0 -0
  160. data/pdf2json-0.52-source/goo/GList.cc +97 -0
  161. data/pdf2json-0.52-source/goo/GList.h +96 -0
  162. data/pdf2json-0.52-source/goo/GList.o +0 -0
  163. data/pdf2json-0.52-source/goo/GMutex.h +49 -0
  164. data/pdf2json-0.52-source/goo/GString.cc +724 -0
  165. data/pdf2json-0.52-source/goo/GString.cc.fixed +718 -0
  166. data/pdf2json-0.52-source/goo/GString.h +136 -0
  167. data/pdf2json-0.52-source/goo/GString.o +0 -0
  168. data/pdf2json-0.52-source/goo/ImgWriter.o +0 -0
  169. data/pdf2json-0.52-source/goo/JpegWriter.o +0 -0
  170. data/pdf2json-0.52-source/goo/Makefile +72 -0
  171. data/pdf2json-0.52-source/goo/Makefile.dep +0 -0
  172. data/pdf2json-0.52-source/goo/Makefile.in +72 -0
  173. data/pdf2json-0.52-source/goo/PNGWriter.o +0 -0
  174. data/pdf2json-0.52-source/goo/gfile.cc +731 -0
  175. data/pdf2json-0.52-source/goo/gfile.h +138 -0
  176. data/pdf2json-0.52-source/goo/gfile.o +0 -0
  177. data/pdf2json-0.52-source/goo/gmem.cc +264 -0
  178. data/pdf2json-0.52-source/goo/gmem.h +79 -0
  179. data/pdf2json-0.52-source/goo/gmem.o +0 -0
  180. data/pdf2json-0.52-source/goo/gmempp.cc +32 -0
  181. data/pdf2json-0.52-source/goo/gmempp.o +0 -0
  182. data/pdf2json-0.52-source/goo/gtypes.h +29 -0
  183. data/pdf2json-0.52-source/goo/libGoo.a +0 -0
  184. data/pdf2json-0.52-source/goo/parseargs.c +190 -0
  185. data/pdf2json-0.52-source/goo/parseargs.h +71 -0
  186. data/pdf2json-0.52-source/goo/parseargs.o +0 -0
  187. data/pdf2json-0.52-source/goo/vms_directory.c +214 -0
  188. data/pdf2json-0.52-source/goo/vms_dirent.h +67 -0
  189. data/pdf2json-0.52-source/goo/vms_make.com +82 -0
  190. data/pdf2json-0.52-source/goo/vms_sys_dirent.h +54 -0
  191. data/pdf2json-0.52-source/goo/vms_unix_time.h +102 -0
  192. data/pdf2json-0.52-source/goo/vms_unix_times.c +42 -0
  193. data/pdf2json-0.52-source/goo/vms_unlink.c +22 -0
  194. data/pdf2json-0.52-source/ms_make.bat +199 -0
  195. data/pdf2json-0.52-source/splash/.DS_Store +0 -0
  196. data/pdf2json-0.52-source/splash/Makefile +103 -0
  197. data/pdf2json-0.52-source/splash/Makefile.dep +0 -0
  198. data/pdf2json-0.52-source/splash/Makefile.in +103 -0
  199. data/pdf2json-0.52-source/splash/Splash.cc +3310 -0
  200. data/pdf2json-0.52-source/splash/Splash.h +293 -0
  201. data/pdf2json-0.52-source/splash/Splash.o +0 -0
  202. data/pdf2json-0.52-source/splash/SplashBitmap.cc +188 -0
  203. data/pdf2json-0.52-source/splash/SplashBitmap.h +64 -0
  204. data/pdf2json-0.52-source/splash/SplashBitmap.o +0 -0
  205. data/pdf2json-0.52-source/splash/SplashClip.cc +382 -0
  206. data/pdf2json-0.52-source/splash/SplashClip.h +107 -0
  207. data/pdf2json-0.52-source/splash/SplashClip.o +0 -0
  208. data/pdf2json-0.52-source/splash/SplashErrorCodes.h +32 -0
  209. data/pdf2json-0.52-source/splash/SplashFTFont.cc +357 -0
  210. data/pdf2json-0.52-source/splash/SplashFTFont.h +58 -0
  211. data/pdf2json-0.52-source/splash/SplashFTFont.o +0 -0
  212. data/pdf2json-0.52-source/splash/SplashFTFontEngine.cc +179 -0
  213. data/pdf2json-0.52-source/splash/SplashFTFontEngine.h +65 -0
  214. data/pdf2json-0.52-source/splash/SplashFTFontEngine.o +0 -0
  215. data/pdf2json-0.52-source/splash/SplashFTFontFile.cc +114 -0
  216. data/pdf2json-0.52-source/splash/SplashFTFontFile.h +73 -0
  217. data/pdf2json-0.52-source/splash/SplashFTFontFile.o +0 -0
  218. data/pdf2json-0.52-source/splash/SplashFont.cc +176 -0
  219. data/pdf2json-0.52-source/splash/SplashFont.h +104 -0
  220. data/pdf2json-0.52-source/splash/SplashFont.o +0 -0
  221. data/pdf2json-0.52-source/splash/SplashFontEngine.cc +317 -0
  222. data/pdf2json-0.52-source/splash/SplashFontEngine.h +91 -0
  223. data/pdf2json-0.52-source/splash/SplashFontEngine.o +0 -0
  224. data/pdf2json-0.52-source/splash/SplashFontFile.cc +55 -0
  225. data/pdf2json-0.52-source/splash/SplashFontFile.h +60 -0
  226. data/pdf2json-0.52-source/splash/SplashFontFile.o +0 -0
  227. data/pdf2json-0.52-source/splash/SplashFontFileID.cc +23 -0
  228. data/pdf2json-0.52-source/splash/SplashFontFileID.h +30 -0
  229. data/pdf2json-0.52-source/splash/SplashFontFileID.o +0 -0
  230. data/pdf2json-0.52-source/splash/SplashGlyphBitmap.h +26 -0
  231. data/pdf2json-0.52-source/splash/SplashMath.h +89 -0
  232. data/pdf2json-0.52-source/splash/SplashPath.cc +184 -0
  233. data/pdf2json-0.52-source/splash/SplashPath.h +121 -0
  234. data/pdf2json-0.52-source/splash/SplashPath.o +0 -0
  235. data/pdf2json-0.52-source/splash/SplashPattern.cc +40 -0
  236. data/pdf2json-0.52-source/splash/SplashPattern.h +65 -0
  237. data/pdf2json-0.52-source/splash/SplashPattern.o +0 -0
  238. data/pdf2json-0.52-source/splash/SplashScreen.cc +383 -0
  239. data/pdf2json-0.52-source/splash/SplashScreen.h +56 -0
  240. data/pdf2json-0.52-source/splash/SplashScreen.o +0 -0
  241. data/pdf2json-0.52-source/splash/SplashState.cc +165 -0
  242. data/pdf2json-0.52-source/splash/SplashState.h +103 -0
  243. data/pdf2json-0.52-source/splash/SplashState.o +0 -0
  244. data/pdf2json-0.52-source/splash/SplashT1Font.cc +287 -0
  245. data/pdf2json-0.52-source/splash/SplashT1Font.h +57 -0
  246. data/pdf2json-0.52-source/splash/SplashT1Font.o +0 -0
  247. data/pdf2json-0.52-source/splash/SplashT1FontEngine.cc +124 -0
  248. data/pdf2json-0.52-source/splash/SplashT1FontEngine.h +53 -0
  249. data/pdf2json-0.52-source/splash/SplashT1FontEngine.o +0 -0
  250. data/pdf2json-0.52-source/splash/SplashT1FontFile.cc +97 -0
  251. data/pdf2json-0.52-source/splash/SplashT1FontFile.h +58 -0
  252. data/pdf2json-0.52-source/splash/SplashT1FontFile.o +0 -0
  253. data/pdf2json-0.52-source/splash/SplashTypes.h +132 -0
  254. data/pdf2json-0.52-source/splash/SplashXPath.cc +438 -0
  255. data/pdf2json-0.52-source/splash/SplashXPath.h +100 -0
  256. data/pdf2json-0.52-source/splash/SplashXPath.o +0 -0
  257. data/pdf2json-0.52-source/splash/SplashXPathScanner.cc +428 -0
  258. data/pdf2json-0.52-source/splash/SplashXPathScanner.h +87 -0
  259. data/pdf2json-0.52-source/splash/SplashXPathScanner.o +0 -0
  260. data/pdf2json-0.52-source/splash/libsplash.a +0 -0
  261. data/pdf2json-0.52-source/splash/vms_make.com +0 -0
  262. data/pdf2json-0.52-source/src/.DS_Store +0 -0
  263. data/pdf2json-0.52-source/src/GVector.h +101 -0
  264. data/pdf2json-0.52-source/src/ImgOutputDev.cc +1243 -0
  265. data/pdf2json-0.52-source/src/ImgOutputDev.h +307 -0
  266. data/pdf2json-0.52-source/src/ImgOutputDev.o +0 -0
  267. data/pdf2json-0.52-source/src/Makefile +68 -0
  268. data/pdf2json-0.52-source/src/Makefile.in +68 -0
  269. data/pdf2json-0.52-source/src/XmlFonts.cc +367 -0
  270. data/pdf2json-0.52-source/src/XmlFonts.h +91 -0
  271. data/pdf2json-0.52-source/src/XmlFonts.o +0 -0
  272. data/pdf2json-0.52-source/src/XmlLinks.cc +101 -0
  273. data/pdf2json-0.52-source/src/XmlLinks.h +54 -0
  274. data/pdf2json-0.52-source/src/XmlLinks.o +0 -0
  275. data/pdf2json-0.52-source/src/pdf2json +0 -0
  276. data/pdf2json-0.52-source/src/pdf2json.cc +343 -0
  277. data/pdf2json-0.52-source/src/pdf2json.o +0 -0
  278. data/pdf2json-0.52-source/src/pdf2xml.dtd +22 -0
  279. data/pdf2json-0.52-source/src/pdf2xmljson.dtd +9 -0
  280. data/pdf2json-0.52-source/xpdf/.DS_Store +0 -0
  281. data/pdf2json-0.52-source/xpdf/Annot.cc +1556 -0
  282. data/pdf2json-0.52-source/xpdf/Annot.h +142 -0
  283. data/pdf2json-0.52-source/xpdf/Annot.o +0 -0
  284. data/pdf2json-0.52-source/xpdf/Array.cc +73 -0
  285. data/pdf2json-0.52-source/xpdf/Array.h +58 -0
  286. data/pdf2json-0.52-source/xpdf/Array.o +0 -0
  287. data/pdf2json-0.52-source/xpdf/BuiltinFont.cc +65 -0
  288. data/pdf2json-0.52-source/xpdf/BuiltinFont.h +57 -0
  289. data/pdf2json-0.52-source/xpdf/BuiltinFont.o +0 -0
  290. data/pdf2json-0.52-source/xpdf/BuiltinFontTables.cc +4284 -0
  291. data/pdf2json-0.52-source/xpdf/BuiltinFontTables.h +23 -0
  292. data/pdf2json-0.52-source/xpdf/BuiltinFontTables.o +0 -0
  293. data/pdf2json-0.52-source/xpdf/CMap.cc +408 -0
  294. data/pdf2json-0.52-source/xpdf/CMap.h +102 -0
  295. data/pdf2json-0.52-source/xpdf/CMap.o +0 -0
  296. data/pdf2json-0.52-source/xpdf/Catalog.cc +374 -0
  297. data/pdf2json-0.52-source/xpdf/Catalog.h +97 -0
  298. data/pdf2json-0.52-source/xpdf/Catalog.o +0 -0
  299. data/pdf2json-0.52-source/xpdf/CharCodeToUnicode.cc +540 -0
  300. data/pdf2json-0.52-source/xpdf/CharCodeToUnicode.h +117 -0
  301. data/pdf2json-0.52-source/xpdf/CharCodeToUnicode.o +0 -0
  302. data/pdf2json-0.52-source/xpdf/CharTypes.h +24 -0
  303. data/pdf2json-0.52-source/xpdf/CompactFontTables.h +464 -0
  304. data/pdf2json-0.52-source/xpdf/CoreOutputDev.cc +61 -0
  305. data/pdf2json-0.52-source/xpdf/CoreOutputDev.h +61 -0
  306. data/pdf2json-0.52-source/xpdf/Decrypt.cc +776 -0
  307. data/pdf2json-0.52-source/xpdf/Decrypt.h +95 -0
  308. data/pdf2json-0.52-source/xpdf/Decrypt.o +0 -0
  309. data/pdf2json-0.52-source/xpdf/Dict.cc +95 -0
  310. data/pdf2json-0.52-source/xpdf/Dict.h +77 -0
  311. data/pdf2json-0.52-source/xpdf/Dict.o +0 -0
  312. data/pdf2json-0.52-source/xpdf/Error.cc +38 -0
  313. data/pdf2json-0.52-source/xpdf/Error.h +23 -0
  314. data/pdf2json-0.52-source/xpdf/Error.o +0 -0
  315. data/pdf2json-0.52-source/xpdf/ErrorCodes.h +36 -0
  316. data/pdf2json-0.52-source/xpdf/FontEncodingTables.cc +1824 -0
  317. data/pdf2json-0.52-source/xpdf/FontEncodingTables.h +20 -0
  318. data/pdf2json-0.52-source/xpdf/FontEncodingTables.o +0 -0
  319. data/pdf2json-0.52-source/xpdf/Function.cc +1573 -0
  320. data/pdf2json-0.52-source/xpdf/Function.h +229 -0
  321. data/pdf2json-0.52-source/xpdf/Function.o +0 -0
  322. data/pdf2json-0.52-source/xpdf/Gfx.cc +4187 -0
  323. data/pdf2json-0.52-source/xpdf/Gfx.h +312 -0
  324. data/pdf2json-0.52-source/xpdf/Gfx.o +0 -0
  325. data/pdf2json-0.52-source/xpdf/GfxFont.cc +1568 -0
  326. data/pdf2json-0.52-source/xpdf/GfxFont.h +320 -0
  327. data/pdf2json-0.52-source/xpdf/GfxFont.o +0 -0
  328. data/pdf2json-0.52-source/xpdf/GfxState.cc +4137 -0
  329. data/pdf2json-0.52-source/xpdf/GfxState.h +1244 -0
  330. data/pdf2json-0.52-source/xpdf/GfxState.o +0 -0
  331. data/pdf2json-0.52-source/xpdf/GlobalParams.cc +2924 -0
  332. data/pdf2json-0.52-source/xpdf/GlobalParams.cc.old +2908 -0
  333. data/pdf2json-0.52-source/xpdf/GlobalParams.h +466 -0
  334. data/pdf2json-0.52-source/xpdf/GlobalParams.h.old +463 -0
  335. data/pdf2json-0.52-source/xpdf/GlobalParams.o +0 -0
  336. data/pdf2json-0.52-source/xpdf/ImageOutputDev.cc +195 -0
  337. data/pdf2json-0.52-source/xpdf/ImageOutputDev.h +76 -0
  338. data/pdf2json-0.52-source/xpdf/ImageOutputDev.o +0 -0
  339. data/pdf2json-0.52-source/xpdf/JArithmeticDecoder.cc +322 -0
  340. data/pdf2json-0.52-source/xpdf/JArithmeticDecoder.h +109 -0
  341. data/pdf2json-0.52-source/xpdf/JArithmeticDecoder.o +0 -0
  342. data/pdf2json-0.52-source/xpdf/JBIG2Stream.cc +3413 -0
  343. data/pdf2json-0.52-source/xpdf/JBIG2Stream.h +145 -0
  344. data/pdf2json-0.52-source/xpdf/JBIG2Stream.o +0 -0
  345. data/pdf2json-0.52-source/xpdf/JPXStream.cc +3144 -0
  346. data/pdf2json-0.52-source/xpdf/JPXStream.h +351 -0
  347. data/pdf2json-0.52-source/xpdf/JPXStream.o +0 -0
  348. data/pdf2json-0.52-source/xpdf/Lexer.cc +485 -0
  349. data/pdf2json-0.52-source/xpdf/Lexer.h +80 -0
  350. data/pdf2json-0.52-source/xpdf/Lexer.o +0 -0
  351. data/pdf2json-0.52-source/xpdf/Link.cc +806 -0
  352. data/pdf2json-0.52-source/xpdf/Link.cc.old +784 -0
  353. data/pdf2json-0.52-source/xpdf/Link.h +415 -0
  354. data/pdf2json-0.52-source/xpdf/Link.h.old +369 -0
  355. data/pdf2json-0.52-source/xpdf/Link.o +0 -0
  356. data/pdf2json-0.52-source/xpdf/Makefile +232 -0
  357. data/pdf2json-0.52-source/xpdf/Makefile.dep +0 -0
  358. data/pdf2json-0.52-source/xpdf/Makefile.in +232 -0
  359. data/pdf2json-0.52-source/xpdf/NameToCharCode.cc +116 -0
  360. data/pdf2json-0.52-source/xpdf/NameToCharCode.h +42 -0
  361. data/pdf2json-0.52-source/xpdf/NameToCharCode.o +0 -0
  362. data/pdf2json-0.52-source/xpdf/NameToUnicodeTable.h +1097 -0
  363. data/pdf2json-0.52-source/xpdf/Object.cc +231 -0
  364. data/pdf2json-0.52-source/xpdf/Object.h +303 -0
  365. data/pdf2json-0.52-source/xpdf/Object.o +0 -0
  366. data/pdf2json-0.52-source/xpdf/Outline.cc +151 -0
  367. data/pdf2json-0.52-source/xpdf/Outline.h +76 -0
  368. data/pdf2json-0.52-source/xpdf/Outline.o +0 -0
  369. data/pdf2json-0.52-source/xpdf/OutputDev.cc +131 -0
  370. data/pdf2json-0.52-source/xpdf/OutputDev.h +253 -0
  371. data/pdf2json-0.52-source/xpdf/OutputDev.o +0 -0
  372. data/pdf2json-0.52-source/xpdf/PDFCore.cc +2044 -0
  373. data/pdf2json-0.52-source/xpdf/PDFCore.h +321 -0
  374. data/pdf2json-0.52-source/xpdf/PDFDoc.cc +404 -0
  375. data/pdf2json-0.52-source/xpdf/PDFDoc.h +183 -0
  376. data/pdf2json-0.52-source/xpdf/PDFDoc.o +0 -0
  377. data/pdf2json-0.52-source/xpdf/PDFDocEncoding.cc +44 -0
  378. data/pdf2json-0.52-source/xpdf/PDFDocEncoding.h +16 -0
  379. data/pdf2json-0.52-source/xpdf/PDFDocEncoding.o +0 -0
  380. data/pdf2json-0.52-source/xpdf/PSOutputDev.cc +6224 -0
  381. data/pdf2json-0.52-source/xpdf/PSOutputDev.h +395 -0
  382. data/pdf2json-0.52-source/xpdf/PSOutputDev.o +0 -0
  383. data/pdf2json-0.52-source/xpdf/PSTokenizer.cc +135 -0
  384. data/pdf2json-0.52-source/xpdf/PSTokenizer.h +41 -0
  385. data/pdf2json-0.52-source/xpdf/PSTokenizer.o +0 -0
  386. data/pdf2json-0.52-source/xpdf/Page.cc +454 -0
  387. data/pdf2json-0.52-source/xpdf/Page.h +187 -0
  388. data/pdf2json-0.52-source/xpdf/Page.o +0 -0
  389. data/pdf2json-0.52-source/xpdf/Parser.cc +227 -0
  390. data/pdf2json-0.52-source/xpdf/Parser.h +59 -0
  391. data/pdf2json-0.52-source/xpdf/Parser.o +0 -0
  392. data/pdf2json-0.52-source/xpdf/PreScanOutputDev.cc +257 -0
  393. data/pdf2json-0.52-source/xpdf/PreScanOutputDev.h +130 -0
  394. data/pdf2json-0.52-source/xpdf/PreScanOutputDev.o +0 -0
  395. data/pdf2json-0.52-source/xpdf/SecurityHandler.cc +390 -0
  396. data/pdf2json-0.52-source/xpdf/SecurityHandler.h +160 -0
  397. data/pdf2json-0.52-source/xpdf/SecurityHandler.o +0 -0
  398. data/pdf2json-0.52-source/xpdf/SplashOutputDev.cc +2845 -0
  399. data/pdf2json-0.52-source/xpdf/SplashOutputDev.h +247 -0
  400. data/pdf2json-0.52-source/xpdf/SplashOutputDev.o +0 -0
  401. data/pdf2json-0.52-source/xpdf/Stream-CCITT.h +459 -0
  402. data/pdf2json-0.52-source/xpdf/Stream.cc +4627 -0
  403. data/pdf2json-0.52-source/xpdf/Stream.h +858 -0
  404. data/pdf2json-0.52-source/xpdf/Stream.o +0 -0
  405. data/pdf2json-0.52-source/xpdf/TextOutputDev.cc +4090 -0
  406. data/pdf2json-0.52-source/xpdf/TextOutputDev.h +661 -0
  407. data/pdf2json-0.52-source/xpdf/TextOutputDev.o +0 -0
  408. data/pdf2json-0.52-source/xpdf/UTF8.h +56 -0
  409. data/pdf2json-0.52-source/xpdf/UnicodeMap.cc +302 -0
  410. data/pdf2json-0.52-source/xpdf/UnicodeMap.cc.old +293 -0
  411. data/pdf2json-0.52-source/xpdf/UnicodeMap.h +135 -0
  412. data/pdf2json-0.52-source/xpdf/UnicodeMap.h.old +123 -0
  413. data/pdf2json-0.52-source/xpdf/UnicodeMap.o +0 -0
  414. data/pdf2json-0.52-source/xpdf/UnicodeMapTables.h +361 -0
  415. data/pdf2json-0.52-source/xpdf/UnicodeTypeTable.cc +949 -0
  416. data/pdf2json-0.52-source/xpdf/UnicodeTypeTable.h +20 -0
  417. data/pdf2json-0.52-source/xpdf/UnicodeTypeTable.o +0 -0
  418. data/pdf2json-0.52-source/xpdf/XPDFApp.cc +447 -0
  419. data/pdf2json-0.52-source/xpdf/XPDFApp.h +114 -0
  420. data/pdf2json-0.52-source/xpdf/XPDFCore.cc +1655 -0
  421. data/pdf2json-0.52-source/xpdf/XPDFCore.h +251 -0
  422. data/pdf2json-0.52-source/xpdf/XPDFTree.cc +931 -0
  423. data/pdf2json-0.52-source/xpdf/XPDFTree.h +45 -0
  424. data/pdf2json-0.52-source/xpdf/XPDFTreeP.h +87 -0
  425. data/pdf2json-0.52-source/xpdf/XPDFViewer.cc +3488 -0
  426. data/pdf2json-0.52-source/xpdf/XPDFViewer.h +352 -0
  427. data/pdf2json-0.52-source/xpdf/XRef.cc +896 -0
  428. data/pdf2json-0.52-source/xpdf/XRef.h +133 -0
  429. data/pdf2json-0.52-source/xpdf/XRef.o +0 -0
  430. data/pdf2json-0.52-source/xpdf/XpdfPluginAPI.cc +262 -0
  431. data/pdf2json-0.52-source/xpdf/XpdfPluginAPI.h +341 -0
  432. data/pdf2json-0.52-source/xpdf/XpdfPluginAPI.o +0 -0
  433. data/pdf2json-0.52-source/xpdf/about-text.h +48 -0
  434. data/pdf2json-0.52-source/xpdf/about.xbm +6 -0
  435. data/pdf2json-0.52-source/xpdf/backArrow.xbm +6 -0
  436. data/pdf2json-0.52-source/xpdf/backArrowDis.xbm +6 -0
  437. data/pdf2json-0.52-source/xpdf/config.h +112 -0
  438. data/pdf2json-0.52-source/xpdf/dblLeftArrow.xbm +6 -0
  439. data/pdf2json-0.52-source/xpdf/dblLeftArrowDis.xbm +6 -0
  440. data/pdf2json-0.52-source/xpdf/dblRightArrow.xbm +6 -0
  441. data/pdf2json-0.52-source/xpdf/dblRightArrowDis.xbm +6 -0
  442. data/pdf2json-0.52-source/xpdf/find.xbm +6 -0
  443. data/pdf2json-0.52-source/xpdf/findDis.xbm +6 -0
  444. data/pdf2json-0.52-source/xpdf/forwardArrow.xbm +6 -0
  445. data/pdf2json-0.52-source/xpdf/forwardArrowDis.xbm +6 -0
  446. data/pdf2json-0.52-source/xpdf/leftArrow.xbm +5 -0
  447. data/pdf2json-0.52-source/xpdf/leftArrowDis.xbm +5 -0
  448. data/pdf2json-0.52-source/xpdf/libXpdf.a +0 -0
  449. data/pdf2json-0.52-source/xpdf/pdffonts +0 -0
  450. data/pdf2json-0.52-source/xpdf/pdffonts.cc +298 -0
  451. data/pdf2json-0.52-source/xpdf/pdffonts.o +0 -0
  452. data/pdf2json-0.52-source/xpdf/pdfimages +0 -0
  453. data/pdf2json-0.52-source/xpdf/pdfimages.cc +155 -0
  454. data/pdf2json-0.52-source/xpdf/pdfimages.o +0 -0
  455. data/pdf2json-0.52-source/xpdf/pdfinfo +0 -0
  456. data/pdf2json-0.52-source/xpdf/pdfinfo.cc +387 -0
  457. data/pdf2json-0.52-source/xpdf/pdfinfo.o +0 -0
  458. data/pdf2json-0.52-source/xpdf/pdftoppm.cc +203 -0
  459. data/pdf2json-0.52-source/xpdf/pdftops +0 -0
  460. data/pdf2json-0.52-source/xpdf/pdftops.cc +344 -0
  461. data/pdf2json-0.52-source/xpdf/pdftops.o +0 -0
  462. data/pdf2json-0.52-source/xpdf/pdftotext +0 -0
  463. data/pdf2json-0.52-source/xpdf/pdftotext.cc +333 -0
  464. data/pdf2json-0.52-source/xpdf/pdftotext.o +0 -0
  465. data/pdf2json-0.52-source/xpdf/print.xbm +6 -0
  466. data/pdf2json-0.52-source/xpdf/printDis.xbm +6 -0
  467. data/pdf2json-0.52-source/xpdf/rightArrow.xbm +5 -0
  468. data/pdf2json-0.52-source/xpdf/rightArrowDis.xbm +5 -0
  469. data/pdf2json-0.52-source/xpdf/vms_make.com +129 -0
  470. data/pdf2json-0.52-source/xpdf/xpdf.cc +344 -0
  471. data/pdf2json-0.52-source/xpdf/xpdfIcon.xpm +62 -0
  472. data/pdf2json.gemspec +29 -0
  473. metadata +518 -0
@@ -0,0 +1,91 @@
1
+ #ifndef _XML_FONTS_H
2
+ #define _XML_FONTS_H
3
+ #include "GVector.h"
4
+ #include "GString.h"
5
+ #include "GfxState.h"
6
+ #include "CharTypes.h"
7
+
8
+
9
+ class XmlFontColor{
10
+ private:
11
+ unsigned int r;
12
+ unsigned int g;
13
+ unsigned int b;
14
+ GBool Ok(unsigned int xcol){ return ((xcol<=255)&&(xcol>=0));}
15
+ GString *convtoX(unsigned int xcol) const;
16
+ public:
17
+ XmlFontColor():r(0),g(0),b(0){}
18
+ XmlFontColor(GfxRGB rgb);
19
+ XmlFontColor(const XmlFontColor& x){r=x.r;g=x.g;b=x.b;}
20
+ XmlFontColor& operator=(const XmlFontColor &x){
21
+ r=x.r;g=x.g;b=x.b;
22
+ return *this;
23
+ }
24
+ ~XmlFontColor(){};
25
+ GString* toString() const;
26
+ GBool isEqual(const XmlFontColor& col) const{
27
+ return ((r==col.r)&&(g==col.g)&&(b==col.b));
28
+ }
29
+ } ;
30
+
31
+
32
+ class XmlFont{
33
+ private:
34
+ unsigned int size;
35
+ double charspace;
36
+ int lineSize;
37
+ GBool italic;
38
+ GBool bold;
39
+ GBool oblique;
40
+ int pos; // position of the font name in the fonts array
41
+ static GString *DefaultFont;
42
+ GString *FontName;
43
+ XmlFontColor color;
44
+ static GString* HtmlFilter(Unicode* u, int uLen); //char* s);
45
+ public:
46
+
47
+ XmlFont(){FontName=NULL;};
48
+ XmlFont(GString* fontname,int _size,double _charspace, GfxRGB rgb);
49
+ XmlFont(const XmlFont& x);
50
+ XmlFont& operator=(const XmlFont& x);
51
+ XmlFontColor getColor() const {return color;}
52
+ ~XmlFont();
53
+ static void clear();
54
+ GString* getFullName();
55
+ GBool isItalic() const {return italic;}
56
+ GBool isBold() const {return bold;}
57
+ GBool isOblique() const {return oblique;}
58
+ unsigned int getSize() const {return size;}
59
+ int getLineSize() const {return lineSize;}
60
+ void setLineSize(int _lineSize) { lineSize = _lineSize; }
61
+ GString* getFontName();
62
+ double getCharSpace() const {return charspace;}
63
+ void setCharSpace(double _charspace){charspace = _charspace;}
64
+ static GString* getDefaultFont();
65
+ static void setDefaultFont(GString* defaultFont);
66
+ GBool isEqual(const XmlFont& x) const;
67
+ GBool isEqualIgnoreBold(const XmlFont& x) const;
68
+ static GString* simple(XmlFont *font, Unicode *content, int uLen);
69
+ void print() const {printf("font: %s %d %s%spos: %d\n", FontName->getCString(), size, bold ? "bold " : "", italic ? "italic " : "", pos);};
70
+ };
71
+
72
+ class XmlFontAccu{
73
+ private:
74
+ GVector<XmlFont> *accu;
75
+
76
+ public:
77
+ XmlFontAccu();
78
+ ~XmlFontAccu();
79
+ int AddFont(const XmlFont& font);
80
+ XmlFont* Get(int i){
81
+ GVector<XmlFont>::iterator g=accu->begin();
82
+ g+=i;
83
+ return g;
84
+ }
85
+ GString* getCSStyle (int i, GString* content);
86
+ /* GString* EscapeSpecialChars(GString* content); */
87
+ GString* CSStyle(int i,GBool textAsJSON);
88
+ int size() const {return accu->size();}
89
+
90
+ };
91
+ #endif
Binary file
@@ -0,0 +1,101 @@
1
+ #include "XmlLinks.h"
2
+
3
+ XmlLink::XmlLink(const XmlLink& x){
4
+ Xmin=x.Xmin;
5
+ Ymin=x.Ymin;
6
+ Xmax=x.Xmax;
7
+ Ymax=x.Ymax;
8
+ dest=new GString(x.dest);
9
+ }
10
+
11
+ XmlLink::XmlLink(double xmin,double ymin,double xmax,double ymax,GString * _dest)
12
+ {
13
+ if (xmin < xmax) {
14
+ Xmin=xmin;
15
+ Xmax=xmax;
16
+ } else {
17
+ Xmin=xmax;
18
+ Xmax=xmin;
19
+ }
20
+ if (ymin < ymax) {
21
+ Ymin=ymin;
22
+ Ymax=ymax;
23
+ } else {
24
+ Ymin=ymax;
25
+ Ymax=ymin;
26
+ }
27
+ dest=new GString(_dest);
28
+ }
29
+
30
+ XmlLink::~XmlLink(){
31
+ if (dest) delete dest;
32
+ }
33
+
34
+ GBool XmlLink::isEqualDest(const XmlLink& x) const{
35
+ return (!strcmp(dest->getCString(), x.dest->getCString()));
36
+ }
37
+
38
+ GBool XmlLink::inLink(double xmin,double ymin,double xmax,double ymax) const {
39
+ double y=(ymin+ymax)/2;
40
+ if (y>Ymax) return gFalse;
41
+ return (y>Ymin)&&(xmin<Xmax)&&(xmax>Xmin);
42
+ }
43
+
44
+
45
+ XmlLink& XmlLink::operator=(const XmlLink& x){
46
+ if (this==&x) return *this;
47
+ if (dest) {delete dest;dest=NULL;}
48
+ Xmin=x.Xmin;
49
+ Ymin=x.Ymin;
50
+ Xmax=x.Xmax;
51
+ Ymax=x.Ymax;
52
+ dest=new GString(x.dest);
53
+ return *this;
54
+ }
55
+
56
+ GString* XmlLink::getLinkStart() {
57
+ GString *res = new GString("");
58
+ res->append(dest);
59
+ // res->append("\">");
60
+ return res;
61
+ }
62
+
63
+ /*GString* XmlLink::Link(GString* content){
64
+ //GString* _dest=new GString(dest);
65
+ GString *tmp=new GString("<a href=\"");
66
+ tmp->append(dest);
67
+ tmp->append("\">");
68
+ tmp->append(content);
69
+ tmp->append("</a>");
70
+ //delete _dest;
71
+ return tmp;
72
+ }*/
73
+
74
+
75
+
76
+ XmlLinks::XmlLinks(){
77
+ accu=new GVector<XmlLink>();
78
+ }
79
+
80
+ XmlLinks::~XmlLinks(){
81
+ delete accu;
82
+ accu=NULL;
83
+ }
84
+
85
+ GBool XmlLinks::inLink(double xmin,double ymin,double xmax,double ymax,int& p)const {
86
+
87
+ for(GVector<XmlLink>::iterator i=accu->begin();i!=accu->end();i++){
88
+ if (i->inLink(xmin,ymin,xmax,ymax)) {
89
+ p=(i - accu->begin());
90
+ return 1;
91
+ }
92
+ }
93
+ return 0;
94
+ }
95
+
96
+ XmlLink* XmlLinks::getLink(int i) const{
97
+ GVector<XmlLink>::iterator g=accu->begin();
98
+ g+=i;
99
+ return g;
100
+ }
101
+
@@ -0,0 +1,54 @@
1
+ #ifndef _HTML_LINKS
2
+ #define _HTML_LINKS
3
+
4
+ #include "GVector.h"
5
+ #include "GString.h"
6
+ #include <stdio.h>
7
+ #include <stdlib.h>
8
+ #include <string.h>
9
+ #ifndef _WIN32
10
+ #include <sys/unistd.h>
11
+ #endif
12
+
13
+ class XmlLink{
14
+
15
+ private:
16
+ double Xmin;
17
+ double Ymin;
18
+ double Xmax;
19
+ double Ymax;
20
+ GString* dest;
21
+
22
+ public:
23
+ XmlLink(){dest=NULL;}
24
+ XmlLink(const XmlLink& x);
25
+ XmlLink& operator=(const XmlLink& x);
26
+ XmlLink(double xmin,double ymin,double xmax,double ymax,GString *_dest);
27
+ ~XmlLink();
28
+ //GBool XmlLink::isEqualDest(const XmlLink& x) const; // this kills gcc 4.*
29
+ GBool isEqualDest(const XmlLink& x) const;
30
+ GString *getDest(){return new GString(dest);}
31
+ double getX1() const {return Xmin;}
32
+ double getX2() const {return Xmax;}
33
+ double getY1() const {return Ymin;}
34
+ double getY2() const {return Ymax;}
35
+ GBool inLink(double xmin,double ymin,double xmax,double ymax) const ;
36
+ //GString *Link(GString *content);
37
+ GString* getLinkStart();
38
+
39
+ };
40
+
41
+ class XmlLinks{
42
+ private:
43
+ GVector<XmlLink> *accu;
44
+ public:
45
+ XmlLinks();
46
+ ~XmlLinks();
47
+ void AddLink(const XmlLink& x) {accu->push_back(x);}
48
+ GBool inLink(double xmin,double ymin,double xmax,double ymax,int& p) const;
49
+ XmlLink* getLink(int i) const;
50
+
51
+ };
52
+
53
+ #endif
54
+
Binary file
Binary file
@@ -0,0 +1,343 @@
1
+ //========================================================================
2
+ //
3
+ // pdf2json.cc
4
+ //
5
+ //
6
+ // Copyright 2011 Devaldi Ltd
7
+ //
8
+ // Copyright 1997-2002 Glyph & Cog, LLC
9
+ //
10
+ // Changed 1999-2000 by G.Ovtcharov
11
+ //
12
+ // Changed 2002 by Mikhail Kruk
13
+ //========================================================================
14
+
15
+ #include <stdio.h>
16
+ #include <stdlib.h>
17
+ #include <stddef.h>
18
+ #include <string.h>
19
+ #include <aconf.h>
20
+ #include <time.h>
21
+ #include "parseargs.h"
22
+ #include "GString.h"
23
+ #include "gmem.h"
24
+ #include "Object.h"
25
+ #include "Stream.h"
26
+ #include "Array.h"
27
+ #include "Dict.h"
28
+ #include "XRef.h"
29
+ #include "Catalog.h"
30
+ #include "Page.h"
31
+ #include "PDFDoc.h"
32
+ #include "ImgOutputDev.h"
33
+ #include "GlobalParams.h"
34
+ #include "Error.h"
35
+ #include "config.h"
36
+ #include "gfile.h"
37
+
38
+ static int firstPage = 1;
39
+ static int lastPage = 0;
40
+ static GBool rawOrder = gTrue;
41
+ static GBool textAsJSON = gTrue;
42
+ static GBool compressData = gFalse;
43
+ GBool printCommands = gTrue;
44
+ static GBool printHelp = gFalse;
45
+ GBool printHtml = gFalse;
46
+ GBool complexMode=gTrue;
47
+ GBool ignore=gFalse;
48
+ double scale=1.5;
49
+ GBool noframes=gFalse;
50
+ GBool stout=gFalse;
51
+ GBool xml=gFalse;
52
+ GBool errQuiet=gFalse;
53
+
54
+ GBool showHidden = gFalse;
55
+ GBool noMerge = gTrue;
56
+ static char ownerPassword[33] = "";
57
+ static char userPassword[33] = "";
58
+ static char gsDevice[33] = "png16m";
59
+ static GBool printVersion = gFalse;
60
+
61
+ static GString* getInfoString(Dict *infoDict, char *key);
62
+ static GString* getInfoDate(Dict *infoDict, char *key);
63
+
64
+ static char textEncName[128] = "";
65
+
66
+ static ArgDesc argDesc[] = {
67
+ {"-f", argInt, &firstPage, 0,
68
+ "first page to convert"},
69
+ {"-l", argInt, &lastPage, 0,
70
+ "last page to convert"},
71
+ {"-compress", argFlag, &compressData, 0,
72
+ "Use compressed mode"},
73
+ {"-q", argFlag, &errQuiet, 0,
74
+ "don't print any messages or errors"},
75
+ {"-h", argFlag, &printHelp, 0,
76
+ "print usage information"},
77
+ {"-help", argFlag, &printHelp, 0,
78
+ "print usage information"},
79
+ {"-i", argFlag, &ignore, 0,
80
+ "ignore images"},
81
+ {"-noframes", argFlag, &noframes, 0,
82
+ "use standard output"},
83
+ /* {"-zoom", argFP, &scale, 0,
84
+ "zoom the pdf document (default 1.5)"}, */
85
+ {"-xml", argFlag, &xml, 0,
86
+ "output for XML post-processing"},
87
+ {"-hidden", argFlag, &showHidden, 0,
88
+ "output hidden text"},
89
+ {"-enc", argString, textEncName, sizeof(textEncName),
90
+ "output text encoding name"},
91
+ {"-v", argFlag, &printVersion, 0,
92
+ "print copyright and version info"},
93
+ {"-opw", argString, ownerPassword, sizeof(ownerPassword),
94
+ "owner password (for encrypted files)"},
95
+ {"-upw", argString, userPassword, sizeof(userPassword),
96
+ "user password (for encrypted files)"},
97
+ {NULL}
98
+ };
99
+
100
+ int main(int argc, char *argv[]) {
101
+ PDFDoc *doc = NULL;
102
+ GString *fileName = NULL;
103
+ GString *docTitle = NULL;
104
+ GString *author = NULL, *keywords = NULL, *subject = NULL, *date = NULL;
105
+ GString *htmlFileName = NULL;
106
+ ImgOutputDev *htmlOut = NULL;
107
+ //PSOutputDev *psOut = NULL;
108
+ GBool ok;
109
+ char *p;
110
+ char extension[16] = "png";
111
+ GString *ownerPW, *userPW;
112
+ Object info;
113
+ char * extsList[] = {"png", "jpeg", "bmp", "pcx", "tiff", "pbm", NULL};
114
+
115
+ // parse args
116
+ ok = parseArgs(argDesc, &argc, argv);
117
+ if (!ok || argc < 2 || argc > 3 || printHelp || printVersion) {
118
+ fprintf(stderr, "pdf2json version %s http://flexpaper.devaldi.com/pdf2json/, based on Xpdf version %s\n", "0.52", xpdfVersion);
119
+ fprintf(stderr, "%s\n", "Copyright 1999-2011 Devaldi Ltd, Gueorgui Ovtcharov and Rainer Dorsch");
120
+ fprintf(stderr, "%s\n\n", xpdfCopyright);
121
+ if (!printVersion) {
122
+ printUsage("pdf2json", "<PDF-file> [<xml-file>]", argDesc);
123
+ }
124
+ exit(1);
125
+ }
126
+
127
+ // read config file
128
+ globalParams = new GlobalParams("");
129
+
130
+ if (errQuiet) {
131
+ globalParams->setErrQuiet(errQuiet);
132
+ printCommands = gFalse; // I'm not 100% what is the differecne between them
133
+ }
134
+
135
+ if (textEncName[0]) {
136
+ globalParams->setTextEncoding(textEncName);
137
+ if( !globalParams->getTextEncoding() ) {
138
+ goto error;
139
+ }
140
+ }
141
+
142
+ // open PDF file
143
+ if (ownerPassword[0]) {
144
+ ownerPW = new GString(ownerPassword);
145
+ } else {
146
+ ownerPW = NULL;
147
+ }
148
+ if (userPassword[0]) {
149
+ userPW = new GString(userPassword);
150
+ } else {
151
+ userPW = NULL;
152
+ }
153
+
154
+ fileName = new GString(argv[1]);
155
+
156
+ doc = new PDFDoc(fileName, ownerPW, userPW);
157
+ if (userPW) {
158
+ delete userPW;
159
+ }
160
+ if (ownerPW) {
161
+ delete ownerPW;
162
+ }
163
+ if (!doc->isOk()) {
164
+ goto error;
165
+ }
166
+
167
+ // check for copy permission
168
+ if (!doc->okToCopy()) {
169
+ error(-1, "Copying of text from this document is not allowed.");
170
+ goto error;
171
+ }
172
+
173
+ // construct text file name
174
+ if (argc == 3) {
175
+ GString* tmp = new GString(argv[2]);
176
+ p=tmp->getCString()+tmp->getLength()-5;
177
+
178
+ if (!strcmp(p, ".xml") || !strcmp(p, ".XML"))
179
+ htmlFileName = new GString(tmp->getCString(),
180
+ tmp->getLength() - 5);
181
+ else htmlFileName =new GString(tmp);
182
+
183
+ delete tmp;
184
+ } else {
185
+ p = fileName->getCString() + fileName->getLength() - 4;
186
+ if (!strcmp(p, ".pdf") || !strcmp(p, ".PDF"))
187
+ htmlFileName = new GString(fileName->getCString(),
188
+ fileName->getLength() - 4);
189
+ else
190
+ htmlFileName = fileName->copy();
191
+ }
192
+
193
+ if (scale>3.0) scale=3.0;
194
+ if (scale<0.5) scale=0.5;
195
+
196
+ stout=gFalse;
197
+ complexMode = gTrue;
198
+ noframes = gTrue;
199
+ noMerge = gTrue;
200
+
201
+ // get page range
202
+ if (firstPage < 1)
203
+ firstPage = 1;
204
+ if (lastPage < 1 || lastPage > doc->getNumPages())
205
+ lastPage = doc->getNumPages();
206
+
207
+ doc->getDocInfo(&info);
208
+ if (info.isDict()) {
209
+ docTitle = getInfoString(info.getDict(), "Title");
210
+ author = getInfoString(info.getDict(), "Author");
211
+ keywords = getInfoString(info.getDict(), "Keywords");
212
+ subject = getInfoString(info.getDict(), "Subject");
213
+ date = getInfoDate(info.getDict(), "ModDate");
214
+ if( !date )
215
+ date = getInfoDate(info.getDict(), "CreationDate");
216
+ }
217
+ info.free();
218
+ if( !docTitle ) docTitle = new GString(htmlFileName);
219
+
220
+ /* determine extensions of output backgroun images */
221
+ {int i;
222
+ for(i = 0; extsList[i]; i++)
223
+ {
224
+ if( strstr(gsDevice, extsList[i]) != (char *) NULL )
225
+ {
226
+ strncpy(extension, extsList[i], sizeof(extension));
227
+ break;
228
+ }
229
+ }}
230
+
231
+ rawOrder = complexMode; // todo: figure out what exactly rawOrder do :)
232
+
233
+ if(textAsJSON)
234
+ xml = gTrue;
235
+
236
+ // write text file
237
+ htmlOut = new ImgOutputDev(htmlFileName->getCString(),
238
+ docTitle->getCString(),
239
+ author ? author->getCString() : NULL,
240
+ keywords ? keywords->getCString() : NULL,
241
+ subject ? subject->getCString() : NULL,
242
+ date ? date->getCString() : NULL,
243
+ extension,
244
+ rawOrder,
245
+ textAsJSON,
246
+ compressData,
247
+ firstPage,
248
+ doc->getCatalog()->getOutline()->isDict(),
249
+ doc->getNumPages());
250
+ delete docTitle;
251
+ if( author )
252
+ {
253
+ delete author;
254
+ }
255
+ if( keywords )
256
+ {
257
+ delete keywords;
258
+ }
259
+ if( subject )
260
+ {
261
+ delete subject;
262
+ }
263
+ if( date )
264
+ {
265
+ delete date;
266
+ }
267
+
268
+ if (htmlOut->isOk())
269
+ {
270
+ doc->displayPages(htmlOut, firstPage, lastPage, static_cast<int>(72*scale), static_cast<int>(72*scale), 0, gTrue, gTrue,gTrue,NULL);
271
+
272
+ if (!xml)
273
+ {
274
+ htmlOut->dumpDocOutline(doc->getCatalog());
275
+ }
276
+ }
277
+
278
+ delete htmlOut;
279
+
280
+ // clean up
281
+ error:
282
+ if(doc) delete doc;
283
+ if(globalParams) delete globalParams;
284
+
285
+ if(htmlFileName) delete htmlFileName;
286
+ XmlFont::clear();
287
+
288
+ // check for memory leaks
289
+ Object::memCheck(stderr);
290
+ gMemReport(stderr);
291
+
292
+ return 0;
293
+ }
294
+
295
+ static GString* getInfoString(Dict *infoDict, char *key) {
296
+ Object obj;
297
+ GString *s1 = NULL;
298
+
299
+ if (infoDict->lookup(key, &obj)->isString()) {
300
+ s1 = new GString(obj.getString());
301
+ }
302
+ obj.free();
303
+ return s1;
304
+ }
305
+
306
+ static GString* getInfoDate(Dict *infoDict, char *key) {
307
+ Object obj;
308
+ char *s;
309
+ int year, mon, day, hour, min, sec;
310
+ struct tm tmStruct;
311
+ GString *result = NULL;
312
+ char buf[256];
313
+
314
+ if (infoDict->lookup(key, &obj)->isString()) {
315
+ s = obj.getString()->getCString();
316
+ if (s[0] == 'D' && s[1] == ':') {
317
+ s += 2;
318
+ }
319
+ if (sscanf(s, "%4d%2d%2d%2d%2d%2d",
320
+ &year, &mon, &day, &hour, &min, &sec) == 6) {
321
+ tmStruct.tm_year = year - 1900;
322
+ tmStruct.tm_mon = mon - 1;
323
+ tmStruct.tm_mday = day;
324
+ tmStruct.tm_hour = hour;
325
+ tmStruct.tm_min = min;
326
+ tmStruct.tm_sec = sec;
327
+ tmStruct.tm_wday = -1;
328
+ tmStruct.tm_yday = -1;
329
+ tmStruct.tm_isdst = -1;
330
+ mktime(&tmStruct); // compute the tm_wday and tm_yday fields
331
+ if (strftime(buf, sizeof(buf), "%Y-%m-%dT%H:%M:%S+00:00", &tmStruct)) {
332
+ result = new GString(buf);
333
+ } else {
334
+ result = new GString(s);
335
+ }
336
+ } else {
337
+ result = new GString(s);
338
+ }
339
+ }
340
+ obj.free();
341
+ return result;
342
+ }
343
+