pdf2json 0.1.0
Sign up to get free protection for your applications and to get access to all the features.
- data/README.markdown +9 -0
- data/bin/.gitkeep +0 -0
- data/ext/extconf.rb +30 -0
- data/lib/pdf2json.rb +8 -0
- data/pdf2json-0.52-source/AUTHORS +24 -0
- data/pdf2json-0.52-source/CHANGES +11 -0
- data/pdf2json-0.52-source/Makefile +84 -0
- data/pdf2json-0.52-source/Makefile.in +84 -0
- data/pdf2json-0.52-source/aclocal.m4 +274 -0
- data/pdf2json-0.52-source/aconf-win32.h +86 -0
- data/pdf2json-0.52-source/aconf.h +42 -0
- data/pdf2json-0.52-source/aconf.h.in +41 -0
- data/pdf2json-0.52-source/autom4te.cache/output.0 +6908 -0
- data/pdf2json-0.52-source/autom4te.cache/requests +76 -0
- data/pdf2json-0.52-source/autom4te.cache/traces.0 +466 -0
- data/pdf2json-0.52-source/config.log +1259 -0
- data/pdf2json-0.52-source/config.status +1050 -0
- data/pdf2json-0.52-source/configure +6908 -0
- data/pdf2json-0.52-source/configure.ac +93 -0
- data/pdf2json-0.52-source/doc/pdffonts.1 +130 -0
- data/pdf2json-0.52-source/doc/pdffonts.cat +107 -0
- data/pdf2json-0.52-source/doc/pdffonts.hlp +117 -0
- data/pdf2json-0.52-source/doc/pdfimages.1 +102 -0
- data/pdf2json-0.52-source/doc/pdfimages.cat +92 -0
- data/pdf2json-0.52-source/doc/pdfimages.hlp +101 -0
- data/pdf2json-0.52-source/doc/pdfinfo.1 +158 -0
- data/pdf2json-0.52-source/doc/pdfinfo.cat +119 -0
- data/pdf2json-0.52-source/doc/pdfinfo.hlp +129 -0
- data/pdf2json-0.52-source/doc/pdftoppm.1 +115 -0
- data/pdf2json-0.52-source/doc/pdftoppm.cat +105 -0
- data/pdf2json-0.52-source/doc/pdftoppm.hlp +114 -0
- data/pdf2json-0.52-source/doc/pdftops.1 +229 -0
- data/pdf2json-0.52-source/doc/pdftops.cat +221 -0
- data/pdf2json-0.52-source/doc/pdftops.hlp +231 -0
- data/pdf2json-0.52-source/doc/pdftotext.1 +137 -0
- data/pdf2json-0.52-source/doc/pdftotext.cat +120 -0
- data/pdf2json-0.52-source/doc/pdftotext.hlp +133 -0
- data/pdf2json-0.52-source/doc/sample-xpdfrc +91 -0
- data/pdf2json-0.52-source/doc/xpdf.1 +513 -0
- data/pdf2json-0.52-source/doc/xpdf.cat +476 -0
- data/pdf2json-0.52-source/doc/xpdf.hlp +489 -0
- data/pdf2json-0.52-source/doc/xpdfrc.5 +480 -0
- data/pdf2json-0.52-source/doc/xpdfrc.cat +474 -0
- data/pdf2json-0.52-source/doc/xpdfrc.hlp +479 -0
- data/pdf2json-0.52-source/fofi/.DS_Store +0 -0
- data/pdf2json-0.52-source/fofi/FoFiBase.cc +156 -0
- data/pdf2json-0.52-source/fofi/FoFiBase.h +57 -0
- data/pdf2json-0.52-source/fofi/FoFiBase.o +0 -0
- data/pdf2json-0.52-source/fofi/FoFiEncodings.cc +994 -0
- data/pdf2json-0.52-source/fofi/FoFiEncodings.h +36 -0
- data/pdf2json-0.52-source/fofi/FoFiEncodings.o +0 -0
- data/pdf2json-0.52-source/fofi/FoFiTrueType.cc +2027 -0
- data/pdf2json-0.52-source/fofi/FoFiTrueType.h +174 -0
- data/pdf2json-0.52-source/fofi/FoFiTrueType.o +0 -0
- data/pdf2json-0.52-source/fofi/FoFiType1.cc +252 -0
- data/pdf2json-0.52-source/fofi/FoFiType1.h +59 -0
- data/pdf2json-0.52-source/fofi/FoFiType1.o +0 -0
- data/pdf2json-0.52-source/fofi/FoFiType1C.cc +2603 -0
- data/pdf2json-0.52-source/fofi/FoFiType1C.h +233 -0
- data/pdf2json-0.52-source/fofi/FoFiType1C.o +0 -0
- data/pdf2json-0.52-source/fofi/Makefile +70 -0
- data/pdf2json-0.52-source/fofi/Makefile.dep +0 -0
- data/pdf2json-0.52-source/fofi/Makefile.in +70 -0
- data/pdf2json-0.52-source/fofi/libfofi.a +0 -0
- data/pdf2json-0.52-source/fofi/vms_make.com +0 -0
- data/pdf2json-0.52-source/freetype.win32/.DS_Store +0 -0
- data/pdf2json-0.52-source/freetype.win32/include/.DS_Store +0 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/config/ftconfig.h +528 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/config/ftheader.h +780 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/config/ftmodule.h +32 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/config/ftoption.h +733 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/config/ftstdlib.h +173 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/freetype.h +3919 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftadvanc.h +179 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftbbox.h +94 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftbdf.h +209 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftbitmap.h +227 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftcache.h +1128 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftchapters.h +103 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftcid.h +166 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/fterrdef.h +244 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/fterrors.h +206 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftgasp.h +120 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftglyph.h +613 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftgxval.h +358 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftgzip.h +102 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftimage.h +1313 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftincrem.h +353 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftlcdfil.h +213 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftlist.h +277 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftlzw.h +99 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftmac.h +274 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftmm.h +378 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftmodapi.h +483 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftmoderr.h +155 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftotval.h +203 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftoutln.h +537 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftpfr.h +172 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftrender.h +230 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftsizes.h +159 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftsnames.h +200 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftstroke.h +716 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftsynth.h +80 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftsystem.h +347 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/fttrigon.h +350 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/fttypes.h +588 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftwinfnt.h +274 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ftxf86.h +83 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/autohint.h +231 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftcalc.h +179 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftdebug.h +250 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftdriver.h +422 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftgloadr.h +168 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftmemory.h +380 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftobjs.h +1428 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftpic.h +67 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftrfork.h +196 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftserv.h +620 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftstream.h +539 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/fttrace.h +139 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/ftvalid.h +150 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/internal.h +51 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/pcftypes.h +56 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/psaux.h +873 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/pshints.h +712 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svbdf.h +77 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svcid.h +83 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svgldict.h +82 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svgxval.h +72 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svkern.h +51 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svmm.h +104 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svotval.h +55 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svpfr.h +66 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svpostnm.h +79 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svpscmap.h +164 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svpsinfo.h +92 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svsfnt.h +102 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svttcmap.h +106 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svtteng.h +53 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svttglyf.h +67 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svwinfnt.h +50 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/services/svxf86nm.h +55 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/sfnt.h +897 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/t1types.h +270 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/internal/tttypes.h +1543 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/t1tables.h +504 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ttnameid.h +1247 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/tttables.h +759 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/tttags.h +107 -0
- data/pdf2json-0.52-source/freetype.win32/include/freetype/ttunpat.h +59 -0
- data/pdf2json-0.52-source/freetype.win32/include/ft2build.h +39 -0
- data/pdf2json-0.52-source/freetype.win32/lib/freetype_a.lib +0 -0
- data/pdf2json-0.52-source/goo/.DS_Store +0 -0
- data/pdf2json-0.52-source/goo/FixedPoint.cc +118 -0
- data/pdf2json-0.52-source/goo/FixedPoint.h +155 -0
- data/pdf2json-0.52-source/goo/FixedPoint.o +0 -0
- data/pdf2json-0.52-source/goo/GHash.cc +380 -0
- data/pdf2json-0.52-source/goo/GHash.h +78 -0
- data/pdf2json-0.52-source/goo/GHash.o +0 -0
- data/pdf2json-0.52-source/goo/GList.cc +97 -0
- data/pdf2json-0.52-source/goo/GList.h +96 -0
- data/pdf2json-0.52-source/goo/GList.o +0 -0
- data/pdf2json-0.52-source/goo/GMutex.h +49 -0
- data/pdf2json-0.52-source/goo/GString.cc +724 -0
- data/pdf2json-0.52-source/goo/GString.cc.fixed +718 -0
- data/pdf2json-0.52-source/goo/GString.h +136 -0
- data/pdf2json-0.52-source/goo/GString.o +0 -0
- data/pdf2json-0.52-source/goo/ImgWriter.o +0 -0
- data/pdf2json-0.52-source/goo/JpegWriter.o +0 -0
- data/pdf2json-0.52-source/goo/Makefile +72 -0
- data/pdf2json-0.52-source/goo/Makefile.dep +0 -0
- data/pdf2json-0.52-source/goo/Makefile.in +72 -0
- data/pdf2json-0.52-source/goo/PNGWriter.o +0 -0
- data/pdf2json-0.52-source/goo/gfile.cc +731 -0
- data/pdf2json-0.52-source/goo/gfile.h +138 -0
- data/pdf2json-0.52-source/goo/gfile.o +0 -0
- data/pdf2json-0.52-source/goo/gmem.cc +264 -0
- data/pdf2json-0.52-source/goo/gmem.h +79 -0
- data/pdf2json-0.52-source/goo/gmem.o +0 -0
- data/pdf2json-0.52-source/goo/gmempp.cc +32 -0
- data/pdf2json-0.52-source/goo/gmempp.o +0 -0
- data/pdf2json-0.52-source/goo/gtypes.h +29 -0
- data/pdf2json-0.52-source/goo/libGoo.a +0 -0
- data/pdf2json-0.52-source/goo/parseargs.c +190 -0
- data/pdf2json-0.52-source/goo/parseargs.h +71 -0
- data/pdf2json-0.52-source/goo/parseargs.o +0 -0
- data/pdf2json-0.52-source/goo/vms_directory.c +214 -0
- data/pdf2json-0.52-source/goo/vms_dirent.h +67 -0
- data/pdf2json-0.52-source/goo/vms_make.com +82 -0
- data/pdf2json-0.52-source/goo/vms_sys_dirent.h +54 -0
- data/pdf2json-0.52-source/goo/vms_unix_time.h +102 -0
- data/pdf2json-0.52-source/goo/vms_unix_times.c +42 -0
- data/pdf2json-0.52-source/goo/vms_unlink.c +22 -0
- data/pdf2json-0.52-source/ms_make.bat +199 -0
- data/pdf2json-0.52-source/splash/.DS_Store +0 -0
- data/pdf2json-0.52-source/splash/Makefile +103 -0
- data/pdf2json-0.52-source/splash/Makefile.dep +0 -0
- data/pdf2json-0.52-source/splash/Makefile.in +103 -0
- data/pdf2json-0.52-source/splash/Splash.cc +3310 -0
- data/pdf2json-0.52-source/splash/Splash.h +293 -0
- data/pdf2json-0.52-source/splash/Splash.o +0 -0
- data/pdf2json-0.52-source/splash/SplashBitmap.cc +188 -0
- data/pdf2json-0.52-source/splash/SplashBitmap.h +64 -0
- data/pdf2json-0.52-source/splash/SplashBitmap.o +0 -0
- data/pdf2json-0.52-source/splash/SplashClip.cc +382 -0
- data/pdf2json-0.52-source/splash/SplashClip.h +107 -0
- data/pdf2json-0.52-source/splash/SplashClip.o +0 -0
- data/pdf2json-0.52-source/splash/SplashErrorCodes.h +32 -0
- data/pdf2json-0.52-source/splash/SplashFTFont.cc +357 -0
- data/pdf2json-0.52-source/splash/SplashFTFont.h +58 -0
- data/pdf2json-0.52-source/splash/SplashFTFont.o +0 -0
- data/pdf2json-0.52-source/splash/SplashFTFontEngine.cc +179 -0
- data/pdf2json-0.52-source/splash/SplashFTFontEngine.h +65 -0
- data/pdf2json-0.52-source/splash/SplashFTFontEngine.o +0 -0
- data/pdf2json-0.52-source/splash/SplashFTFontFile.cc +114 -0
- data/pdf2json-0.52-source/splash/SplashFTFontFile.h +73 -0
- data/pdf2json-0.52-source/splash/SplashFTFontFile.o +0 -0
- data/pdf2json-0.52-source/splash/SplashFont.cc +176 -0
- data/pdf2json-0.52-source/splash/SplashFont.h +104 -0
- data/pdf2json-0.52-source/splash/SplashFont.o +0 -0
- data/pdf2json-0.52-source/splash/SplashFontEngine.cc +317 -0
- data/pdf2json-0.52-source/splash/SplashFontEngine.h +91 -0
- data/pdf2json-0.52-source/splash/SplashFontEngine.o +0 -0
- data/pdf2json-0.52-source/splash/SplashFontFile.cc +55 -0
- data/pdf2json-0.52-source/splash/SplashFontFile.h +60 -0
- data/pdf2json-0.52-source/splash/SplashFontFile.o +0 -0
- data/pdf2json-0.52-source/splash/SplashFontFileID.cc +23 -0
- data/pdf2json-0.52-source/splash/SplashFontFileID.h +30 -0
- data/pdf2json-0.52-source/splash/SplashFontFileID.o +0 -0
- data/pdf2json-0.52-source/splash/SplashGlyphBitmap.h +26 -0
- data/pdf2json-0.52-source/splash/SplashMath.h +89 -0
- data/pdf2json-0.52-source/splash/SplashPath.cc +184 -0
- data/pdf2json-0.52-source/splash/SplashPath.h +121 -0
- data/pdf2json-0.52-source/splash/SplashPath.o +0 -0
- data/pdf2json-0.52-source/splash/SplashPattern.cc +40 -0
- data/pdf2json-0.52-source/splash/SplashPattern.h +65 -0
- data/pdf2json-0.52-source/splash/SplashPattern.o +0 -0
- data/pdf2json-0.52-source/splash/SplashScreen.cc +383 -0
- data/pdf2json-0.52-source/splash/SplashScreen.h +56 -0
- data/pdf2json-0.52-source/splash/SplashScreen.o +0 -0
- data/pdf2json-0.52-source/splash/SplashState.cc +165 -0
- data/pdf2json-0.52-source/splash/SplashState.h +103 -0
- data/pdf2json-0.52-source/splash/SplashState.o +0 -0
- data/pdf2json-0.52-source/splash/SplashT1Font.cc +287 -0
- data/pdf2json-0.52-source/splash/SplashT1Font.h +57 -0
- data/pdf2json-0.52-source/splash/SplashT1Font.o +0 -0
- data/pdf2json-0.52-source/splash/SplashT1FontEngine.cc +124 -0
- data/pdf2json-0.52-source/splash/SplashT1FontEngine.h +53 -0
- data/pdf2json-0.52-source/splash/SplashT1FontEngine.o +0 -0
- data/pdf2json-0.52-source/splash/SplashT1FontFile.cc +97 -0
- data/pdf2json-0.52-source/splash/SplashT1FontFile.h +58 -0
- data/pdf2json-0.52-source/splash/SplashT1FontFile.o +0 -0
- data/pdf2json-0.52-source/splash/SplashTypes.h +132 -0
- data/pdf2json-0.52-source/splash/SplashXPath.cc +438 -0
- data/pdf2json-0.52-source/splash/SplashXPath.h +100 -0
- data/pdf2json-0.52-source/splash/SplashXPath.o +0 -0
- data/pdf2json-0.52-source/splash/SplashXPathScanner.cc +428 -0
- data/pdf2json-0.52-source/splash/SplashXPathScanner.h +87 -0
- data/pdf2json-0.52-source/splash/SplashXPathScanner.o +0 -0
- data/pdf2json-0.52-source/splash/libsplash.a +0 -0
- data/pdf2json-0.52-source/splash/vms_make.com +0 -0
- data/pdf2json-0.52-source/src/.DS_Store +0 -0
- data/pdf2json-0.52-source/src/GVector.h +101 -0
- data/pdf2json-0.52-source/src/ImgOutputDev.cc +1243 -0
- data/pdf2json-0.52-source/src/ImgOutputDev.h +307 -0
- data/pdf2json-0.52-source/src/ImgOutputDev.o +0 -0
- data/pdf2json-0.52-source/src/Makefile +68 -0
- data/pdf2json-0.52-source/src/Makefile.in +68 -0
- data/pdf2json-0.52-source/src/XmlFonts.cc +367 -0
- data/pdf2json-0.52-source/src/XmlFonts.h +91 -0
- data/pdf2json-0.52-source/src/XmlFonts.o +0 -0
- data/pdf2json-0.52-source/src/XmlLinks.cc +101 -0
- data/pdf2json-0.52-source/src/XmlLinks.h +54 -0
- data/pdf2json-0.52-source/src/XmlLinks.o +0 -0
- data/pdf2json-0.52-source/src/pdf2json +0 -0
- data/pdf2json-0.52-source/src/pdf2json.cc +343 -0
- data/pdf2json-0.52-source/src/pdf2json.o +0 -0
- data/pdf2json-0.52-source/src/pdf2xml.dtd +22 -0
- data/pdf2json-0.52-source/src/pdf2xmljson.dtd +9 -0
- data/pdf2json-0.52-source/xpdf/.DS_Store +0 -0
- data/pdf2json-0.52-source/xpdf/Annot.cc +1556 -0
- data/pdf2json-0.52-source/xpdf/Annot.h +142 -0
- data/pdf2json-0.52-source/xpdf/Annot.o +0 -0
- data/pdf2json-0.52-source/xpdf/Array.cc +73 -0
- data/pdf2json-0.52-source/xpdf/Array.h +58 -0
- data/pdf2json-0.52-source/xpdf/Array.o +0 -0
- data/pdf2json-0.52-source/xpdf/BuiltinFont.cc +65 -0
- data/pdf2json-0.52-source/xpdf/BuiltinFont.h +57 -0
- data/pdf2json-0.52-source/xpdf/BuiltinFont.o +0 -0
- data/pdf2json-0.52-source/xpdf/BuiltinFontTables.cc +4284 -0
- data/pdf2json-0.52-source/xpdf/BuiltinFontTables.h +23 -0
- data/pdf2json-0.52-source/xpdf/BuiltinFontTables.o +0 -0
- data/pdf2json-0.52-source/xpdf/CMap.cc +408 -0
- data/pdf2json-0.52-source/xpdf/CMap.h +102 -0
- data/pdf2json-0.52-source/xpdf/CMap.o +0 -0
- data/pdf2json-0.52-source/xpdf/Catalog.cc +374 -0
- data/pdf2json-0.52-source/xpdf/Catalog.h +97 -0
- data/pdf2json-0.52-source/xpdf/Catalog.o +0 -0
- data/pdf2json-0.52-source/xpdf/CharCodeToUnicode.cc +540 -0
- data/pdf2json-0.52-source/xpdf/CharCodeToUnicode.h +117 -0
- data/pdf2json-0.52-source/xpdf/CharCodeToUnicode.o +0 -0
- data/pdf2json-0.52-source/xpdf/CharTypes.h +24 -0
- data/pdf2json-0.52-source/xpdf/CompactFontTables.h +464 -0
- data/pdf2json-0.52-source/xpdf/CoreOutputDev.cc +61 -0
- data/pdf2json-0.52-source/xpdf/CoreOutputDev.h +61 -0
- data/pdf2json-0.52-source/xpdf/Decrypt.cc +776 -0
- data/pdf2json-0.52-source/xpdf/Decrypt.h +95 -0
- data/pdf2json-0.52-source/xpdf/Decrypt.o +0 -0
- data/pdf2json-0.52-source/xpdf/Dict.cc +95 -0
- data/pdf2json-0.52-source/xpdf/Dict.h +77 -0
- data/pdf2json-0.52-source/xpdf/Dict.o +0 -0
- data/pdf2json-0.52-source/xpdf/Error.cc +38 -0
- data/pdf2json-0.52-source/xpdf/Error.h +23 -0
- data/pdf2json-0.52-source/xpdf/Error.o +0 -0
- data/pdf2json-0.52-source/xpdf/ErrorCodes.h +36 -0
- data/pdf2json-0.52-source/xpdf/FontEncodingTables.cc +1824 -0
- data/pdf2json-0.52-source/xpdf/FontEncodingTables.h +20 -0
- data/pdf2json-0.52-source/xpdf/FontEncodingTables.o +0 -0
- data/pdf2json-0.52-source/xpdf/Function.cc +1573 -0
- data/pdf2json-0.52-source/xpdf/Function.h +229 -0
- data/pdf2json-0.52-source/xpdf/Function.o +0 -0
- data/pdf2json-0.52-source/xpdf/Gfx.cc +4187 -0
- data/pdf2json-0.52-source/xpdf/Gfx.h +312 -0
- data/pdf2json-0.52-source/xpdf/Gfx.o +0 -0
- data/pdf2json-0.52-source/xpdf/GfxFont.cc +1568 -0
- data/pdf2json-0.52-source/xpdf/GfxFont.h +320 -0
- data/pdf2json-0.52-source/xpdf/GfxFont.o +0 -0
- data/pdf2json-0.52-source/xpdf/GfxState.cc +4137 -0
- data/pdf2json-0.52-source/xpdf/GfxState.h +1244 -0
- data/pdf2json-0.52-source/xpdf/GfxState.o +0 -0
- data/pdf2json-0.52-source/xpdf/GlobalParams.cc +2924 -0
- data/pdf2json-0.52-source/xpdf/GlobalParams.cc.old +2908 -0
- data/pdf2json-0.52-source/xpdf/GlobalParams.h +466 -0
- data/pdf2json-0.52-source/xpdf/GlobalParams.h.old +463 -0
- data/pdf2json-0.52-source/xpdf/GlobalParams.o +0 -0
- data/pdf2json-0.52-source/xpdf/ImageOutputDev.cc +195 -0
- data/pdf2json-0.52-source/xpdf/ImageOutputDev.h +76 -0
- data/pdf2json-0.52-source/xpdf/ImageOutputDev.o +0 -0
- data/pdf2json-0.52-source/xpdf/JArithmeticDecoder.cc +322 -0
- data/pdf2json-0.52-source/xpdf/JArithmeticDecoder.h +109 -0
- data/pdf2json-0.52-source/xpdf/JArithmeticDecoder.o +0 -0
- data/pdf2json-0.52-source/xpdf/JBIG2Stream.cc +3413 -0
- data/pdf2json-0.52-source/xpdf/JBIG2Stream.h +145 -0
- data/pdf2json-0.52-source/xpdf/JBIG2Stream.o +0 -0
- data/pdf2json-0.52-source/xpdf/JPXStream.cc +3144 -0
- data/pdf2json-0.52-source/xpdf/JPXStream.h +351 -0
- data/pdf2json-0.52-source/xpdf/JPXStream.o +0 -0
- data/pdf2json-0.52-source/xpdf/Lexer.cc +485 -0
- data/pdf2json-0.52-source/xpdf/Lexer.h +80 -0
- data/pdf2json-0.52-source/xpdf/Lexer.o +0 -0
- data/pdf2json-0.52-source/xpdf/Link.cc +806 -0
- data/pdf2json-0.52-source/xpdf/Link.cc.old +784 -0
- data/pdf2json-0.52-source/xpdf/Link.h +415 -0
- data/pdf2json-0.52-source/xpdf/Link.h.old +369 -0
- data/pdf2json-0.52-source/xpdf/Link.o +0 -0
- data/pdf2json-0.52-source/xpdf/Makefile +232 -0
- data/pdf2json-0.52-source/xpdf/Makefile.dep +0 -0
- data/pdf2json-0.52-source/xpdf/Makefile.in +232 -0
- data/pdf2json-0.52-source/xpdf/NameToCharCode.cc +116 -0
- data/pdf2json-0.52-source/xpdf/NameToCharCode.h +42 -0
- data/pdf2json-0.52-source/xpdf/NameToCharCode.o +0 -0
- data/pdf2json-0.52-source/xpdf/NameToUnicodeTable.h +1097 -0
- data/pdf2json-0.52-source/xpdf/Object.cc +231 -0
- data/pdf2json-0.52-source/xpdf/Object.h +303 -0
- data/pdf2json-0.52-source/xpdf/Object.o +0 -0
- data/pdf2json-0.52-source/xpdf/Outline.cc +151 -0
- data/pdf2json-0.52-source/xpdf/Outline.h +76 -0
- data/pdf2json-0.52-source/xpdf/Outline.o +0 -0
- data/pdf2json-0.52-source/xpdf/OutputDev.cc +131 -0
- data/pdf2json-0.52-source/xpdf/OutputDev.h +253 -0
- data/pdf2json-0.52-source/xpdf/OutputDev.o +0 -0
- data/pdf2json-0.52-source/xpdf/PDFCore.cc +2044 -0
- data/pdf2json-0.52-source/xpdf/PDFCore.h +321 -0
- data/pdf2json-0.52-source/xpdf/PDFDoc.cc +404 -0
- data/pdf2json-0.52-source/xpdf/PDFDoc.h +183 -0
- data/pdf2json-0.52-source/xpdf/PDFDoc.o +0 -0
- data/pdf2json-0.52-source/xpdf/PDFDocEncoding.cc +44 -0
- data/pdf2json-0.52-source/xpdf/PDFDocEncoding.h +16 -0
- data/pdf2json-0.52-source/xpdf/PDFDocEncoding.o +0 -0
- data/pdf2json-0.52-source/xpdf/PSOutputDev.cc +6224 -0
- data/pdf2json-0.52-source/xpdf/PSOutputDev.h +395 -0
- data/pdf2json-0.52-source/xpdf/PSOutputDev.o +0 -0
- data/pdf2json-0.52-source/xpdf/PSTokenizer.cc +135 -0
- data/pdf2json-0.52-source/xpdf/PSTokenizer.h +41 -0
- data/pdf2json-0.52-source/xpdf/PSTokenizer.o +0 -0
- data/pdf2json-0.52-source/xpdf/Page.cc +454 -0
- data/pdf2json-0.52-source/xpdf/Page.h +187 -0
- data/pdf2json-0.52-source/xpdf/Page.o +0 -0
- data/pdf2json-0.52-source/xpdf/Parser.cc +227 -0
- data/pdf2json-0.52-source/xpdf/Parser.h +59 -0
- data/pdf2json-0.52-source/xpdf/Parser.o +0 -0
- data/pdf2json-0.52-source/xpdf/PreScanOutputDev.cc +257 -0
- data/pdf2json-0.52-source/xpdf/PreScanOutputDev.h +130 -0
- data/pdf2json-0.52-source/xpdf/PreScanOutputDev.o +0 -0
- data/pdf2json-0.52-source/xpdf/SecurityHandler.cc +390 -0
- data/pdf2json-0.52-source/xpdf/SecurityHandler.h +160 -0
- data/pdf2json-0.52-source/xpdf/SecurityHandler.o +0 -0
- data/pdf2json-0.52-source/xpdf/SplashOutputDev.cc +2845 -0
- data/pdf2json-0.52-source/xpdf/SplashOutputDev.h +247 -0
- data/pdf2json-0.52-source/xpdf/SplashOutputDev.o +0 -0
- data/pdf2json-0.52-source/xpdf/Stream-CCITT.h +459 -0
- data/pdf2json-0.52-source/xpdf/Stream.cc +4627 -0
- data/pdf2json-0.52-source/xpdf/Stream.h +858 -0
- data/pdf2json-0.52-source/xpdf/Stream.o +0 -0
- data/pdf2json-0.52-source/xpdf/TextOutputDev.cc +4090 -0
- data/pdf2json-0.52-source/xpdf/TextOutputDev.h +661 -0
- data/pdf2json-0.52-source/xpdf/TextOutputDev.o +0 -0
- data/pdf2json-0.52-source/xpdf/UTF8.h +56 -0
- data/pdf2json-0.52-source/xpdf/UnicodeMap.cc +302 -0
- data/pdf2json-0.52-source/xpdf/UnicodeMap.cc.old +293 -0
- data/pdf2json-0.52-source/xpdf/UnicodeMap.h +135 -0
- data/pdf2json-0.52-source/xpdf/UnicodeMap.h.old +123 -0
- data/pdf2json-0.52-source/xpdf/UnicodeMap.o +0 -0
- data/pdf2json-0.52-source/xpdf/UnicodeMapTables.h +361 -0
- data/pdf2json-0.52-source/xpdf/UnicodeTypeTable.cc +949 -0
- data/pdf2json-0.52-source/xpdf/UnicodeTypeTable.h +20 -0
- data/pdf2json-0.52-source/xpdf/UnicodeTypeTable.o +0 -0
- data/pdf2json-0.52-source/xpdf/XPDFApp.cc +447 -0
- data/pdf2json-0.52-source/xpdf/XPDFApp.h +114 -0
- data/pdf2json-0.52-source/xpdf/XPDFCore.cc +1655 -0
- data/pdf2json-0.52-source/xpdf/XPDFCore.h +251 -0
- data/pdf2json-0.52-source/xpdf/XPDFTree.cc +931 -0
- data/pdf2json-0.52-source/xpdf/XPDFTree.h +45 -0
- data/pdf2json-0.52-source/xpdf/XPDFTreeP.h +87 -0
- data/pdf2json-0.52-source/xpdf/XPDFViewer.cc +3488 -0
- data/pdf2json-0.52-source/xpdf/XPDFViewer.h +352 -0
- data/pdf2json-0.52-source/xpdf/XRef.cc +896 -0
- data/pdf2json-0.52-source/xpdf/XRef.h +133 -0
- data/pdf2json-0.52-source/xpdf/XRef.o +0 -0
- data/pdf2json-0.52-source/xpdf/XpdfPluginAPI.cc +262 -0
- data/pdf2json-0.52-source/xpdf/XpdfPluginAPI.h +341 -0
- data/pdf2json-0.52-source/xpdf/XpdfPluginAPI.o +0 -0
- data/pdf2json-0.52-source/xpdf/about-text.h +48 -0
- data/pdf2json-0.52-source/xpdf/about.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/backArrow.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/backArrowDis.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/config.h +112 -0
- data/pdf2json-0.52-source/xpdf/dblLeftArrow.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/dblLeftArrowDis.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/dblRightArrow.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/dblRightArrowDis.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/find.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/findDis.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/forwardArrow.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/forwardArrowDis.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/leftArrow.xbm +5 -0
- data/pdf2json-0.52-source/xpdf/leftArrowDis.xbm +5 -0
- data/pdf2json-0.52-source/xpdf/libXpdf.a +0 -0
- data/pdf2json-0.52-source/xpdf/pdffonts +0 -0
- data/pdf2json-0.52-source/xpdf/pdffonts.cc +298 -0
- data/pdf2json-0.52-source/xpdf/pdffonts.o +0 -0
- data/pdf2json-0.52-source/xpdf/pdfimages +0 -0
- data/pdf2json-0.52-source/xpdf/pdfimages.cc +155 -0
- data/pdf2json-0.52-source/xpdf/pdfimages.o +0 -0
- data/pdf2json-0.52-source/xpdf/pdfinfo +0 -0
- data/pdf2json-0.52-source/xpdf/pdfinfo.cc +387 -0
- data/pdf2json-0.52-source/xpdf/pdfinfo.o +0 -0
- data/pdf2json-0.52-source/xpdf/pdftoppm.cc +203 -0
- data/pdf2json-0.52-source/xpdf/pdftops +0 -0
- data/pdf2json-0.52-source/xpdf/pdftops.cc +344 -0
- data/pdf2json-0.52-source/xpdf/pdftops.o +0 -0
- data/pdf2json-0.52-source/xpdf/pdftotext +0 -0
- data/pdf2json-0.52-source/xpdf/pdftotext.cc +333 -0
- data/pdf2json-0.52-source/xpdf/pdftotext.o +0 -0
- data/pdf2json-0.52-source/xpdf/print.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/printDis.xbm +6 -0
- data/pdf2json-0.52-source/xpdf/rightArrow.xbm +5 -0
- data/pdf2json-0.52-source/xpdf/rightArrowDis.xbm +5 -0
- data/pdf2json-0.52-source/xpdf/vms_make.com +129 -0
- data/pdf2json-0.52-source/xpdf/xpdf.cc +344 -0
- data/pdf2json-0.52-source/xpdf/xpdfIcon.xpm +62 -0
- data/pdf2json.gemspec +29 -0
- metadata +518 -0
@@ -0,0 +1,91 @@
|
|
1
|
+
#ifndef _XML_FONTS_H
|
2
|
+
#define _XML_FONTS_H
|
3
|
+
#include "GVector.h"
|
4
|
+
#include "GString.h"
|
5
|
+
#include "GfxState.h"
|
6
|
+
#include "CharTypes.h"
|
7
|
+
|
8
|
+
|
9
|
+
class XmlFontColor{
|
10
|
+
private:
|
11
|
+
unsigned int r;
|
12
|
+
unsigned int g;
|
13
|
+
unsigned int b;
|
14
|
+
GBool Ok(unsigned int xcol){ return ((xcol<=255)&&(xcol>=0));}
|
15
|
+
GString *convtoX(unsigned int xcol) const;
|
16
|
+
public:
|
17
|
+
XmlFontColor():r(0),g(0),b(0){}
|
18
|
+
XmlFontColor(GfxRGB rgb);
|
19
|
+
XmlFontColor(const XmlFontColor& x){r=x.r;g=x.g;b=x.b;}
|
20
|
+
XmlFontColor& operator=(const XmlFontColor &x){
|
21
|
+
r=x.r;g=x.g;b=x.b;
|
22
|
+
return *this;
|
23
|
+
}
|
24
|
+
~XmlFontColor(){};
|
25
|
+
GString* toString() const;
|
26
|
+
GBool isEqual(const XmlFontColor& col) const{
|
27
|
+
return ((r==col.r)&&(g==col.g)&&(b==col.b));
|
28
|
+
}
|
29
|
+
} ;
|
30
|
+
|
31
|
+
|
32
|
+
class XmlFont{
|
33
|
+
private:
|
34
|
+
unsigned int size;
|
35
|
+
double charspace;
|
36
|
+
int lineSize;
|
37
|
+
GBool italic;
|
38
|
+
GBool bold;
|
39
|
+
GBool oblique;
|
40
|
+
int pos; // position of the font name in the fonts array
|
41
|
+
static GString *DefaultFont;
|
42
|
+
GString *FontName;
|
43
|
+
XmlFontColor color;
|
44
|
+
static GString* HtmlFilter(Unicode* u, int uLen); //char* s);
|
45
|
+
public:
|
46
|
+
|
47
|
+
XmlFont(){FontName=NULL;};
|
48
|
+
XmlFont(GString* fontname,int _size,double _charspace, GfxRGB rgb);
|
49
|
+
XmlFont(const XmlFont& x);
|
50
|
+
XmlFont& operator=(const XmlFont& x);
|
51
|
+
XmlFontColor getColor() const {return color;}
|
52
|
+
~XmlFont();
|
53
|
+
static void clear();
|
54
|
+
GString* getFullName();
|
55
|
+
GBool isItalic() const {return italic;}
|
56
|
+
GBool isBold() const {return bold;}
|
57
|
+
GBool isOblique() const {return oblique;}
|
58
|
+
unsigned int getSize() const {return size;}
|
59
|
+
int getLineSize() const {return lineSize;}
|
60
|
+
void setLineSize(int _lineSize) { lineSize = _lineSize; }
|
61
|
+
GString* getFontName();
|
62
|
+
double getCharSpace() const {return charspace;}
|
63
|
+
void setCharSpace(double _charspace){charspace = _charspace;}
|
64
|
+
static GString* getDefaultFont();
|
65
|
+
static void setDefaultFont(GString* defaultFont);
|
66
|
+
GBool isEqual(const XmlFont& x) const;
|
67
|
+
GBool isEqualIgnoreBold(const XmlFont& x) const;
|
68
|
+
static GString* simple(XmlFont *font, Unicode *content, int uLen);
|
69
|
+
void print() const {printf("font: %s %d %s%spos: %d\n", FontName->getCString(), size, bold ? "bold " : "", italic ? "italic " : "", pos);};
|
70
|
+
};
|
71
|
+
|
72
|
+
class XmlFontAccu{
|
73
|
+
private:
|
74
|
+
GVector<XmlFont> *accu;
|
75
|
+
|
76
|
+
public:
|
77
|
+
XmlFontAccu();
|
78
|
+
~XmlFontAccu();
|
79
|
+
int AddFont(const XmlFont& font);
|
80
|
+
XmlFont* Get(int i){
|
81
|
+
GVector<XmlFont>::iterator g=accu->begin();
|
82
|
+
g+=i;
|
83
|
+
return g;
|
84
|
+
}
|
85
|
+
GString* getCSStyle (int i, GString* content);
|
86
|
+
/* GString* EscapeSpecialChars(GString* content); */
|
87
|
+
GString* CSStyle(int i,GBool textAsJSON);
|
88
|
+
int size() const {return accu->size();}
|
89
|
+
|
90
|
+
};
|
91
|
+
#endif
|
Binary file
|
@@ -0,0 +1,101 @@
|
|
1
|
+
#include "XmlLinks.h"
|
2
|
+
|
3
|
+
XmlLink::XmlLink(const XmlLink& x){
|
4
|
+
Xmin=x.Xmin;
|
5
|
+
Ymin=x.Ymin;
|
6
|
+
Xmax=x.Xmax;
|
7
|
+
Ymax=x.Ymax;
|
8
|
+
dest=new GString(x.dest);
|
9
|
+
}
|
10
|
+
|
11
|
+
XmlLink::XmlLink(double xmin,double ymin,double xmax,double ymax,GString * _dest)
|
12
|
+
{
|
13
|
+
if (xmin < xmax) {
|
14
|
+
Xmin=xmin;
|
15
|
+
Xmax=xmax;
|
16
|
+
} else {
|
17
|
+
Xmin=xmax;
|
18
|
+
Xmax=xmin;
|
19
|
+
}
|
20
|
+
if (ymin < ymax) {
|
21
|
+
Ymin=ymin;
|
22
|
+
Ymax=ymax;
|
23
|
+
} else {
|
24
|
+
Ymin=ymax;
|
25
|
+
Ymax=ymin;
|
26
|
+
}
|
27
|
+
dest=new GString(_dest);
|
28
|
+
}
|
29
|
+
|
30
|
+
XmlLink::~XmlLink(){
|
31
|
+
if (dest) delete dest;
|
32
|
+
}
|
33
|
+
|
34
|
+
GBool XmlLink::isEqualDest(const XmlLink& x) const{
|
35
|
+
return (!strcmp(dest->getCString(), x.dest->getCString()));
|
36
|
+
}
|
37
|
+
|
38
|
+
GBool XmlLink::inLink(double xmin,double ymin,double xmax,double ymax) const {
|
39
|
+
double y=(ymin+ymax)/2;
|
40
|
+
if (y>Ymax) return gFalse;
|
41
|
+
return (y>Ymin)&&(xmin<Xmax)&&(xmax>Xmin);
|
42
|
+
}
|
43
|
+
|
44
|
+
|
45
|
+
XmlLink& XmlLink::operator=(const XmlLink& x){
|
46
|
+
if (this==&x) return *this;
|
47
|
+
if (dest) {delete dest;dest=NULL;}
|
48
|
+
Xmin=x.Xmin;
|
49
|
+
Ymin=x.Ymin;
|
50
|
+
Xmax=x.Xmax;
|
51
|
+
Ymax=x.Ymax;
|
52
|
+
dest=new GString(x.dest);
|
53
|
+
return *this;
|
54
|
+
}
|
55
|
+
|
56
|
+
GString* XmlLink::getLinkStart() {
|
57
|
+
GString *res = new GString("");
|
58
|
+
res->append(dest);
|
59
|
+
// res->append("\">");
|
60
|
+
return res;
|
61
|
+
}
|
62
|
+
|
63
|
+
/*GString* XmlLink::Link(GString* content){
|
64
|
+
//GString* _dest=new GString(dest);
|
65
|
+
GString *tmp=new GString("<a href=\"");
|
66
|
+
tmp->append(dest);
|
67
|
+
tmp->append("\">");
|
68
|
+
tmp->append(content);
|
69
|
+
tmp->append("</a>");
|
70
|
+
//delete _dest;
|
71
|
+
return tmp;
|
72
|
+
}*/
|
73
|
+
|
74
|
+
|
75
|
+
|
76
|
+
XmlLinks::XmlLinks(){
|
77
|
+
accu=new GVector<XmlLink>();
|
78
|
+
}
|
79
|
+
|
80
|
+
XmlLinks::~XmlLinks(){
|
81
|
+
delete accu;
|
82
|
+
accu=NULL;
|
83
|
+
}
|
84
|
+
|
85
|
+
GBool XmlLinks::inLink(double xmin,double ymin,double xmax,double ymax,int& p)const {
|
86
|
+
|
87
|
+
for(GVector<XmlLink>::iterator i=accu->begin();i!=accu->end();i++){
|
88
|
+
if (i->inLink(xmin,ymin,xmax,ymax)) {
|
89
|
+
p=(i - accu->begin());
|
90
|
+
return 1;
|
91
|
+
}
|
92
|
+
}
|
93
|
+
return 0;
|
94
|
+
}
|
95
|
+
|
96
|
+
XmlLink* XmlLinks::getLink(int i) const{
|
97
|
+
GVector<XmlLink>::iterator g=accu->begin();
|
98
|
+
g+=i;
|
99
|
+
return g;
|
100
|
+
}
|
101
|
+
|
@@ -0,0 +1,54 @@
|
|
1
|
+
#ifndef _HTML_LINKS
|
2
|
+
#define _HTML_LINKS
|
3
|
+
|
4
|
+
#include "GVector.h"
|
5
|
+
#include "GString.h"
|
6
|
+
#include <stdio.h>
|
7
|
+
#include <stdlib.h>
|
8
|
+
#include <string.h>
|
9
|
+
#ifndef _WIN32
|
10
|
+
#include <sys/unistd.h>
|
11
|
+
#endif
|
12
|
+
|
13
|
+
class XmlLink{
|
14
|
+
|
15
|
+
private:
|
16
|
+
double Xmin;
|
17
|
+
double Ymin;
|
18
|
+
double Xmax;
|
19
|
+
double Ymax;
|
20
|
+
GString* dest;
|
21
|
+
|
22
|
+
public:
|
23
|
+
XmlLink(){dest=NULL;}
|
24
|
+
XmlLink(const XmlLink& x);
|
25
|
+
XmlLink& operator=(const XmlLink& x);
|
26
|
+
XmlLink(double xmin,double ymin,double xmax,double ymax,GString *_dest);
|
27
|
+
~XmlLink();
|
28
|
+
//GBool XmlLink::isEqualDest(const XmlLink& x) const; // this kills gcc 4.*
|
29
|
+
GBool isEqualDest(const XmlLink& x) const;
|
30
|
+
GString *getDest(){return new GString(dest);}
|
31
|
+
double getX1() const {return Xmin;}
|
32
|
+
double getX2() const {return Xmax;}
|
33
|
+
double getY1() const {return Ymin;}
|
34
|
+
double getY2() const {return Ymax;}
|
35
|
+
GBool inLink(double xmin,double ymin,double xmax,double ymax) const ;
|
36
|
+
//GString *Link(GString *content);
|
37
|
+
GString* getLinkStart();
|
38
|
+
|
39
|
+
};
|
40
|
+
|
41
|
+
class XmlLinks{
|
42
|
+
private:
|
43
|
+
GVector<XmlLink> *accu;
|
44
|
+
public:
|
45
|
+
XmlLinks();
|
46
|
+
~XmlLinks();
|
47
|
+
void AddLink(const XmlLink& x) {accu->push_back(x);}
|
48
|
+
GBool inLink(double xmin,double ymin,double xmax,double ymax,int& p) const;
|
49
|
+
XmlLink* getLink(int i) const;
|
50
|
+
|
51
|
+
};
|
52
|
+
|
53
|
+
#endif
|
54
|
+
|
Binary file
|
Binary file
|
@@ -0,0 +1,343 @@
|
|
1
|
+
//========================================================================
|
2
|
+
//
|
3
|
+
// pdf2json.cc
|
4
|
+
//
|
5
|
+
//
|
6
|
+
// Copyright 2011 Devaldi Ltd
|
7
|
+
//
|
8
|
+
// Copyright 1997-2002 Glyph & Cog, LLC
|
9
|
+
//
|
10
|
+
// Changed 1999-2000 by G.Ovtcharov
|
11
|
+
//
|
12
|
+
// Changed 2002 by Mikhail Kruk
|
13
|
+
//========================================================================
|
14
|
+
|
15
|
+
#include <stdio.h>
|
16
|
+
#include <stdlib.h>
|
17
|
+
#include <stddef.h>
|
18
|
+
#include <string.h>
|
19
|
+
#include <aconf.h>
|
20
|
+
#include <time.h>
|
21
|
+
#include "parseargs.h"
|
22
|
+
#include "GString.h"
|
23
|
+
#include "gmem.h"
|
24
|
+
#include "Object.h"
|
25
|
+
#include "Stream.h"
|
26
|
+
#include "Array.h"
|
27
|
+
#include "Dict.h"
|
28
|
+
#include "XRef.h"
|
29
|
+
#include "Catalog.h"
|
30
|
+
#include "Page.h"
|
31
|
+
#include "PDFDoc.h"
|
32
|
+
#include "ImgOutputDev.h"
|
33
|
+
#include "GlobalParams.h"
|
34
|
+
#include "Error.h"
|
35
|
+
#include "config.h"
|
36
|
+
#include "gfile.h"
|
37
|
+
|
38
|
+
static int firstPage = 1;
|
39
|
+
static int lastPage = 0;
|
40
|
+
static GBool rawOrder = gTrue;
|
41
|
+
static GBool textAsJSON = gTrue;
|
42
|
+
static GBool compressData = gFalse;
|
43
|
+
GBool printCommands = gTrue;
|
44
|
+
static GBool printHelp = gFalse;
|
45
|
+
GBool printHtml = gFalse;
|
46
|
+
GBool complexMode=gTrue;
|
47
|
+
GBool ignore=gFalse;
|
48
|
+
double scale=1.5;
|
49
|
+
GBool noframes=gFalse;
|
50
|
+
GBool stout=gFalse;
|
51
|
+
GBool xml=gFalse;
|
52
|
+
GBool errQuiet=gFalse;
|
53
|
+
|
54
|
+
GBool showHidden = gFalse;
|
55
|
+
GBool noMerge = gTrue;
|
56
|
+
static char ownerPassword[33] = "";
|
57
|
+
static char userPassword[33] = "";
|
58
|
+
static char gsDevice[33] = "png16m";
|
59
|
+
static GBool printVersion = gFalse;
|
60
|
+
|
61
|
+
static GString* getInfoString(Dict *infoDict, char *key);
|
62
|
+
static GString* getInfoDate(Dict *infoDict, char *key);
|
63
|
+
|
64
|
+
static char textEncName[128] = "";
|
65
|
+
|
66
|
+
static ArgDesc argDesc[] = {
|
67
|
+
{"-f", argInt, &firstPage, 0,
|
68
|
+
"first page to convert"},
|
69
|
+
{"-l", argInt, &lastPage, 0,
|
70
|
+
"last page to convert"},
|
71
|
+
{"-compress", argFlag, &compressData, 0,
|
72
|
+
"Use compressed mode"},
|
73
|
+
{"-q", argFlag, &errQuiet, 0,
|
74
|
+
"don't print any messages or errors"},
|
75
|
+
{"-h", argFlag, &printHelp, 0,
|
76
|
+
"print usage information"},
|
77
|
+
{"-help", argFlag, &printHelp, 0,
|
78
|
+
"print usage information"},
|
79
|
+
{"-i", argFlag, &ignore, 0,
|
80
|
+
"ignore images"},
|
81
|
+
{"-noframes", argFlag, &noframes, 0,
|
82
|
+
"use standard output"},
|
83
|
+
/* {"-zoom", argFP, &scale, 0,
|
84
|
+
"zoom the pdf document (default 1.5)"}, */
|
85
|
+
{"-xml", argFlag, &xml, 0,
|
86
|
+
"output for XML post-processing"},
|
87
|
+
{"-hidden", argFlag, &showHidden, 0,
|
88
|
+
"output hidden text"},
|
89
|
+
{"-enc", argString, textEncName, sizeof(textEncName),
|
90
|
+
"output text encoding name"},
|
91
|
+
{"-v", argFlag, &printVersion, 0,
|
92
|
+
"print copyright and version info"},
|
93
|
+
{"-opw", argString, ownerPassword, sizeof(ownerPassword),
|
94
|
+
"owner password (for encrypted files)"},
|
95
|
+
{"-upw", argString, userPassword, sizeof(userPassword),
|
96
|
+
"user password (for encrypted files)"},
|
97
|
+
{NULL}
|
98
|
+
};
|
99
|
+
|
100
|
+
int main(int argc, char *argv[]) {
|
101
|
+
PDFDoc *doc = NULL;
|
102
|
+
GString *fileName = NULL;
|
103
|
+
GString *docTitle = NULL;
|
104
|
+
GString *author = NULL, *keywords = NULL, *subject = NULL, *date = NULL;
|
105
|
+
GString *htmlFileName = NULL;
|
106
|
+
ImgOutputDev *htmlOut = NULL;
|
107
|
+
//PSOutputDev *psOut = NULL;
|
108
|
+
GBool ok;
|
109
|
+
char *p;
|
110
|
+
char extension[16] = "png";
|
111
|
+
GString *ownerPW, *userPW;
|
112
|
+
Object info;
|
113
|
+
char * extsList[] = {"png", "jpeg", "bmp", "pcx", "tiff", "pbm", NULL};
|
114
|
+
|
115
|
+
// parse args
|
116
|
+
ok = parseArgs(argDesc, &argc, argv);
|
117
|
+
if (!ok || argc < 2 || argc > 3 || printHelp || printVersion) {
|
118
|
+
fprintf(stderr, "pdf2json version %s http://flexpaper.devaldi.com/pdf2json/, based on Xpdf version %s\n", "0.52", xpdfVersion);
|
119
|
+
fprintf(stderr, "%s\n", "Copyright 1999-2011 Devaldi Ltd, Gueorgui Ovtcharov and Rainer Dorsch");
|
120
|
+
fprintf(stderr, "%s\n\n", xpdfCopyright);
|
121
|
+
if (!printVersion) {
|
122
|
+
printUsage("pdf2json", "<PDF-file> [<xml-file>]", argDesc);
|
123
|
+
}
|
124
|
+
exit(1);
|
125
|
+
}
|
126
|
+
|
127
|
+
// read config file
|
128
|
+
globalParams = new GlobalParams("");
|
129
|
+
|
130
|
+
if (errQuiet) {
|
131
|
+
globalParams->setErrQuiet(errQuiet);
|
132
|
+
printCommands = gFalse; // I'm not 100% what is the differecne between them
|
133
|
+
}
|
134
|
+
|
135
|
+
if (textEncName[0]) {
|
136
|
+
globalParams->setTextEncoding(textEncName);
|
137
|
+
if( !globalParams->getTextEncoding() ) {
|
138
|
+
goto error;
|
139
|
+
}
|
140
|
+
}
|
141
|
+
|
142
|
+
// open PDF file
|
143
|
+
if (ownerPassword[0]) {
|
144
|
+
ownerPW = new GString(ownerPassword);
|
145
|
+
} else {
|
146
|
+
ownerPW = NULL;
|
147
|
+
}
|
148
|
+
if (userPassword[0]) {
|
149
|
+
userPW = new GString(userPassword);
|
150
|
+
} else {
|
151
|
+
userPW = NULL;
|
152
|
+
}
|
153
|
+
|
154
|
+
fileName = new GString(argv[1]);
|
155
|
+
|
156
|
+
doc = new PDFDoc(fileName, ownerPW, userPW);
|
157
|
+
if (userPW) {
|
158
|
+
delete userPW;
|
159
|
+
}
|
160
|
+
if (ownerPW) {
|
161
|
+
delete ownerPW;
|
162
|
+
}
|
163
|
+
if (!doc->isOk()) {
|
164
|
+
goto error;
|
165
|
+
}
|
166
|
+
|
167
|
+
// check for copy permission
|
168
|
+
if (!doc->okToCopy()) {
|
169
|
+
error(-1, "Copying of text from this document is not allowed.");
|
170
|
+
goto error;
|
171
|
+
}
|
172
|
+
|
173
|
+
// construct text file name
|
174
|
+
if (argc == 3) {
|
175
|
+
GString* tmp = new GString(argv[2]);
|
176
|
+
p=tmp->getCString()+tmp->getLength()-5;
|
177
|
+
|
178
|
+
if (!strcmp(p, ".xml") || !strcmp(p, ".XML"))
|
179
|
+
htmlFileName = new GString(tmp->getCString(),
|
180
|
+
tmp->getLength() - 5);
|
181
|
+
else htmlFileName =new GString(tmp);
|
182
|
+
|
183
|
+
delete tmp;
|
184
|
+
} else {
|
185
|
+
p = fileName->getCString() + fileName->getLength() - 4;
|
186
|
+
if (!strcmp(p, ".pdf") || !strcmp(p, ".PDF"))
|
187
|
+
htmlFileName = new GString(fileName->getCString(),
|
188
|
+
fileName->getLength() - 4);
|
189
|
+
else
|
190
|
+
htmlFileName = fileName->copy();
|
191
|
+
}
|
192
|
+
|
193
|
+
if (scale>3.0) scale=3.0;
|
194
|
+
if (scale<0.5) scale=0.5;
|
195
|
+
|
196
|
+
stout=gFalse;
|
197
|
+
complexMode = gTrue;
|
198
|
+
noframes = gTrue;
|
199
|
+
noMerge = gTrue;
|
200
|
+
|
201
|
+
// get page range
|
202
|
+
if (firstPage < 1)
|
203
|
+
firstPage = 1;
|
204
|
+
if (lastPage < 1 || lastPage > doc->getNumPages())
|
205
|
+
lastPage = doc->getNumPages();
|
206
|
+
|
207
|
+
doc->getDocInfo(&info);
|
208
|
+
if (info.isDict()) {
|
209
|
+
docTitle = getInfoString(info.getDict(), "Title");
|
210
|
+
author = getInfoString(info.getDict(), "Author");
|
211
|
+
keywords = getInfoString(info.getDict(), "Keywords");
|
212
|
+
subject = getInfoString(info.getDict(), "Subject");
|
213
|
+
date = getInfoDate(info.getDict(), "ModDate");
|
214
|
+
if( !date )
|
215
|
+
date = getInfoDate(info.getDict(), "CreationDate");
|
216
|
+
}
|
217
|
+
info.free();
|
218
|
+
if( !docTitle ) docTitle = new GString(htmlFileName);
|
219
|
+
|
220
|
+
/* determine extensions of output backgroun images */
|
221
|
+
{int i;
|
222
|
+
for(i = 0; extsList[i]; i++)
|
223
|
+
{
|
224
|
+
if( strstr(gsDevice, extsList[i]) != (char *) NULL )
|
225
|
+
{
|
226
|
+
strncpy(extension, extsList[i], sizeof(extension));
|
227
|
+
break;
|
228
|
+
}
|
229
|
+
}}
|
230
|
+
|
231
|
+
rawOrder = complexMode; // todo: figure out what exactly rawOrder do :)
|
232
|
+
|
233
|
+
if(textAsJSON)
|
234
|
+
xml = gTrue;
|
235
|
+
|
236
|
+
// write text file
|
237
|
+
htmlOut = new ImgOutputDev(htmlFileName->getCString(),
|
238
|
+
docTitle->getCString(),
|
239
|
+
author ? author->getCString() : NULL,
|
240
|
+
keywords ? keywords->getCString() : NULL,
|
241
|
+
subject ? subject->getCString() : NULL,
|
242
|
+
date ? date->getCString() : NULL,
|
243
|
+
extension,
|
244
|
+
rawOrder,
|
245
|
+
textAsJSON,
|
246
|
+
compressData,
|
247
|
+
firstPage,
|
248
|
+
doc->getCatalog()->getOutline()->isDict(),
|
249
|
+
doc->getNumPages());
|
250
|
+
delete docTitle;
|
251
|
+
if( author )
|
252
|
+
{
|
253
|
+
delete author;
|
254
|
+
}
|
255
|
+
if( keywords )
|
256
|
+
{
|
257
|
+
delete keywords;
|
258
|
+
}
|
259
|
+
if( subject )
|
260
|
+
{
|
261
|
+
delete subject;
|
262
|
+
}
|
263
|
+
if( date )
|
264
|
+
{
|
265
|
+
delete date;
|
266
|
+
}
|
267
|
+
|
268
|
+
if (htmlOut->isOk())
|
269
|
+
{
|
270
|
+
doc->displayPages(htmlOut, firstPage, lastPage, static_cast<int>(72*scale), static_cast<int>(72*scale), 0, gTrue, gTrue,gTrue,NULL);
|
271
|
+
|
272
|
+
if (!xml)
|
273
|
+
{
|
274
|
+
htmlOut->dumpDocOutline(doc->getCatalog());
|
275
|
+
}
|
276
|
+
}
|
277
|
+
|
278
|
+
delete htmlOut;
|
279
|
+
|
280
|
+
// clean up
|
281
|
+
error:
|
282
|
+
if(doc) delete doc;
|
283
|
+
if(globalParams) delete globalParams;
|
284
|
+
|
285
|
+
if(htmlFileName) delete htmlFileName;
|
286
|
+
XmlFont::clear();
|
287
|
+
|
288
|
+
// check for memory leaks
|
289
|
+
Object::memCheck(stderr);
|
290
|
+
gMemReport(stderr);
|
291
|
+
|
292
|
+
return 0;
|
293
|
+
}
|
294
|
+
|
295
|
+
static GString* getInfoString(Dict *infoDict, char *key) {
|
296
|
+
Object obj;
|
297
|
+
GString *s1 = NULL;
|
298
|
+
|
299
|
+
if (infoDict->lookup(key, &obj)->isString()) {
|
300
|
+
s1 = new GString(obj.getString());
|
301
|
+
}
|
302
|
+
obj.free();
|
303
|
+
return s1;
|
304
|
+
}
|
305
|
+
|
306
|
+
static GString* getInfoDate(Dict *infoDict, char *key) {
|
307
|
+
Object obj;
|
308
|
+
char *s;
|
309
|
+
int year, mon, day, hour, min, sec;
|
310
|
+
struct tm tmStruct;
|
311
|
+
GString *result = NULL;
|
312
|
+
char buf[256];
|
313
|
+
|
314
|
+
if (infoDict->lookup(key, &obj)->isString()) {
|
315
|
+
s = obj.getString()->getCString();
|
316
|
+
if (s[0] == 'D' && s[1] == ':') {
|
317
|
+
s += 2;
|
318
|
+
}
|
319
|
+
if (sscanf(s, "%4d%2d%2d%2d%2d%2d",
|
320
|
+
&year, &mon, &day, &hour, &min, &sec) == 6) {
|
321
|
+
tmStruct.tm_year = year - 1900;
|
322
|
+
tmStruct.tm_mon = mon - 1;
|
323
|
+
tmStruct.tm_mday = day;
|
324
|
+
tmStruct.tm_hour = hour;
|
325
|
+
tmStruct.tm_min = min;
|
326
|
+
tmStruct.tm_sec = sec;
|
327
|
+
tmStruct.tm_wday = -1;
|
328
|
+
tmStruct.tm_yday = -1;
|
329
|
+
tmStruct.tm_isdst = -1;
|
330
|
+
mktime(&tmStruct); // compute the tm_wday and tm_yday fields
|
331
|
+
if (strftime(buf, sizeof(buf), "%Y-%m-%dT%H:%M:%S+00:00", &tmStruct)) {
|
332
|
+
result = new GString(buf);
|
333
|
+
} else {
|
334
|
+
result = new GString(s);
|
335
|
+
}
|
336
|
+
} else {
|
337
|
+
result = new GString(s);
|
338
|
+
}
|
339
|
+
}
|
340
|
+
obj.free();
|
341
|
+
return result;
|
342
|
+
}
|
343
|
+
|