rhocr 0.0.3 → 0.1

Sign up to get free protection for your applications and to get access to all the features.
data/test.html ADDED
@@ -0,0 +1 @@
1
+ <div class='ocr_page' style='position:absolute; top:0px; left:0px; height:1326px; width:1326px;;background-image: url(data/test.png); width:1326px; height:1326>px ;'><span class='ocrx_block' style='position:absolute; top:32px; left:55px; height:1855px; width:1080px;' ></span><span class='ocr_par' style='position:absolute; top:32px; left:432px; height:39px; width:685px;' ></span><span class='ocr_line' style='position:absolute; top:32px; left:432px; height:39px; width:685px;' ></span><span class='ocrx_word' style='position:absolute; top:32px; left:432px; height:35px; width:156px;'>Athenobius</span><span class='ocrx_word' style='position:absolute; top:48px; left:606px; height:6px; width:34px;'>—</span><span class='ocrx_word' style='position:absolute; top:34px; left:657px; height:28px; width:92px;'>Aulon.</span><span class='ocrx_word' style='position:absolute; top:37px; left:1074px; height:34px; width:43px;'>29</span><span class='ocr_par' style='position:absolute; top:109px; left:79px; height:80px; width:1040px;' ></span><span class='ocr_line' style='position:absolute; top:109px; left:79px; height:36px; width:1040px;' ></span><span class='ocrx_word' style='position:absolute; top:109px; left:79px; height:35px; width:215px;'>Athenobius,</span><span class='ocrx_word' style='position:absolute; top:112px; left:334px; height:27px; width:64px;'>Der</span><span class='ocrx_word' style='position:absolute; top:115px; left:417px; height:24px; width:59px;'>von</span><span class='ocrx_word' style='position:absolute; top:112px; left:494px; height:27px; width:51px;'>der</span><span class='ocrx_word' style='position:absolute; top:112px; left:565px; height:28px; width:122px;'>Göttin</span><span class='ocrx_word' style='position:absolute; top:112px; left:707px; height:28px; width:150px;'>Minerva</span><span class='ocrx_word' style='position:absolute; top:112px; left:876px; height:33px; width:78px;'>lebt,</span><span class='ocrx_word' style='position:absolute; top:112px; left:974px; height:28px; width:69px;'>oder:</span><span class='ocrx_word' style='position:absolute; top:112px; left:1062px; height:28px; width:57px;'>Mi»</span><span class='ocr_line' style='position:absolute; top:155px; left:108px; height:34px; width:192px;' ></span><span class='ocrx_word' style='position:absolute; top:159px; left:108px; height:23px; width:75px;'>nerva</span><span class='ocrx_word' style='position:absolute; top:155px; left:201px; height:34px; width:99px;'>Bogen.</span><span class='ocr_par' style='position:absolute; top:196px; left:74px; height:120px; width:1043px;' ></span><span class='ocr_line' style='position:absolute; top:196px; left:160px; height:36px; width:957px;' ></span><span class='ocrx_word' style='position:absolute; top:198px; left:160px; height:27px; width:54px;'>Des</span><span class='ocrx_word' style='position:absolute; top:197px; left:242px; height:33px; width:98px;'>Königs</span><span class='ocrx_word' style='position:absolute; top:196px; left:367px; height:34px; width:136px;'>Antiochus</span><span class='ocrx_word' style='position:absolute; top:197px; left:531px; height:33px; width:95px;'>Freund</span><span class='ocrx_word' style='position:absolute; top:197px; left:655px; height:28px; width:58px;'>oder</span><span class='ocrx_word' style='position:absolute; top:196px; left:739px; height:36px; width:119px;'>geheimer</span><span class='ocrx_word' style='position:absolute; top:196px; left:885px; height:34px; width:78px;'>Nath.</span><span class='ocrx_word' style='position:absolute; top:199px; left:994px; height:25px; width:11px;'>l</span><span class='ocrx_word' style='position:absolute; top:197px; left:1033px; height:29px; width:84px;'>Mack.</span><span class='ocr_line' style='position:absolute; top:241px; left:109px; height:33px; width:97px;' ></span><span class='ocrx_word' style='position:absolute; top:241px; left:109px; height:33px; width:38px;'>15,</span><span class='ocrx_word' style='position:absolute; top:242px; left:166px; height:25px; width:40px;'>28.</span><span class='ocr_line' style='position:absolute; top:281px; left:74px; height:35px; width:1042px;' ></span><span class='ocrx_word' style='position:absolute; top:281px; left:74px; height:34px; width:131px;'>Athlai.</span><span class='ocrx_word' style='position:absolute; top:284px; left:242px; height:26px; width:68px;'>Dee</span><span class='ocrx_word' style='position:absolute; top:282px; left:337px; height:33px; width:80px;'>Herr</span><span class='ocrx_word' style='position:absolute; top:281px; left:440px; height:34px; width:158px;'>zerreißet</span><span class='ocrx_word' style='position:absolute; top:282px; left:625px; height:28px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:282px; left:706px; height:34px; width:158px;'>zerbricht.</span><span class='ocrx_word' style='position:absolute; top:282px; left:898px; height:28px; width:77px;'>Einer</span><span class='ocrx_word' style='position:absolute; top:286px; left:999px; height:24px; width:51px;'>von</span><span class='ocrx_word' style='position:absolute; top:282px; left:1069px; height:28px; width:47px;'>den</span><span class='ocr_par' style='position:absolute; top:324px; left:74px; height:77px; width:1040px;' ></span><span class='ocr_line' style='position:absolute; top:324px; left:107px; height:33px; width:487px;' ></span><span class='ocrx_word' style='position:absolute; top:325px; left:107px; height:32px; width:174px;'>Nachlommen</span><span class='ocrx_word' style='position:absolute; top:324px; left:300px; height:28px; width:92px;'>Bebai.</span><span class='ocrx_word' style='position:absolute; top:324px; left:410px; height:32px; width:62px;'>Esra</span><span class='ocrx_word' style='position:absolute; top:327px; left:496px; height:28px; width:37px;'>10,</span><span class='ocrx_word' style='position:absolute; top:326px; left:553px; height:25px; width:41px;'>28.</span><span class='ocr_line' style='position:absolute; top:366px; left:74px; height:35px; width:1040px;' ></span><span class='ocrx_word' style='position:absolute; top:366px; left:74px; height:34px; width:115px;'>Athni.</span><span class='ocrx_word' style='position:absolute; top:368px; left:217px; height:27px; width:79px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:367px; left:315px; height:34px; width:135px;'>Trübsal</span><span class='ocrx_word' style='position:absolute; top:372px; left:469px; height:22px; width:59px;'>von</span><span class='ocrx_word' style='position:absolute; top:366px; left:548px; height:28px; width:90px;'>Gott.</span><span class='ocrx_word' style='position:absolute; top:366px; left:673px; height:28px; width:49px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:366px; left:742px; height:34px; width:77px;'>Sohn</span><span class='ocrx_word' style='position:absolute; top:366px; left:838px; height:34px; width:116px;'>Semaja.</span><span class='ocrx_word' style='position:absolute; top:369px; left:986px; height:25px; width:12px;'>1</span><span class='ocrx_word' style='position:absolute; top:368px; left:1018px; height:32px; width:96px;'>Chron.</span><span class='ocr_par' style='position:absolute; top:412px; left:71px; height:76px; width:1041px;' ></span><span class='ocr_line' style='position:absolute; top:412px; left:104px; height:28px; width:83px;' ></span><span class='ocrx_word' style='position:absolute; top:412px; left:104px; height:28px; width:40px;'>27.</span><span class='ocrx_word' style='position:absolute; top:413px; left:163px; height:25px; width:24px;'>7.</span><span class='ocr_line' style='position:absolute; top:451px; left:71px; height:37px; width:1041px;' ></span><span class='ocrx_word' style='position:absolute; top:451px; left:71px; height:34px; width:146px;'>Athniel.</span><span class='ocrx_word' style='position:absolute; top:452px; left:246px; height:27px; width:118px;'>Gottes</span><span class='ocrx_word' style='position:absolute; top:451px; left:384px; height:33px; width:147px;'>Trübsal,</span><span class='ocrx_word' style='position:absolute; top:451px; left:550px; height:28px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:451px; left:591px; height:28px; width:17px;'>i.</span><span class='ocrx_word' style='position:absolute; top:451px; left:627px; height:28px; width:54px;'>eine</span><span class='ocrx_word' style='position:absolute; top:451px; left:699px; height:33px; width:120px;'>Trübsal,</span><span class='ocrx_word' style='position:absolute; top:459px; left:839px; height:20px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:452px; left:908px; height:28px; width:62px;'>Gott</span><span class='ocrx_word' style='position:absolute; top:452px; left:990px; height:36px; width:122px;'>zugesügt.</span><span class='ocr_par' style='position:absolute; top:494px; left:102px; height:34px; width:1008px;' ></span><span class='ocr_line' style='position:absolute; top:494px; left:102px; height:34px; width:1008px;' ></span><span class='ocrx_word' style='position:absolute; top:496px; left:102px; height:27px; width:50px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:495px; left:172px; height:31px; width:76px;'>Sohn</span><span class='ocrx_word' style='position:absolute; top:495px; left:268px; height:30px; width:94px;'>Kenas,</span><span class='ocrx_word' style='position:absolute; top:495px; left:380px; height:26px; width:44px;'>des</span><span class='ocrx_word' style='position:absolute; top:494px; left:445px; height:27px; width:112px;'>Bruders</span><span class='ocrx_word' style='position:absolute; top:494px; left:576px; height:32px; width:89px;'>Kaleb;</span><span class='ocrx_word' style='position:absolute; top:500px; left:693px; height:28px; width:105px;'>gewann</span><span class='ocrx_word' style='position:absolute; top:495px; left:818px; height:33px; width:98px;'>Kiriath</span><span class='ocrx_word' style='position:absolute; top:495px; left:936px; height:33px; width:106px;'>Sepher,</span><span class='ocrx_word' style='position:absolute; top:495px; left:1061px; height:28px; width:49px;'>und</span><span class='ocr_par' style='position:absolute; top:535px; left:68px; height:79px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:535px; left:100px; height:35px; width:937px;' ></span><span class='ocrx_word' style='position:absolute; top:538px; left:100px; height:27px; width:80px;'>damit</span><span class='ocrx_word' style='position:absolute; top:537px; left:199px; height:33px; width:82px;'>Achsa.</span><span class='ocrx_word' style='position:absolute; top:538px; left:300px; height:26px; width:36px;'>die</span><span class='ocrx_word' style='position:absolute; top:537px; left:356px; height:32px; width:98px;'>Tochter</span><span class='ocrx_word' style='position:absolute; top:535px; left:472px; height:32px; width:81px;'>seines</span><span class='ocrx_word' style='position:absolute; top:537px; left:574px; height:27px; width:100px;'>Betters</span><span class='ocrx_word' style='position:absolute; top:537px; left:694px; height:27px; width:86px;'>Kaleb.</span><span class='ocrx_word' style='position:absolute; top:536px; left:800px; height:34px; width:77px;'>Nicht,</span><span class='ocrx_word' style='position:absolute; top:540px; left:899px; height:29px; width:20px;'>1.</span><span class='ocrx_word' style='position:absolute; top:539px; left:940px; height:26px; width:38px;'>12.</span><span class='ocrx_word' style='position:absolute; top:539px; left:1000px; height:25px; width:37px;'>13.</span><span class='ocr_line' style='position:absolute; top:576px; left:68px; height:38px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:578px; left:68px; height:36px; width:308px;'>Atroth-Sophan,</span><span class='ocrx_word' style='position:absolute; top:580px; left:396px; height:26px; width:37px;'>die</span><span class='ocrx_word' style='position:absolute; top:580px; left:454px; height:27px; width:101px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:580px; left:580px; height:26px; width:53px;'>oder</span><span class='ocrx_word' style='position:absolute; top:579px; left:658px; height:30px; width:102px;'>Decke,</span><span class='ocrx_word' style='position:absolute; top:580px; left:785px; height:26px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:580px; left:860px; height:34px; width:177px;'>Bedeckung</span><span class='ocrx_word' style='position:absolute; top:576px; left:1057px; height:32px; width:62px;'>des'</span><span class='ocr_par' style='position:absolute; top:621px; left:100px; height:36px; width:1011px;' ></span><span class='ocr_line' style='position:absolute; top:621px; left:100px; height:36px; width:1011px;' ></span><span class='ocrx_word' style='position:absolute; top:624px; left:100px; height:33px; width:135px;'>Hügels.</span><span class='ocrx_word' style='position:absolute; top:623px; left:273px; height:27px; width:62px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:623px; left:355px; height:26px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:623px; left:456px; height:26px; width:40px;'>der</span><span class='ocrx_word' style='position:absolute; top:621px; left:515px; height:28px; width:141px;'>Rubeniten</span><span class='ocrx_word' style='position:absolute; top:621px; left:680px; height:27px; width:35px;'>im</span><span class='ocrx_word' style='position:absolute; top:622px; left:734px; height:34px; width:141px;'>Königreich</span><span class='ocrx_word' style='position:absolute; top:622px; left:895px; height:32px; width:97px;'>Sthon.</span><span class='ocrx_word' style='position:absolute; top:624px; left:1008px; height:26px; width:16px;'>4</span><span class='ocrx_word' style='position:absolute; top:623px; left:1043px; height:34px; width:68px;'>Mos.</span><span class='ocr_par' style='position:absolute; top:668px; left:67px; height:74px; width:1045px;' ></span><span class='ocr_line' style='position:absolute; top:668px; left:98px; height:30px; width:102px;' ></span><span class='ocrx_word' style='position:absolute; top:669px; left:98px; height:29px; width:41px;'>32,</span><span class='ocrx_word' style='position:absolute; top:668px; left:158px; height:25px; width:42px;'>35.</span><span class='ocr_line' style='position:absolute; top:706px; left:67px; height:36px; width:1045px;' ></span><span class='ocrx_word' style='position:absolute; top:707px; left:67px; height:35px; width:274px;'>AtrothAddar:</span><span class='ocrx_word' style='position:absolute; top:706px; left:356px; height:29px; width:62px;'>Die</span><span class='ocrx_word' style='position:absolute; top:707px; left:432px; height:27px; width:105px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:706px; left:551px; height:27px; width:110px;'>Addar</span><span class='ocrx_word' style='position:absolute; top:706px; left:675px; height:31px; width:54px;'>(des</span><span class='ocrx_word' style='position:absolute; top:706px; left:744px; height:33px; width:105px;'>Sohnes</span><span class='ocrx_word' style='position:absolute; top:706px; left:861px; height:34px; width:155px;'>Benjamin).</span><span class='ocrx_word' style='position:absolute; top:708px; left:1037px; height:33px; width:75px;'>Diese</span><span class='ocr_par' style='position:absolute; top:748px; left:98px; height:37px; width:1013px;' ></span><span class='ocr_line' style='position:absolute; top:748px; left:98px; height:37px; width:1013px;' ></span><span class='ocrx_word' style='position:absolute; top:752px; left:98px; height:28px; width:86px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:751px; left:202px; height:34px; width:98px;'>gehörte</span><span class='ocrx_word' style='position:absolute; top:750px; left:322px; height:27px; width:47px;'>den</span><span class='ocrx_word' style='position:absolute; top:748px; left:395px; height:33px; width:216px;'>Benjaminitern,</span><span class='ocrx_word' style='position:absolute; top:749px; left:635px; height:33px; width:43px;'>lag</span><span class='ocrx_word' style='position:absolute; top:748px; left:702px; height:27px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:749px; left:753px; height:27px; width:45px;'>den</span><span class='ocrx_word' style='position:absolute; top:749px; left:826px; height:35px; width:112px;'>Grenzen</span><span class='ocrx_word' style='position:absolute; top:750px; left:962px; height:33px; width:71px;'>Iuda</span><span class='ocrx_word' style='position:absolute; top:750px; left:1057px; height:28px; width:54px;'>tmd</span><span class='ocr_par' style='position:absolute; top:794px; left:64px; height:76px; width:1048px;' ></span><span class='ocr_line' style='position:absolute; top:794px; left:98px; height:31px; width:134px;' ></span><span class='ocrx_word' style='position:absolute; top:794px; left:98px; height:31px; width:134px;'>Ephraim.</span><span class='ocr_line' style='position:absolute; top:833px; left:64px; height:37px; width:1048px;' ></span><span class='ocrx_word' style='position:absolute; top:834px; left:64px; height:36px; width:355px;'>Atroth.Beth-Ioab,</span><span class='ocrx_word' style='position:absolute; top:836px; left:438px; height:26px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:835px; left:480px; height:27px; width:17px;'>i.</span><span class='ocrx_word' style='position:absolute; top:834px; left:517px; height:27px; width:48px;'>die</span><span class='ocrx_word' style='position:absolute; top:834px; left:584px; height:27px; width:104px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:833px; left:712px; height:28px; width:52px;'>des</span><span class='ocrx_word' style='position:absolute; top:833px; left:784px; height:33px; width:125px;'>Hauses</span><span class='ocrx_word' style='position:absolute; top:834px; left:926px; height:32px; width:94px;'>Ioab.</span><span class='ocrx_word' style='position:absolute; top:835px; left:1050px; height:28px; width:62px;'>Eine</span><span class='ocr_par' style='position:absolute; top:876px; left:101px; height:35px; width:1012px;' ></span><span class='ocr_line' style='position:absolute; top:876px; left:101px; height:35px; width:1012px;' ></span><span class='ocrx_word' style='position:absolute; top:879px; left:101px; height:28px; width:86px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:879px; left:201px; height:27px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:879px; left:249px; height:32px; width:80px;'>Iuda,</span><span class='ocrx_word' style='position:absolute; top:883px; left:350px; height:22px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:878px; left:408px; height:27px; width:37px;'>die</span><span class='ocrx_word' style='position:absolute; top:877px; left:456px; height:32px; width:178px;'>Nachlommen</span><span class='ocrx_word' style='position:absolute; top:876px; left:645px; height:28px; width:97px;'>Salma</span><span class='ocrx_word' style='position:absolute; top:876px; left:762px; height:34px; width:114px;'>gewohnt</span><span class='ocrx_word' style='position:absolute; top:877px; left:887px; height:33px; width:85px;'>haben.</span><span class='ocrx_word' style='position:absolute; top:880px; left:992px; height:24px; width:10px;'>1</span><span class='ocrx_word' style='position:absolute; top:877px; left:1021px; height:34px; width:92px;'>Chron.</span><span class='ocr_par' style='position:absolute; top:923px; left:64px; height:73px; width:1048px;' ></span><span class='ocr_line' style='position:absolute; top:923px; left:96px; height:30px; width:89px;' ></span><span class='ocrx_word' style='position:absolute; top:923px; left:96px; height:30px; width:24px;'>2,</span><span class='ocrx_word' style='position:absolute; top:924px; left:141px; height:25px; width:44px;'>54.</span><span class='ocr_line' style='position:absolute; top:961px; left:64px; height:35px; width:1048px;' ></span><span class='ocrx_word' style='position:absolute; top:962px; left:64px; height:31px; width:148px;'>Attalia.</span><span class='ocrx_word' style='position:absolute; top:963px; left:249px; height:27px; width:63px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:963px; left:330px; height:27px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:962px; left:428px; height:26px; width:27px;'>in</span><span class='ocrx_word' style='position:absolute; top:961px; left:474px; height:33px; width:163px;'>Pamphilien</span><span class='ocrx_word' style='position:absolute; top:962px; left:665px; height:28px; width:36px;'>od.</span><span class='ocrx_word' style='position:absolute; top:961px; left:720px; height:33px; width:104px;'>Libyen,</span><span class='ocrx_word' style='position:absolute; top:967px; left:848px; height:22px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:962px; left:916px; height:27px; width:88px;'>Attala</span><span class='ocrx_word' style='position:absolute; top:962px; left:1023px; height:34px; width:89px;'>Phila.</span><span class='ocr_par' style='position:absolute; top:1005px; left:62px; height:77px; width:1073px;' ></span><span class='ocr_line' style='position:absolute; top:1005px; left:95px; height:34px; width:499px;' ></span><span class='ocrx_word' style='position:absolute; top:1006px; left:95px; height:33px; width:90px;'>delpho</span><span class='ocrx_word' style='position:absolute; top:1006px; left:206px; height:27px; width:96px;'>erbaut.</span><span class='ocrx_word' style='position:absolute; top:1006px; left:321px; height:31px; width:47px;'>Ap.</span><span class='ocrx_word' style='position:absolute; top:1005px; left:388px; height:33px; width:83px;'>Gesch.</span><span class='ocrx_word' style='position:absolute; top:1006px; left:494px; height:32px; width:39px;'>14,</span><span class='ocrx_word' style='position:absolute; top:1006px; left:553px; height:25px; width:41px;'>25.</span><span class='ocr_line' style='position:absolute; top:1046px; left:62px; height:36px; width:1073px;' ></span><span class='ocrx_word' style='position:absolute; top:1048px; left:62px; height:29px; width:146px;'>Attalus</span><span class='ocrx_word' style='position:absolute; top:1048px; left:255px; height:27px; width:51px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:1046px; left:330px; height:34px; width:81px;'>König</span><span class='ocrx_word' style='position:absolute; top:1047px; left:436px; height:26px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:1046px; left:482px; height:32px; width:112px;'>Mysien,</span><span class='ocrx_word' style='position:absolute; top:1046px; left:623px; height:32px; width:99px;'>welches</span><span class='ocrx_word' style='position:absolute; top:1047px; left:747px; height:26px; width:72px;'>unter</span><span class='ocrx_word' style='position:absolute; top:1046px; left:843px; height:35px; width:129px;'>Phrygien</span><span class='ocrx_word' style='position:absolute; top:1047px; left:997px; height:35px; width:115px;'>gehörte;</span><span class='ocrx_word' style='position:absolute; top:1058px; left:1128px; height:9px; width:7px;'>,</span><span class='ocr_par' style='position:absolute; top:1089px; left:95px; height:36px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1089px; left:95px; height:36px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1093px; left:95px; height:32px; width:112px;'>genannt</span><span class='ocrx_word' style='position:absolute; top:1095px; left:227px; height:22px; width:47px;'>von</span><span class='ocrx_word' style='position:absolute; top:1090px; left:294px; height:29px; width:122px;'>Attale,</span><span class='ocrx_word' style='position:absolute; top:1090px; left:435px; height:30px; width:99px;'>welches</span><span class='ocrx_word' style='position:absolute; top:1089px; left:553px; height:27px; width:38px;'>bei</span><span class='ocrx_word' style='position:absolute; top:1089px; left:610px; height:26px; width:47px;'>den</span><span class='ocrx_word' style='position:absolute; top:1089px; left:676px; height:33px; width:143px;'>Phrygiern</span><span class='ocrx_word' style='position:absolute; top:1089px; left:838px; height:32px; width:79px;'>Kropf</span><span class='ocrx_word' style='position:absolute; top:1090px; left:935px; height:26px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:1090px; left:1012px; height:34px; width:99px;'>Gurgel</span><span class='ocr_par' style='position:absolute; top:1131px; left:94px; height:37px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1131px; left:94px; height:37px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1133px; left:94px; height:35px; width:119px;'>geheißen</span><span class='ocrx_word' style='position:absolute; top:1133px; left:233px; height:32px; width:77px;'>haben</span><span class='ocrx_word' style='position:absolute; top:1131px; left:329px; height:30px; width:51px;'>soll.</span><span class='ocrx_word' style='position:absolute; top:1157px; left:393px; height:4px; width:4px;'>,</span><span class='ocrx_word' style='position:absolute; top:1131px; left:417px; height:28px; width:62px;'>War</span><span class='ocrx_word' style='position:absolute; top:1132px; left:497px; height:26px; width:39px;'>ein</span><span class='ocrx_word' style='position:absolute; top:1132px; left:555px; height:33px; width:82px;'>König</span><span class='ocrx_word' style='position:absolute; top:1132px; left:660px; height:26px; width:40px;'>der</span><span class='ocrx_word' style='position:absolute; top:1132px; left:719px; height:33px; width:170px;'>Pergamener</span><span class='ocrx_word' style='position:absolute; top:1133px; left:907px; height:25px; width:49px;'>und</span><span class='ocrx_word' style='position:absolute; top:1131px; left:976px; height:34px; width:134px;'>Phrvgier.</span><span class='ocr_par' style='position:absolute; top:1175px; left:59px; height:75px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:1175px; left:95px; height:32px; width:237px;' ></span><span class='ocrx_word' style='position:absolute; top:1177px; left:95px; height:24px; width:11px;'>l</span><span class='ocrx_word' style='position:absolute; top:1175px; left:130px; height:27px; width:81px;'>Mack.</span><span class='ocrx_word' style='position:absolute; top:1176px; left:233px; height:31px; width:39px;'>15,</span><span class='ocrx_word' style='position:absolute; top:1176px; left:292px; height:25px; width:40px;'>22.</span><span class='ocr_line' style='position:absolute; top:1216px; left:59px; height:34px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:1217px; left:59px; height:29px; width:87px;'>Ava.</span><span class='ocrx_word' style='position:absolute; top:1217px; left:184px; height:33px; width:40px;'>Ist</span><span class='ocrx_word' style='position:absolute; top:1217px; left:242px; height:26px; width:38px;'>bei</span><span class='ocrx_word' style='position:absolute; top:1218px; left:299px; height:25px; width:45px;'>den</span><span class='ocrx_word' style='position:absolute; top:1217px; left:364px; height:26px; width:68px;'>alten</span><span class='ocrx_word' style='position:absolute; top:1216px; left:453px; height:32px; width:115px;'>Griechen</span><span class='ocrx_word' style='position:absolute; top:1216px; left:587px; height:26px; width:49px;'>Aia</span><span class='ocrx_word' style='position:absolute; top:1216px; left:655px; height:26px; width:36px;'>od.</span><span class='ocrx_word' style='position:absolute; top:1216px; left:711px; height:31px; width:60px;'>Aea,</span><span class='ocrx_word' style='position:absolute; top:1216px; left:790px; height:26px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1216px; left:842px; height:33px; width:151px;'>Hauptstadt</span><span class='ocrx_word' style='position:absolute; top:1217px; left:1010px; height:26px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:1216px; left:1051px; height:29px; width:59px;'>Col»</span><span class='ocr_par' style='position:absolute; top:1258px; left:92px; height:35px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1258px; left:92px; height:35px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1261px; left:92px; height:32px; width:73px;'>chide,</span><span class='ocrx_word' style='position:absolute; top:1265px; left:186px; height:21px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:1260px; left:244px; height:25px; width:79px;'>Aetas</span><span class='ocrx_word' style='position:absolute; top:1258px; left:341px; height:34px; width:110px;'>regierte.</span><span class='ocrx_word' style='position:absolute; top:1258px; left:494px; height:33px; width:99px;'>Colchis</span><span class='ocrx_word' style='position:absolute; top:1258px; left:612px; height:33px; width:66px;'>heißt</span><span class='ocrx_word' style='position:absolute; top:1258px; left:697px; height:34px; width:115px;'>heutiges</span><span class='ocrx_word' style='position:absolute; top:1258px; left:833px; height:34px; width:83px;'>Tages</span><span class='ocrx_word' style='position:absolute; top:1258px; left:938px; height:35px; width:170px;'>Mengrelicn,</span><span class='ocr_par' style='position:absolute; top:1300px; left:92px; height:35px; width:1017px;' ></span><span class='ocr_line' style='position:absolute; top:1300px; left:92px; height:35px; width:1017px;' ></span><span class='ocrx_word' style='position:absolute; top:1303px; left:92px; height:27px; width:39px;'>die</span><span class='ocrx_word' style='position:absolute; top:1303px; left:160px; height:32px; width:98px;'>meisten</span><span class='ocrx_word' style='position:absolute; top:1302px; left:277px; height:30px; width:153px;'>Einwohner</span><span class='ocrx_word' style='position:absolute; top:1300px; left:455px; height:33px; width:50px;'>sind</span><span class='ocrx_word' style='position:absolute; top:1300px; left:531px; height:34px; width:122px;'>Christen.</span><span class='ocrx_word' style='position:absolute; top:1300px; left:698px; height:28px; width:57px;'>Von</span><span class='ocrx_word' style='position:absolute; top:1300px; left:780px; height:32px; width:51px;'>hier</span><span class='ocrx_word' style='position:absolute; top:1302px; left:855px; height:26px; width:101px;'>wurden</span><span class='ocrx_word' style='position:absolute; top:1302px; left:980px; height:26px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1301px; left:1037px; height:28px; width:72px;'>Leute</span><span class='ocr_par' style='position:absolute; top:1342px; left:92px; height:36px; width:1018px;' ></span><span class='ocr_line' style='position:absolute; top:1342px; left:92px; height:36px; width:1018px;' ></span><span class='ocrx_word' style='position:absolute; top:1349px; left:92px; height:22px; width:52px;'>von</span><span class='ocrx_word' style='position:absolute; top:1344px; left:165px; height:32px; width:182px;'>Salmanasscr</span><span class='ocrx_word' style='position:absolute; top:1344px; left:371px; height:31px; width:57px;'>nach</span><span class='ocrx_word' style='position:absolute; top:1343px; left:454px; height:27px; width:128px;'>Samaria</span><span class='ocrx_word' style='position:absolute; top:1343px; left:606px; height:35px; width:110px;'>gesührt,</span><span class='ocrx_word' style='position:absolute; top:1347px; left:741px; height:22px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:1342px; left:804px; height:33px; width:31px;'>sie</span><span class='ocrx_word' style='position:absolute; top:1343px; left:859px; height:32px; width:58px;'>noch</span><span class='ocrx_word' style='position:absolute; top:1343px; left:942px; height:33px; width:51px;'>ihre</span><span class='ocrx_word' style='position:absolute; top:1344px; left:1019px; height:27px; width:91px;'>Götter</span><span class='ocr_par' style='position:absolute; top:1386px; left:58px; height:76px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:1386px; left:93px; height:33px; width:782px;' ></span><span class='ocrx_word' style='position:absolute; top:1387px; left:93px; height:32px; width:118px;'>Nibehas</span><span class='ocrx_word' style='position:absolute; top:1387px; left:231px; height:26px; width:48px;'>und</span><span class='ocrx_word' style='position:absolute; top:1386px; left:298px; height:32px; width:123px;'>Tharthac</span><span class='ocrx_word' style='position:absolute; top:1386px; left:440px; height:27px; width:138px;'>anbeteten.</span><span class='ocrx_word' style='position:absolute; top:1388px; left:597px; height:24px; width:15px;'>2</span><span class='ocrx_word' style='position:absolute; top:1387px; left:630px; height:26px; width:64px;'>Kön.</span><span class='ocrx_word' style='position:absolute; top:1388px; left:716px; height:28px; width:38px;'>l7,</span><span class='ocrx_word' style='position:absolute; top:1386px; left:775px; height:27px; width:41px;'>24.</span><span class='ocrx_word' style='position:absolute; top:1387px; left:835px; height:26px; width:40px;'>31.</span><span class='ocr_line' style='position:absolute; top:1428px; left:58px; height:34px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:1428px; left:58px; height:30px; width:117px;'>Aven.</span><span class='ocrx_word' style='position:absolute; top:1429px; left:213px; height:33px; width:101px;'>Götze,</span><span class='ocrx_word' style='position:absolute; top:1428px; left:339px; height:27px; width:163px;'>Eitelleit.</span><span class='ocrx_word' style='position:absolute; top:1428px; left:538px; height:27px; width:42px;'>So</span><span class='ocrx_word' style='position:absolute; top:1429px; left:605px; height:26px; width:60px;'>wird</span><span class='ocrx_word' style='position:absolute; top:1428px; left:690px; height:33px; width:88px;'>Bethel</span><span class='ocrx_word' style='position:absolute; top:1429px; left:802px; height:33px; width:118px;'>genannt.</span><span class='ocrx_word' style='position:absolute; top:1428px; left:939px; height:34px; width:56px;'>Hos.</span><span class='ocrx_word' style='position:absolute; top:1431px; left:1023px; height:29px; width:38px;'>10,</span><span class='ocrx_word' style='position:absolute; top:1431px; left:1086px; height:25px; width:23px;'>8.</span><span class='ocr_par' style='position:absolute; top:1471px; left:92px; height:34px; width:1018px;' ></span><span class='ocr_line' style='position:absolute; top:1471px; left:92px; height:34px; width:1018px;' ></span><span class='ocrx_word' style='position:absolute; top:1478px; left:92px; height:27px; width:88px;'>wegen</span><span class='ocrx_word' style='position:absolute; top:1472px; left:199px; height:26px; width:42px;'>der</span><span class='ocrx_word' style='position:absolute; top:1471px; left:261px; height:33px; width:104px;'>Götzen,</span><span class='ocrx_word' style='position:absolute; top:1471px; left:390px; height:26px; width:39px;'>die</span><span class='ocrx_word' style='position:absolute; top:1471px; left:456px; height:32px; width:100px;'>daselbst</span><span class='ocrx_word' style='position:absolute; top:1476px; left:579px; height:21px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:1472px; left:651px; height:25px; width:43px;'>den</span><span class='ocrx_word' style='position:absolute; top:1471px; left:715px; height:32px; width:137px;'>Israeliten</span><span class='ocrx_word' style='position:absolute; top:1471px; left:877px; height:32px; width:96px;'>verehrt</span><span class='ocrx_word' style='position:absolute; top:1472px; left:1000px; height:26px; width:110px;'>wurden.</span><span class='ocr_par' style='position:absolute; top:1513px; left:91px; height:35px; width:1019px;' ></span><span class='ocr_line' style='position:absolute; top:1513px; left:91px; height:35px; width:1019px;' ></span><span class='ocrx_word' style='position:absolute; top:1515px; left:91px; height:26px; width:58px;'>Mit</span><span class='ocrx_word' style='position:absolute; top:1515px; left:167px; height:26px; width:53px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1520px; left:240px; height:28px; width:92px;'>ganzen</span><span class='ocrx_word' style='position:absolute; top:1513px; left:352px; height:27px; width:109px;'>Namen:</span><span class='ocrx_word' style='position:absolute; top:1513px; left:482px; height:31px; width:158px;'>Beth»Aven,</span><span class='ocrx_word' style='position:absolute; top:1513px; left:658px; height:27px; width:50px;'>das</span><span class='ocrx_word' style='position:absolute; top:1513px; left:726px; height:35px; width:167px;'>Götzenhaus,</span><span class='ocrx_word' style='position:absolute; top:1513px; left:914px; height:33px; width:65px;'>oder,</span><span class='ocrx_word' style='position:absolute; top:1514px; left:997px; height:26px; width:32px;'>da</span><span class='ocrx_word' style='position:absolute; top:1520px; left:1048px; height:21px; width:62px;'>man</span><span class='ocr_par' style='position:absolute; top:1555px; left:56px; height:78px; width:1054px;' ></span><span class='ocr_line' style='position:absolute; top:1555px; left:91px; height:33px; width:540px;' ></span><span class='ocrx_word' style='position:absolute; top:1558px; left:91px; height:26px; width:58px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1557px; left:169px; height:26px; width:85px;'>Eiteln</span><span class='ocrx_word' style='position:absolute; top:1556px; left:275px; height:31px; width:178px;'>nachwandelt.</span><span class='ocrx_word' style='position:absolute; top:1555px; left:473px; height:33px; width:59px;'>Hos.</span><span class='ocrx_word' style='position:absolute; top:1558px; left:549px; height:26px; width:22px;'>4,</span><span class='ocrx_word' style='position:absolute; top:1558px; left:593px; height:23px; width:38px;'>15.</span><span class='ocr_line' style='position:absolute; top:1597px; left:56px; height:36px; width:1054px;' ></span><span class='ocrx_word' style='position:absolute; top:1597px; left:56px; height:36px; width:186px;'>Augustus.</span><span class='ocrx_word' style='position:absolute; top:1597px; left:287px; height:34px; width:132px;'>Würdig</span><span class='ocrx_word' style='position:absolute; top:1598px; left:448px; height:32px; width:129px;'>verehrt</span><span class='ocrx_word' style='position:absolute; top:1598px; left:608px; height:26px; width:60px;'>und</span><span class='ocrx_word' style='position:absolute; top:1599px; left:704px; height:33px; width:172px;'>angebetet</span><span class='ocrx_word' style='position:absolute; top:1605px; left:908px; height:27px; width:36px;'>zu</span><span class='ocrx_word' style='position:absolute; top:1599px; left:978px; height:28px; width:132px;'>werden.</span><span class='ocr_par' style='position:absolute; top:1640px; left:92px; height:34px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1640px; left:92px; height:34px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1640px; left:92px; height:34px; width:97px;'>Diesen</span><span class='ocrx_word' style='position:absolute; top:1640px; left:211px; height:27px; width:100px;'>Namen</span><span class='ocrx_word' style='position:absolute; top:1641px; left:340px; height:33px; width:46px;'>gab</span><span class='ocrx_word' style='position:absolute; top:1641px; left:413px; height:26px; width:46px;'>das</span><span class='ocrx_word' style='position:absolute; top:1640px; left:487px; height:32px; width:109px;'>romische</span><span class='ocrx_word' style='position:absolute; top:1640px; left:616px; height:27px; width:62px;'>Voll</span><span class='ocrx_word' style='position:absolute; top:1641px; left:706px; height:26px; width:52px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1641px; left:781px; height:31px; width:88px;'>Kaiser</span><span class='ocrx_word' style='position:absolute; top:1641px; left:887px; height:31px; width:143px;'>Octavian,</span><span class='ocrx_word' style='position:absolute; top:1642px; left:1058px; height:26px; width:50px;'>und</span><span class='ocr_par' style='position:absolute; top:1682px; left:93px; height:34px; width:1015px;' ></span><span class='ocr_line' style='position:absolute; top:1682px; left:93px; height:34px; width:1015px;' ></span><span class='ocrx_word' style='position:absolute; top:1683px; left:93px; height:27px; width:49px;'>alle</span><span class='ocrx_word' style='position:absolute; top:1683px; left:161px; height:32px; width:130px;'>romischen</span><span class='ocrx_word' style='position:absolute; top:1683px; left:310px; height:32px; width:86px;'>Kaiser</span><span class='ocrx_word' style='position:absolute; top:1683px; left:416px; height:30px; width:79px;'>haben</span><span class='ocrx_word' style='position:absolute; top:1682px; left:514px; height:32px; width:80px;'>diesen</span><span class='ocrx_word' style='position:absolute; top:1682px; left:614px; height:27px; width:95px;'>Namen</span><span class='ocrx_word' style='position:absolute; top:1683px; left:728px; height:33px; width:170px;'>beibehalten,</span><span class='ocrx_word' style='position:absolute; top:1682px; left:917px; height:33px; width:47px;'>daß</span><span class='ocrx_word' style='position:absolute; top:1682px; left:983px; height:33px; width:31px;'>sie</span><span class='ocrx_word' style='position:absolute; top:1692px; left:1033px; height:18px; width:75px;'>«au,-</span><span class='ocr_par' style='position:absolute; top:1724px; left:55px; height:119px; width:1052px;' ></span><span class='ocr_line' style='position:absolute; top:1724px; left:90px; height:35px; width:907px;' ></span><span class='ocrx_word' style='position:absolute; top:1733px; left:90px; height:25px; width:52px;'>per</span><span class='ocrx_word' style='position:absolute; top:1727px; left:160px; height:31px; width:124px;'>2ußr>«ti,</span><span class='ocrx_word' style='position:absolute; top:1726px; left:304px; height:25px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:1724px; left:345px; height:26px; width:15px;'>i,</span><span class='ocrx_word' style='position:absolute; top:1725px; left:382px; height:32px; width:80px;'>allzeit</span><span class='ocrx_word' style='position:absolute; top:1725px; left:482px; height:31px; width:99px;'>Mehrer</span><span class='ocrx_word' style='position:absolute; top:1725px; left:600px; height:26px; width:43px;'>des</span><span class='ocrx_word' style='position:absolute; top:1724px; left:664px; height:32px; width:86px;'>Reichs</span><span class='ocrx_word' style='position:absolute; top:1725px; left:770px; height:34px; width:115px;'>geheißen</span><span class='ocrx_word' style='position:absolute; top:1725px; left:904px; height:33px; width:93px;'>haben.</span><span class='ocr_line' style='position:absolute; top:1766px; left:55px; height:34px; width:897px;' ></span><span class='ocrx_word' style='position:absolute; top:1766px; left:55px; height:34px; width:121px;'>Avith.</span><span class='ocrx_word' style='position:absolute; top:1767px; left:212px; height:32px; width:112px;'>Haufe.</span><span class='ocrx_word' style='position:absolute; top:1766px; left:361px; height:27px; width:63px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:1766px; left:443px; height:28px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:1768px; left:542px; height:25px; width:27px;'>in</span><span class='ocrx_word' style='position:absolute; top:1767px; left:587px; height:32px; width:122px;'>Idumäa.</span><span class='ocrx_word' style='position:absolute; top:1769px; left:732px; height:24px; width:10px;'>1</span><span class='ocrx_word' style='position:absolute; top:1767px; left:763px; height:32px; width:68px;'>Mos.</span><span class='ocrx_word' style='position:absolute; top:1769px; left:849px; height:29px; width:43px;'>36,</span><span class='ocrx_word' style='position:absolute; top:1769px; left:910px; height:26px; width:42px;'>35.</span><span class='ocr_line' style='position:absolute; top:1809px; left:57px; height:34px; width:1050px;' ></span><span class='ocrx_word' style='position:absolute; top:1809px; left:57px; height:30px; width:125px;'>Aulon.</span><span class='ocrx_word' style='position:absolute; top:1809px; left:236px; height:34px; width:209px;'>Ausgehöhlt.</span><span class='ocrx_word' style='position:absolute; top:1809px; left:491px; height:27px; width:62px;'>Das</span><span class='ocrx_word' style='position:absolute; top:1809px; left:581px; height:34px; width:72px;'>große</span><span class='ocrx_word' style='position:absolute; top:1809px; left:681px; height:32px; width:76px;'>Thal,</span><span class='ocrx_word' style='position:absolute; top:1810px; left:791px; height:27px; width:80px;'>worin</span><span class='ocrx_word' style='position:absolute; top:1810px; left:897px; height:27px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1809px; left:962px; height:34px; width:145px;'>berühmten</span><span class='ocr_par' style='position:absolute; top:1851px; left:89px; height:36px; width:1017px;' ></span><span class='ocr_line' style='position:absolute; top:1851px; left:89px; height:36px; width:1017px;' ></span><span class='ocrx_word' style='position:absolute; top:1853px; left:89px; height:29px; width:97px;'>Städte</span><span class='ocrx_word' style='position:absolute; top:1852px; left:204px; height:34px; width:111px;'>Vethsan</span><span class='ocrx_word' style='position:absolute; top:1852px; left:334px; height:27px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:1852px; left:409px; height:34px; width:179px;'>Scythopolis,</span><span class='ocrx_word' style='position:absolute; top:1851px; left:605px; height:34px; width:127px;'>Tlberias,</span><span class='ocrx_word' style='position:absolute; top:1852px; left:751px; height:35px; width:111px;'>Iericho,</span><span class='ocrx_word' style='position:absolute; top:1851px; left:881px; height:29px; width:48px;'>das</span><span class='ocrx_word' style='position:absolute; top:1853px; left:949px; height:27px; width:64px;'>todte</span><span class='ocrx_word' style='position:absolute; top:1852px; left:1033px; height:28px; width:73px;'>Meer</span></div>
metadata CHANGED
@@ -1,82 +1,95 @@
1
- --- !ruby/object:Gem::Specification
1
+ --- !ruby/object:Gem::Specification
2
2
  name: rhocr
3
- version: !ruby/object:Gem::Version
3
+ version: !ruby/object:Gem::Version
4
+ version: '0.1'
4
5
  prerelease:
5
- version: 0.0.3
6
6
  platform: ruby
7
- authors:
7
+ authors:
8
8
  - Andreas Neumann
9
9
  autorequire:
10
10
  bindir: bin
11
11
  cert_chain: []
12
-
13
- date: 2011-07-03 00:00:00 +02:00
14
- default_executable:
15
- dependencies: []
16
-
12
+ date: 2011-09-08 00:00:00.000000000Z
13
+ dependencies:
14
+ - !ruby/object:Gem::Dependency
15
+ name: nokogiri
16
+ requirement: &70276550001820 !ruby/object:Gem::Requirement
17
+ none: false
18
+ requirements:
19
+ - - ! '>='
20
+ - !ruby/object:Gem::Version
21
+ version: '0'
22
+ type: :runtime
23
+ prerelease: false
24
+ version_requirements: *70276550001820
17
25
  description: Manipulate and use OCR data encode in HOCR
18
- email: info @nospam@ an-it.com
26
+ email: andreas@neumann.biz
19
27
  executables: []
20
-
21
28
  extensions: []
22
-
23
- extra_rdoc_files:
29
+ extra_rdoc_files:
24
30
  - README
25
- - lib/ocr_box.rb
31
+ - TODO.txt
32
+ - lib/hocr_box.rb
33
+ - lib/ocr_document.rb
34
+ - lib/ocr_element.rb
26
35
  - lib/ocr_page.rb
27
- - lib/ocrx_word.rb
28
36
  - lib/rhocr.rb
29
- files:
37
+ files:
30
38
  - Manifest
31
39
  - README
32
40
  - Rakefile
41
+ - TODO.txt
42
+ - data/Seite_Die_Gartenlaube_242.html
33
43
  - data/Seite_Tagebuch_H_C_Lang_08.html
44
+ - data/Seite_Tagebuch_H_C_Lang_08.jpg
45
+ - data/test.html
46
+ - data/test.png
34
47
  - example/example_server.rb
35
48
  - example/public/OCRTest.css
36
49
  - example/public/OCRTest.html
37
50
  - example/public/OCRTest_marker.js
38
- - example/public/img/Seite_Tagebuch_H_C_Lang_05.jpg
51
+ - example/public/Seite_Tagebuch_H_C_Lang_08.jpg
39
52
  - example/public/img/Seite_Tagebuch_H_C_Lang_08.jpg
40
- - lib/ocr_box.rb
53
+ - lib/hocr_box.rb
54
+ - lib/ocr_document.rb
55
+ - lib/ocr_element.rb
41
56
  - lib/ocr_page.rb
42
- - lib/ocrx_word.rb
43
57
  - lib/rhocr.rb
44
58
  - rhocr.gemspec
45
- - rspec/ocr_box_spec.rb
46
- - rspec/ocr_page_spec.rb
47
- - rspec/ocrx_word_spec.rb
48
- has_rdoc: true
59
+ - spec/hocr_box_spec.rb
60
+ - spec/ocr_document_spec.rb
61
+ - spec/ocr_element_spec.rb
62
+ - spec/ocr_page_spec.rb
63
+ - spec/rhocr_spec.rb
64
+ - test.html
49
65
  homepage: http://github.com/daandi/rhocr
50
66
  licenses: []
51
-
52
67
  post_install_message:
53
- rdoc_options:
68
+ rdoc_options:
54
69
  - --line-numbers
55
70
  - --inline-source
56
71
  - --title
57
72
  - Rhocr
58
73
  - --main
59
74
  - README
60
- require_paths:
75
+ require_paths:
61
76
  - lib
62
- required_ruby_version: !ruby/object:Gem::Requirement
77
+ required_ruby_version: !ruby/object:Gem::Requirement
63
78
  none: false
64
- requirements:
65
- - - ">="
66
- - !ruby/object:Gem::Version
67
- version: "0"
68
- required_rubygems_version: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - ! '>='
81
+ - !ruby/object:Gem::Version
82
+ version: '0'
83
+ required_rubygems_version: !ruby/object:Gem::Requirement
69
84
  none: false
70
- requirements:
71
- - - ">="
72
- - !ruby/object:Gem::Version
73
- version: "1.2"
85
+ requirements:
86
+ - - ! '>='
87
+ - !ruby/object:Gem::Version
88
+ version: '1.2'
74
89
  requirements: []
75
-
76
90
  rubyforge_project: rhocr
77
- rubygems_version: 1.6.2
91
+ rubygems_version: 1.8.6
78
92
  signing_key:
79
93
  specification_version: 3
80
94
  summary: Manipulate and use OCR data encode in HOCR
81
95
  test_files: []
82
-
data/lib/ocr_box.rb DELETED
@@ -1,43 +0,0 @@
1
- #coding: utf-8
2
-
3
- class OCRBox
4
-
5
- attr_reader :x1, :y1, :x2, :y2
6
-
7
- def initialize(x1, y1 , x2, y2)
8
- @x1 = x1
9
- @y1 = y1
10
- @x2 = x2
11
- @y2 = y2
12
- end
13
-
14
- def encloses?(element)
15
- @x1 <= element.x1 and
16
- @x2 >= element.x2 and
17
- @y1 <= element.y1 and
18
- @y2 >= element.y2
19
- end
20
-
21
- def enclosed_by?(element)
22
- return element.encloses? self
23
- end
24
-
25
- def to_s
26
- "tl->(x:#{@x1} y:#{@y1})/br->:(x:#{@x2} y:#{@y2})"
27
- end
28
-
29
- def to_css_style
30
- top = @y1
31
- left = @x1
32
- height = @y2 - @y1
33
- width = @x2 - @x1
34
-
35
- "position:absolute; top:#{top}px; left:#{left}px; height:#{height}px; width:#{width}px;"
36
- end
37
-
38
- def to_json
39
-
40
- end
41
-
42
- end
43
-
data/lib/ocrx_word.rb DELETED
@@ -1,23 +0,0 @@
1
- #coding: utf-8
2
-
3
- require 'cgi'
4
- require_relative 'ocr_box'
5
-
6
- class OCRXWord < OCRBox
7
-
8
- attr_reader :text
9
-
10
- def initialize(x1,y1,x2,y2,word)
11
- super(x1.to_i, y1.to_i, x2.to_i, y2.to_i)
12
- @text = word
13
- end
14
-
15
- def to_html(css_class = 'ocrx_word')
16
- "<span style='#{ to_css_style }' class='#{css_class}'><span class='word'>" + CGI::escapeHTML(@text) +"</span></span>"
17
- end
18
-
19
- def to_s
20
- "#{@text}\t#{super}"
21
- end
22
-
23
- end
@@ -1,48 +0,0 @@
1
- #coding: utf-8
2
-
3
- require_relative '../lib/ocr_box'
4
-
5
- describe OCRBox do
6
-
7
- before(:each) do
8
- @box ||= OCRBox.new(1,2,20,8)
9
- end
10
-
11
- describe "#to_s" do
12
- it "prints a human readable Box-Version with coordinates upper_left(x,y) bottom_right(x,y)" do
13
- @box.to_s.should == "tl->(x:1 y:2)/br->:(x:20 y:8)"
14
- end
15
- end
16
-
17
- describe '#encloses?(element)' do
18
- it "tests wather given OCRBox is enclosed by the current OCRBox" do
19
- @box.encloses?( OCRBox.new(0,3,19,7) ).should be_false
20
- @box.encloses?( OCRBox.new(2,3,19,7) ).should be_true
21
- end
22
- it "encloses also itself" do
23
- @box.encloses?( @box ).should be_true
24
- end
25
- end
26
-
27
- describe '#to_css_style' do
28
- it 'should create css-style attributes' do
29
- @box.to_css_style.should == 'position:absolute; top:2px; left:1px; height:6px; width:19px;'
30
- end
31
- end
32
-
33
- describe '#enclosed_by?(element)' do
34
- it 'should be enclosed by Boxes bigger than itself' do
35
- @box.enclosed_by?( OCRBox.new(0,1,21,9) ).should be_true
36
- end
37
- it 'should not be enclosed by Boxes smaller than itself' do
38
- @box.enclosed_by?( OCRBox.new(2,3,19,7) ).should be_false
39
- end
40
- it 'should be enclosed by Boxes of the same size' do
41
- @box.enclosed_by?( @box ).should be_true
42
- end
43
- end
44
-
45
-
46
-
47
-
48
- end
@@ -1,17 +0,0 @@
1
- #coding: utf-8
2
-
3
- require_relative '../lib/ocr_page'
4
-
5
- describe OCRPage do
6
-
7
- before(:each) do
8
- @ocr_page ||= OCRPage.new('../data/Seite_Tagebuch_H_C_Lang_08.html')
9
- end
10
-
11
- describe '' do
12
- it '' do
13
- p @ocr_page.enclosed_words( OCRBox.new(500,1703,1200,1800) )
14
- end
15
- end
16
-
17
- end
@@ -1,32 +0,0 @@
1
- #coding: utf-8
2
-
3
- require_relative '../lib/ocrx_word'
4
-
5
- describe OCRXWord do
6
-
7
- before(:each) do
8
- @ocrx_word = OCRXWord.new(10,15,20,20,'WORT')
9
- end
10
-
11
- describe '#to_s' do
12
- it 'should print the coordinates of the box and the textual information' do
13
- p @ocrx_word
14
- @ocrx_word.to_s.should == "WORT\ttl->(x:10 y:15)/br->:(x:20 y:20)"
15
- end
16
- end
17
-
18
- describe '#to_html(css_class)' do
19
- it 'should create an span elment to overlay an image on an html-page' do
20
- @ocrx_word.to_html.should == "<span style='position:absolute; top:15px; left:10px; height:5px; width:10px;' class='ocrx_word'><span class='word'>WORT</span></span>"
21
- end
22
-
23
- it 'no css_class_class given should default to ocrx_word' do
24
- @ocrx_word.to_html.should =~ /class='ocrx_word'/
25
- end
26
-
27
- it 'css_class given should be part of genearted html' do
28
- @ocrx_word.to_html('rosebud').should =~ /class='rosebud'/
29
- end
30
- end
31
-
32
- end