rhocr 0.0.3 → 0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
data/test.html ADDED
@@ -0,0 +1 @@
1
+ <div class='ocr_page' style='position:absolute; top:0px; left:0px; height:1326px; width:1326px;;background-image: url(data/test.png); width:1326px; height:1326>px ;'><span class='ocrx_block' style='position:absolute; top:32px; left:55px; height:1855px; width:1080px;' ></span><span class='ocr_par' style='position:absolute; top:32px; left:432px; height:39px; width:685px;' ></span><span class='ocr_line' style='position:absolute; top:32px; left:432px; height:39px; width:685px;' ></span><span class='ocrx_word' style='position:absolute; top:32px; left:432px; height:35px; width:156px;'>Athenobius</span><span class='ocrx_word' style='position:absolute; top:48px; left:606px; height:6px; width:34px;'>—</span><span class='ocrx_word' style='position:absolute; top:34px; left:657px; height:28px; width:92px;'>Aulon.</span><span class='ocrx_word' style='position:absolute; top:37px; left:1074px; height:34px; width:43px;'>29</span><span class='ocr_par' style='position:absolute; top:109px; left:79px; height:80px; width:1040px;' ></span><span class='ocr_line' style='position:absolute; top:109px; left:79px; height:36px; width:1040px;' ></span><span class='ocrx_word' style='position:absolute; top:109px; left:79px; height:35px; width:215px;'>Athenobius,</span><span class='ocrx_word' style='position:absolute; top:112px; left:334px; height:27px; width:64px;'>Der</span><span class='ocrx_word' style='position:absolute; top:115px; left:417px; height:24px; width:59px;'>von</span><span class='ocrx_word' style='position:absolute; top:112px; left:494px; height:27px; width:51px;'>der</span><span class='ocrx_word' style='position:absolute; top:112px; left:565px; height:28px; width:122px;'>Göttin</span><span class='ocrx_word' style='position:absolute; top:112px; left:707px; height:28px; width:150px;'>Minerva</span><span class='ocrx_word' style='position:absolute; top:112px; left:876px; height:33px; width:78px;'>lebt,</span><span class='ocrx_word' style='position:absolute; top:112px; left:974px; height:28px; width:69px;'>oder:</span><span class='ocrx_word' style='position:absolute; top:112px; left:1062px; height:28px; width:57px;'>Mi»</span><span class='ocr_line' style='position:absolute; top:155px; left:108px; height:34px; width:192px;' ></span><span class='ocrx_word' style='position:absolute; top:159px; left:108px; height:23px; width:75px;'>nerva</span><span class='ocrx_word' style='position:absolute; top:155px; left:201px; height:34px; width:99px;'>Bogen.</span><span class='ocr_par' style='position:absolute; top:196px; left:74px; height:120px; width:1043px;' ></span><span class='ocr_line' style='position:absolute; top:196px; left:160px; height:36px; width:957px;' ></span><span class='ocrx_word' style='position:absolute; top:198px; left:160px; height:27px; width:54px;'>Des</span><span class='ocrx_word' style='position:absolute; top:197px; left:242px; height:33px; width:98px;'>Königs</span><span class='ocrx_word' style='position:absolute; top:196px; left:367px; height:34px; width:136px;'>Antiochus</span><span class='ocrx_word' style='position:absolute; top:197px; left:531px; height:33px; width:95px;'>Freund</span><span class='ocrx_word' style='position:absolute; top:197px; left:655px; height:28px; width:58px;'>oder</span><span class='ocrx_word' style='position:absolute; top:196px; left:739px; height:36px; width:119px;'>geheimer</span><span class='ocrx_word' style='position:absolute; top:196px; left:885px; height:34px; width:78px;'>Nath.</span><span class='ocrx_word' style='position:absolute; top:199px; left:994px; height:25px; width:11px;'>l</span><span class='ocrx_word' style='position:absolute; top:197px; left:1033px; height:29px; width:84px;'>Mack.</span><span class='ocr_line' style='position:absolute; top:241px; left:109px; height:33px; width:97px;' ></span><span class='ocrx_word' style='position:absolute; top:241px; left:109px; height:33px; width:38px;'>15,</span><span class='ocrx_word' style='position:absolute; top:242px; left:166px; height:25px; width:40px;'>28.</span><span class='ocr_line' style='position:absolute; top:281px; left:74px; height:35px; width:1042px;' ></span><span class='ocrx_word' style='position:absolute; top:281px; left:74px; height:34px; width:131px;'>Athlai.</span><span class='ocrx_word' style='position:absolute; top:284px; left:242px; height:26px; width:68px;'>Dee</span><span class='ocrx_word' style='position:absolute; top:282px; left:337px; height:33px; width:80px;'>Herr</span><span class='ocrx_word' style='position:absolute; top:281px; left:440px; height:34px; width:158px;'>zerreißet</span><span class='ocrx_word' style='position:absolute; top:282px; left:625px; height:28px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:282px; left:706px; height:34px; width:158px;'>zerbricht.</span><span class='ocrx_word' style='position:absolute; top:282px; left:898px; height:28px; width:77px;'>Einer</span><span class='ocrx_word' style='position:absolute; top:286px; left:999px; height:24px; width:51px;'>von</span><span class='ocrx_word' style='position:absolute; top:282px; left:1069px; height:28px; width:47px;'>den</span><span class='ocr_par' style='position:absolute; top:324px; left:74px; height:77px; width:1040px;' ></span><span class='ocr_line' style='position:absolute; top:324px; left:107px; height:33px; width:487px;' ></span><span class='ocrx_word' style='position:absolute; top:325px; left:107px; height:32px; width:174px;'>Nachlommen</span><span class='ocrx_word' style='position:absolute; top:324px; left:300px; height:28px; width:92px;'>Bebai.</span><span class='ocrx_word' style='position:absolute; top:324px; left:410px; height:32px; width:62px;'>Esra</span><span class='ocrx_word' style='position:absolute; top:327px; left:496px; height:28px; width:37px;'>10,</span><span class='ocrx_word' style='position:absolute; top:326px; left:553px; height:25px; width:41px;'>28.</span><span class='ocr_line' style='position:absolute; top:366px; left:74px; height:35px; width:1040px;' ></span><span class='ocrx_word' style='position:absolute; top:366px; left:74px; height:34px; width:115px;'>Athni.</span><span class='ocrx_word' style='position:absolute; top:368px; left:217px; height:27px; width:79px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:367px; left:315px; height:34px; width:135px;'>Trübsal</span><span class='ocrx_word' style='position:absolute; top:372px; left:469px; height:22px; width:59px;'>von</span><span class='ocrx_word' style='position:absolute; top:366px; left:548px; height:28px; width:90px;'>Gott.</span><span class='ocrx_word' style='position:absolute; top:366px; left:673px; height:28px; width:49px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:366px; left:742px; height:34px; width:77px;'>Sohn</span><span class='ocrx_word' style='position:absolute; top:366px; left:838px; height:34px; width:116px;'>Semaja.</span><span class='ocrx_word' style='position:absolute; top:369px; left:986px; height:25px; width:12px;'>1</span><span class='ocrx_word' style='position:absolute; top:368px; left:1018px; height:32px; width:96px;'>Chron.</span><span class='ocr_par' style='position:absolute; top:412px; left:71px; height:76px; width:1041px;' ></span><span class='ocr_line' style='position:absolute; top:412px; left:104px; height:28px; width:83px;' ></span><span class='ocrx_word' style='position:absolute; top:412px; left:104px; height:28px; width:40px;'>27.</span><span class='ocrx_word' style='position:absolute; top:413px; left:163px; height:25px; width:24px;'>7.</span><span class='ocr_line' style='position:absolute; top:451px; left:71px; height:37px; width:1041px;' ></span><span class='ocrx_word' style='position:absolute; top:451px; left:71px; height:34px; width:146px;'>Athniel.</span><span class='ocrx_word' style='position:absolute; top:452px; left:246px; height:27px; width:118px;'>Gottes</span><span class='ocrx_word' style='position:absolute; top:451px; left:384px; height:33px; width:147px;'>Trübsal,</span><span class='ocrx_word' style='position:absolute; top:451px; left:550px; height:28px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:451px; left:591px; height:28px; width:17px;'>i.</span><span class='ocrx_word' style='position:absolute; top:451px; left:627px; height:28px; width:54px;'>eine</span><span class='ocrx_word' style='position:absolute; top:451px; left:699px; height:33px; width:120px;'>Trübsal,</span><span class='ocrx_word' style='position:absolute; top:459px; left:839px; height:20px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:452px; left:908px; height:28px; width:62px;'>Gott</span><span class='ocrx_word' style='position:absolute; top:452px; left:990px; height:36px; width:122px;'>zugesügt.</span><span class='ocr_par' style='position:absolute; top:494px; left:102px; height:34px; width:1008px;' ></span><span class='ocr_line' style='position:absolute; top:494px; left:102px; height:34px; width:1008px;' ></span><span class='ocrx_word' style='position:absolute; top:496px; left:102px; height:27px; width:50px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:495px; left:172px; height:31px; width:76px;'>Sohn</span><span class='ocrx_word' style='position:absolute; top:495px; left:268px; height:30px; width:94px;'>Kenas,</span><span class='ocrx_word' style='position:absolute; top:495px; left:380px; height:26px; width:44px;'>des</span><span class='ocrx_word' style='position:absolute; top:494px; left:445px; height:27px; width:112px;'>Bruders</span><span class='ocrx_word' style='position:absolute; top:494px; left:576px; height:32px; width:89px;'>Kaleb;</span><span class='ocrx_word' style='position:absolute; top:500px; left:693px; height:28px; width:105px;'>gewann</span><span class='ocrx_word' style='position:absolute; top:495px; left:818px; height:33px; width:98px;'>Kiriath</span><span class='ocrx_word' style='position:absolute; top:495px; left:936px; height:33px; width:106px;'>Sepher,</span><span class='ocrx_word' style='position:absolute; top:495px; left:1061px; height:28px; width:49px;'>und</span><span class='ocr_par' style='position:absolute; top:535px; left:68px; height:79px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:535px; left:100px; height:35px; width:937px;' ></span><span class='ocrx_word' style='position:absolute; top:538px; left:100px; height:27px; width:80px;'>damit</span><span class='ocrx_word' style='position:absolute; top:537px; left:199px; height:33px; width:82px;'>Achsa.</span><span class='ocrx_word' style='position:absolute; top:538px; left:300px; height:26px; width:36px;'>die</span><span class='ocrx_word' style='position:absolute; top:537px; left:356px; height:32px; width:98px;'>Tochter</span><span class='ocrx_word' style='position:absolute; top:535px; left:472px; height:32px; width:81px;'>seines</span><span class='ocrx_word' style='position:absolute; top:537px; left:574px; height:27px; width:100px;'>Betters</span><span class='ocrx_word' style='position:absolute; top:537px; left:694px; height:27px; width:86px;'>Kaleb.</span><span class='ocrx_word' style='position:absolute; top:536px; left:800px; height:34px; width:77px;'>Nicht,</span><span class='ocrx_word' style='position:absolute; top:540px; left:899px; height:29px; width:20px;'>1.</span><span class='ocrx_word' style='position:absolute; top:539px; left:940px; height:26px; width:38px;'>12.</span><span class='ocrx_word' style='position:absolute; top:539px; left:1000px; height:25px; width:37px;'>13.</span><span class='ocr_line' style='position:absolute; top:576px; left:68px; height:38px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:578px; left:68px; height:36px; width:308px;'>Atroth-Sophan,</span><span class='ocrx_word' style='position:absolute; top:580px; left:396px; height:26px; width:37px;'>die</span><span class='ocrx_word' style='position:absolute; top:580px; left:454px; height:27px; width:101px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:580px; left:580px; height:26px; width:53px;'>oder</span><span class='ocrx_word' style='position:absolute; top:579px; left:658px; height:30px; width:102px;'>Decke,</span><span class='ocrx_word' style='position:absolute; top:580px; left:785px; height:26px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:580px; left:860px; height:34px; width:177px;'>Bedeckung</span><span class='ocrx_word' style='position:absolute; top:576px; left:1057px; height:32px; width:62px;'>des'</span><span class='ocr_par' style='position:absolute; top:621px; left:100px; height:36px; width:1011px;' ></span><span class='ocr_line' style='position:absolute; top:621px; left:100px; height:36px; width:1011px;' ></span><span class='ocrx_word' style='position:absolute; top:624px; left:100px; height:33px; width:135px;'>Hügels.</span><span class='ocrx_word' style='position:absolute; top:623px; left:273px; height:27px; width:62px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:623px; left:355px; height:26px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:623px; left:456px; height:26px; width:40px;'>der</span><span class='ocrx_word' style='position:absolute; top:621px; left:515px; height:28px; width:141px;'>Rubeniten</span><span class='ocrx_word' style='position:absolute; top:621px; left:680px; height:27px; width:35px;'>im</span><span class='ocrx_word' style='position:absolute; top:622px; left:734px; height:34px; width:141px;'>Königreich</span><span class='ocrx_word' style='position:absolute; top:622px; left:895px; height:32px; width:97px;'>Sthon.</span><span class='ocrx_word' style='position:absolute; top:624px; left:1008px; height:26px; width:16px;'>4</span><span class='ocrx_word' style='position:absolute; top:623px; left:1043px; height:34px; width:68px;'>Mos.</span><span class='ocr_par' style='position:absolute; top:668px; left:67px; height:74px; width:1045px;' ></span><span class='ocr_line' style='position:absolute; top:668px; left:98px; height:30px; width:102px;' ></span><span class='ocrx_word' style='position:absolute; top:669px; left:98px; height:29px; width:41px;'>32,</span><span class='ocrx_word' style='position:absolute; top:668px; left:158px; height:25px; width:42px;'>35.</span><span class='ocr_line' style='position:absolute; top:706px; left:67px; height:36px; width:1045px;' ></span><span class='ocrx_word' style='position:absolute; top:707px; left:67px; height:35px; width:274px;'>AtrothAddar:</span><span class='ocrx_word' style='position:absolute; top:706px; left:356px; height:29px; width:62px;'>Die</span><span class='ocrx_word' style='position:absolute; top:707px; left:432px; height:27px; width:105px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:706px; left:551px; height:27px; width:110px;'>Addar</span><span class='ocrx_word' style='position:absolute; top:706px; left:675px; height:31px; width:54px;'>(des</span><span class='ocrx_word' style='position:absolute; top:706px; left:744px; height:33px; width:105px;'>Sohnes</span><span class='ocrx_word' style='position:absolute; top:706px; left:861px; height:34px; width:155px;'>Benjamin).</span><span class='ocrx_word' style='position:absolute; top:708px; left:1037px; height:33px; width:75px;'>Diese</span><span class='ocr_par' style='position:absolute; top:748px; left:98px; height:37px; width:1013px;' ></span><span class='ocr_line' style='position:absolute; top:748px; left:98px; height:37px; width:1013px;' ></span><span class='ocrx_word' style='position:absolute; top:752px; left:98px; height:28px; width:86px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:751px; left:202px; height:34px; width:98px;'>gehörte</span><span class='ocrx_word' style='position:absolute; top:750px; left:322px; height:27px; width:47px;'>den</span><span class='ocrx_word' style='position:absolute; top:748px; left:395px; height:33px; width:216px;'>Benjaminitern,</span><span class='ocrx_word' style='position:absolute; top:749px; left:635px; height:33px; width:43px;'>lag</span><span class='ocrx_word' style='position:absolute; top:748px; left:702px; height:27px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:749px; left:753px; height:27px; width:45px;'>den</span><span class='ocrx_word' style='position:absolute; top:749px; left:826px; height:35px; width:112px;'>Grenzen</span><span class='ocrx_word' style='position:absolute; top:750px; left:962px; height:33px; width:71px;'>Iuda</span><span class='ocrx_word' style='position:absolute; top:750px; left:1057px; height:28px; width:54px;'>tmd</span><span class='ocr_par' style='position:absolute; top:794px; left:64px; height:76px; width:1048px;' ></span><span class='ocr_line' style='position:absolute; top:794px; left:98px; height:31px; width:134px;' ></span><span class='ocrx_word' style='position:absolute; top:794px; left:98px; height:31px; width:134px;'>Ephraim.</span><span class='ocr_line' style='position:absolute; top:833px; left:64px; height:37px; width:1048px;' ></span><span class='ocrx_word' style='position:absolute; top:834px; left:64px; height:36px; width:355px;'>Atroth.Beth-Ioab,</span><span class='ocrx_word' style='position:absolute; top:836px; left:438px; height:26px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:835px; left:480px; height:27px; width:17px;'>i.</span><span class='ocrx_word' style='position:absolute; top:834px; left:517px; height:27px; width:48px;'>die</span><span class='ocrx_word' style='position:absolute; top:834px; left:584px; height:27px; width:104px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:833px; left:712px; height:28px; width:52px;'>des</span><span class='ocrx_word' style='position:absolute; top:833px; left:784px; height:33px; width:125px;'>Hauses</span><span class='ocrx_word' style='position:absolute; top:834px; left:926px; height:32px; width:94px;'>Ioab.</span><span class='ocrx_word' style='position:absolute; top:835px; left:1050px; height:28px; width:62px;'>Eine</span><span class='ocr_par' style='position:absolute; top:876px; left:101px; height:35px; width:1012px;' ></span><span class='ocr_line' style='position:absolute; top:876px; left:101px; height:35px; width:1012px;' ></span><span class='ocrx_word' style='position:absolute; top:879px; left:101px; height:28px; width:86px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:879px; left:201px; height:27px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:879px; left:249px; height:32px; width:80px;'>Iuda,</span><span class='ocrx_word' style='position:absolute; top:883px; left:350px; height:22px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:878px; left:408px; height:27px; width:37px;'>die</span><span class='ocrx_word' style='position:absolute; top:877px; left:456px; height:32px; width:178px;'>Nachlommen</span><span class='ocrx_word' style='position:absolute; top:876px; left:645px; height:28px; width:97px;'>Salma</span><span class='ocrx_word' style='position:absolute; top:876px; left:762px; height:34px; width:114px;'>gewohnt</span><span class='ocrx_word' style='position:absolute; top:877px; left:887px; height:33px; width:85px;'>haben.</span><span class='ocrx_word' style='position:absolute; top:880px; left:992px; height:24px; width:10px;'>1</span><span class='ocrx_word' style='position:absolute; top:877px; left:1021px; height:34px; width:92px;'>Chron.</span><span class='ocr_par' style='position:absolute; top:923px; left:64px; height:73px; width:1048px;' ></span><span class='ocr_line' style='position:absolute; top:923px; left:96px; height:30px; width:89px;' ></span><span class='ocrx_word' style='position:absolute; top:923px; left:96px; height:30px; width:24px;'>2,</span><span class='ocrx_word' style='position:absolute; top:924px; left:141px; height:25px; width:44px;'>54.</span><span class='ocr_line' style='position:absolute; top:961px; left:64px; height:35px; width:1048px;' ></span><span class='ocrx_word' style='position:absolute; top:962px; left:64px; height:31px; width:148px;'>Attalia.</span><span class='ocrx_word' style='position:absolute; top:963px; left:249px; height:27px; width:63px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:963px; left:330px; height:27px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:962px; left:428px; height:26px; width:27px;'>in</span><span class='ocrx_word' style='position:absolute; top:961px; left:474px; height:33px; width:163px;'>Pamphilien</span><span class='ocrx_word' style='position:absolute; top:962px; left:665px; height:28px; width:36px;'>od.</span><span class='ocrx_word' style='position:absolute; top:961px; left:720px; height:33px; width:104px;'>Libyen,</span><span class='ocrx_word' style='position:absolute; top:967px; left:848px; height:22px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:962px; left:916px; height:27px; width:88px;'>Attala</span><span class='ocrx_word' style='position:absolute; top:962px; left:1023px; height:34px; width:89px;'>Phila.</span><span class='ocr_par' style='position:absolute; top:1005px; left:62px; height:77px; width:1073px;' ></span><span class='ocr_line' style='position:absolute; top:1005px; left:95px; height:34px; width:499px;' ></span><span class='ocrx_word' style='position:absolute; top:1006px; left:95px; height:33px; width:90px;'>delpho</span><span class='ocrx_word' style='position:absolute; top:1006px; left:206px; height:27px; width:96px;'>erbaut.</span><span class='ocrx_word' style='position:absolute; top:1006px; left:321px; height:31px; width:47px;'>Ap.</span><span class='ocrx_word' style='position:absolute; top:1005px; left:388px; height:33px; width:83px;'>Gesch.</span><span class='ocrx_word' style='position:absolute; top:1006px; left:494px; height:32px; width:39px;'>14,</span><span class='ocrx_word' style='position:absolute; top:1006px; left:553px; height:25px; width:41px;'>25.</span><span class='ocr_line' style='position:absolute; top:1046px; left:62px; height:36px; width:1073px;' ></span><span class='ocrx_word' style='position:absolute; top:1048px; left:62px; height:29px; width:146px;'>Attalus</span><span class='ocrx_word' style='position:absolute; top:1048px; left:255px; height:27px; width:51px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:1046px; left:330px; height:34px; width:81px;'>König</span><span class='ocrx_word' style='position:absolute; top:1047px; left:436px; height:26px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:1046px; left:482px; height:32px; width:112px;'>Mysien,</span><span class='ocrx_word' style='position:absolute; top:1046px; left:623px; height:32px; width:99px;'>welches</span><span class='ocrx_word' style='position:absolute; top:1047px; left:747px; height:26px; width:72px;'>unter</span><span class='ocrx_word' style='position:absolute; top:1046px; left:843px; height:35px; width:129px;'>Phrygien</span><span class='ocrx_word' style='position:absolute; top:1047px; left:997px; height:35px; width:115px;'>gehörte;</span><span class='ocrx_word' style='position:absolute; top:1058px; left:1128px; height:9px; width:7px;'>,</span><span class='ocr_par' style='position:absolute; top:1089px; left:95px; height:36px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1089px; left:95px; height:36px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1093px; left:95px; height:32px; width:112px;'>genannt</span><span class='ocrx_word' style='position:absolute; top:1095px; left:227px; height:22px; width:47px;'>von</span><span class='ocrx_word' style='position:absolute; top:1090px; left:294px; height:29px; width:122px;'>Attale,</span><span class='ocrx_word' style='position:absolute; top:1090px; left:435px; height:30px; width:99px;'>welches</span><span class='ocrx_word' style='position:absolute; top:1089px; left:553px; height:27px; width:38px;'>bei</span><span class='ocrx_word' style='position:absolute; top:1089px; left:610px; height:26px; width:47px;'>den</span><span class='ocrx_word' style='position:absolute; top:1089px; left:676px; height:33px; width:143px;'>Phrygiern</span><span class='ocrx_word' style='position:absolute; top:1089px; left:838px; height:32px; width:79px;'>Kropf</span><span class='ocrx_word' style='position:absolute; top:1090px; left:935px; height:26px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:1090px; left:1012px; height:34px; width:99px;'>Gurgel</span><span class='ocr_par' style='position:absolute; top:1131px; left:94px; height:37px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1131px; left:94px; height:37px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1133px; left:94px; height:35px; width:119px;'>geheißen</span><span class='ocrx_word' style='position:absolute; top:1133px; left:233px; height:32px; width:77px;'>haben</span><span class='ocrx_word' style='position:absolute; top:1131px; left:329px; height:30px; width:51px;'>soll.</span><span class='ocrx_word' style='position:absolute; top:1157px; left:393px; height:4px; width:4px;'>,</span><span class='ocrx_word' style='position:absolute; top:1131px; left:417px; height:28px; width:62px;'>War</span><span class='ocrx_word' style='position:absolute; top:1132px; left:497px; height:26px; width:39px;'>ein</span><span class='ocrx_word' style='position:absolute; top:1132px; left:555px; height:33px; width:82px;'>König</span><span class='ocrx_word' style='position:absolute; top:1132px; left:660px; height:26px; width:40px;'>der</span><span class='ocrx_word' style='position:absolute; top:1132px; left:719px; height:33px; width:170px;'>Pergamener</span><span class='ocrx_word' style='position:absolute; top:1133px; left:907px; height:25px; width:49px;'>und</span><span class='ocrx_word' style='position:absolute; top:1131px; left:976px; height:34px; width:134px;'>Phrvgier.</span><span class='ocr_par' style='position:absolute; top:1175px; left:59px; height:75px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:1175px; left:95px; height:32px; width:237px;' ></span><span class='ocrx_word' style='position:absolute; top:1177px; left:95px; height:24px; width:11px;'>l</span><span class='ocrx_word' style='position:absolute; top:1175px; left:130px; height:27px; width:81px;'>Mack.</span><span class='ocrx_word' style='position:absolute; top:1176px; left:233px; height:31px; width:39px;'>15,</span><span class='ocrx_word' style='position:absolute; top:1176px; left:292px; height:25px; width:40px;'>22.</span><span class='ocr_line' style='position:absolute; top:1216px; left:59px; height:34px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:1217px; left:59px; height:29px; width:87px;'>Ava.</span><span class='ocrx_word' style='position:absolute; top:1217px; left:184px; height:33px; width:40px;'>Ist</span><span class='ocrx_word' style='position:absolute; top:1217px; left:242px; height:26px; width:38px;'>bei</span><span class='ocrx_word' style='position:absolute; top:1218px; left:299px; height:25px; width:45px;'>den</span><span class='ocrx_word' style='position:absolute; top:1217px; left:364px; height:26px; width:68px;'>alten</span><span class='ocrx_word' style='position:absolute; top:1216px; left:453px; height:32px; width:115px;'>Griechen</span><span class='ocrx_word' style='position:absolute; top:1216px; left:587px; height:26px; width:49px;'>Aia</span><span class='ocrx_word' style='position:absolute; top:1216px; left:655px; height:26px; width:36px;'>od.</span><span class='ocrx_word' style='position:absolute; top:1216px; left:711px; height:31px; width:60px;'>Aea,</span><span class='ocrx_word' style='position:absolute; top:1216px; left:790px; height:26px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1216px; left:842px; height:33px; width:151px;'>Hauptstadt</span><span class='ocrx_word' style='position:absolute; top:1217px; left:1010px; height:26px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:1216px; left:1051px; height:29px; width:59px;'>Col»</span><span class='ocr_par' style='position:absolute; top:1258px; left:92px; height:35px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1258px; left:92px; height:35px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1261px; left:92px; height:32px; width:73px;'>chide,</span><span class='ocrx_word' style='position:absolute; top:1265px; left:186px; height:21px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:1260px; left:244px; height:25px; width:79px;'>Aetas</span><span class='ocrx_word' style='position:absolute; top:1258px; left:341px; height:34px; width:110px;'>regierte.</span><span class='ocrx_word' style='position:absolute; top:1258px; left:494px; height:33px; width:99px;'>Colchis</span><span class='ocrx_word' style='position:absolute; top:1258px; left:612px; height:33px; width:66px;'>heißt</span><span class='ocrx_word' style='position:absolute; top:1258px; left:697px; height:34px; width:115px;'>heutiges</span><span class='ocrx_word' style='position:absolute; top:1258px; left:833px; height:34px; width:83px;'>Tages</span><span class='ocrx_word' style='position:absolute; top:1258px; left:938px; height:35px; width:170px;'>Mengrelicn,</span><span class='ocr_par' style='position:absolute; top:1300px; left:92px; height:35px; width:1017px;' ></span><span class='ocr_line' style='position:absolute; top:1300px; left:92px; height:35px; width:1017px;' ></span><span class='ocrx_word' style='position:absolute; top:1303px; left:92px; height:27px; width:39px;'>die</span><span class='ocrx_word' style='position:absolute; top:1303px; left:160px; height:32px; width:98px;'>meisten</span><span class='ocrx_word' style='position:absolute; top:1302px; left:277px; height:30px; width:153px;'>Einwohner</span><span class='ocrx_word' style='position:absolute; top:1300px; left:455px; height:33px; width:50px;'>sind</span><span class='ocrx_word' style='position:absolute; top:1300px; left:531px; height:34px; width:122px;'>Christen.</span><span class='ocrx_word' style='position:absolute; top:1300px; left:698px; height:28px; width:57px;'>Von</span><span class='ocrx_word' style='position:absolute; top:1300px; left:780px; height:32px; width:51px;'>hier</span><span class='ocrx_word' style='position:absolute; top:1302px; left:855px; height:26px; width:101px;'>wurden</span><span class='ocrx_word' style='position:absolute; top:1302px; left:980px; height:26px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1301px; left:1037px; height:28px; width:72px;'>Leute</span><span class='ocr_par' style='position:absolute; top:1342px; left:92px; height:36px; width:1018px;' ></span><span class='ocr_line' style='position:absolute; top:1342px; left:92px; height:36px; width:1018px;' ></span><span class='ocrx_word' style='position:absolute; top:1349px; left:92px; height:22px; width:52px;'>von</span><span class='ocrx_word' style='position:absolute; top:1344px; left:165px; height:32px; width:182px;'>Salmanasscr</span><span class='ocrx_word' style='position:absolute; top:1344px; left:371px; height:31px; width:57px;'>nach</span><span class='ocrx_word' style='position:absolute; top:1343px; left:454px; height:27px; width:128px;'>Samaria</span><span class='ocrx_word' style='position:absolute; top:1343px; left:606px; height:35px; width:110px;'>gesührt,</span><span class='ocrx_word' style='position:absolute; top:1347px; left:741px; height:22px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:1342px; left:804px; height:33px; width:31px;'>sie</span><span class='ocrx_word' style='position:absolute; top:1343px; left:859px; height:32px; width:58px;'>noch</span><span class='ocrx_word' style='position:absolute; top:1343px; left:942px; height:33px; width:51px;'>ihre</span><span class='ocrx_word' style='position:absolute; top:1344px; left:1019px; height:27px; width:91px;'>Götter</span><span class='ocr_par' style='position:absolute; top:1386px; left:58px; height:76px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:1386px; left:93px; height:33px; width:782px;' ></span><span class='ocrx_word' style='position:absolute; top:1387px; left:93px; height:32px; width:118px;'>Nibehas</span><span class='ocrx_word' style='position:absolute; top:1387px; left:231px; height:26px; width:48px;'>und</span><span class='ocrx_word' style='position:absolute; top:1386px; left:298px; height:32px; width:123px;'>Tharthac</span><span class='ocrx_word' style='position:absolute; top:1386px; left:440px; height:27px; width:138px;'>anbeteten.</span><span class='ocrx_word' style='position:absolute; top:1388px; left:597px; height:24px; width:15px;'>2</span><span class='ocrx_word' style='position:absolute; top:1387px; left:630px; height:26px; width:64px;'>Kön.</span><span class='ocrx_word' style='position:absolute; top:1388px; left:716px; height:28px; width:38px;'>l7,</span><span class='ocrx_word' style='position:absolute; top:1386px; left:775px; height:27px; width:41px;'>24.</span><span class='ocrx_word' style='position:absolute; top:1387px; left:835px; height:26px; width:40px;'>31.</span><span class='ocr_line' style='position:absolute; top:1428px; left:58px; height:34px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:1428px; left:58px; height:30px; width:117px;'>Aven.</span><span class='ocrx_word' style='position:absolute; top:1429px; left:213px; height:33px; width:101px;'>Götze,</span><span class='ocrx_word' style='position:absolute; top:1428px; left:339px; height:27px; width:163px;'>Eitelleit.</span><span class='ocrx_word' style='position:absolute; top:1428px; left:538px; height:27px; width:42px;'>So</span><span class='ocrx_word' style='position:absolute; top:1429px; left:605px; height:26px; width:60px;'>wird</span><span class='ocrx_word' style='position:absolute; top:1428px; left:690px; height:33px; width:88px;'>Bethel</span><span class='ocrx_word' style='position:absolute; top:1429px; left:802px; height:33px; width:118px;'>genannt.</span><span class='ocrx_word' style='position:absolute; top:1428px; left:939px; height:34px; width:56px;'>Hos.</span><span class='ocrx_word' style='position:absolute; top:1431px; left:1023px; height:29px; width:38px;'>10,</span><span class='ocrx_word' style='position:absolute; top:1431px; left:1086px; height:25px; width:23px;'>8.</span><span class='ocr_par' style='position:absolute; top:1471px; left:92px; height:34px; width:1018px;' ></span><span class='ocr_line' style='position:absolute; top:1471px; left:92px; height:34px; width:1018px;' ></span><span class='ocrx_word' style='position:absolute; top:1478px; left:92px; height:27px; width:88px;'>wegen</span><span class='ocrx_word' style='position:absolute; top:1472px; left:199px; height:26px; width:42px;'>der</span><span class='ocrx_word' style='position:absolute; top:1471px; left:261px; height:33px; width:104px;'>Götzen,</span><span class='ocrx_word' style='position:absolute; top:1471px; left:390px; height:26px; width:39px;'>die</span><span class='ocrx_word' style='position:absolute; top:1471px; left:456px; height:32px; width:100px;'>daselbst</span><span class='ocrx_word' style='position:absolute; top:1476px; left:579px; height:21px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:1472px; left:651px; height:25px; width:43px;'>den</span><span class='ocrx_word' style='position:absolute; top:1471px; left:715px; height:32px; width:137px;'>Israeliten</span><span class='ocrx_word' style='position:absolute; top:1471px; left:877px; height:32px; width:96px;'>verehrt</span><span class='ocrx_word' style='position:absolute; top:1472px; left:1000px; height:26px; width:110px;'>wurden.</span><span class='ocr_par' style='position:absolute; top:1513px; left:91px; height:35px; width:1019px;' ></span><span class='ocr_line' style='position:absolute; top:1513px; left:91px; height:35px; width:1019px;' ></span><span class='ocrx_word' style='position:absolute; top:1515px; left:91px; height:26px; width:58px;'>Mit</span><span class='ocrx_word' style='position:absolute; top:1515px; left:167px; height:26px; width:53px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1520px; left:240px; height:28px; width:92px;'>ganzen</span><span class='ocrx_word' style='position:absolute; top:1513px; left:352px; height:27px; width:109px;'>Namen:</span><span class='ocrx_word' style='position:absolute; top:1513px; left:482px; height:31px; width:158px;'>Beth»Aven,</span><span class='ocrx_word' style='position:absolute; top:1513px; left:658px; height:27px; width:50px;'>das</span><span class='ocrx_word' style='position:absolute; top:1513px; left:726px; height:35px; width:167px;'>Götzenhaus,</span><span class='ocrx_word' style='position:absolute; top:1513px; left:914px; height:33px; width:65px;'>oder,</span><span class='ocrx_word' style='position:absolute; top:1514px; left:997px; height:26px; width:32px;'>da</span><span class='ocrx_word' style='position:absolute; top:1520px; left:1048px; height:21px; width:62px;'>man</span><span class='ocr_par' style='position:absolute; top:1555px; left:56px; height:78px; width:1054px;' ></span><span class='ocr_line' style='position:absolute; top:1555px; left:91px; height:33px; width:540px;' ></span><span class='ocrx_word' style='position:absolute; top:1558px; left:91px; height:26px; width:58px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1557px; left:169px; height:26px; width:85px;'>Eiteln</span><span class='ocrx_word' style='position:absolute; top:1556px; left:275px; height:31px; width:178px;'>nachwandelt.</span><span class='ocrx_word' style='position:absolute; top:1555px; left:473px; height:33px; width:59px;'>Hos.</span><span class='ocrx_word' style='position:absolute; top:1558px; left:549px; height:26px; width:22px;'>4,</span><span class='ocrx_word' style='position:absolute; top:1558px; left:593px; height:23px; width:38px;'>15.</span><span class='ocr_line' style='position:absolute; top:1597px; left:56px; height:36px; width:1054px;' ></span><span class='ocrx_word' style='position:absolute; top:1597px; left:56px; height:36px; width:186px;'>Augustus.</span><span class='ocrx_word' style='position:absolute; top:1597px; left:287px; height:34px; width:132px;'>Würdig</span><span class='ocrx_word' style='position:absolute; top:1598px; left:448px; height:32px; width:129px;'>verehrt</span><span class='ocrx_word' style='position:absolute; top:1598px; left:608px; height:26px; width:60px;'>und</span><span class='ocrx_word' style='position:absolute; top:1599px; left:704px; height:33px; width:172px;'>angebetet</span><span class='ocrx_word' style='position:absolute; top:1605px; left:908px; height:27px; width:36px;'>zu</span><span class='ocrx_word' style='position:absolute; top:1599px; left:978px; height:28px; width:132px;'>werden.</span><span class='ocr_par' style='position:absolute; top:1640px; left:92px; height:34px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1640px; left:92px; height:34px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1640px; left:92px; height:34px; width:97px;'>Diesen</span><span class='ocrx_word' style='position:absolute; top:1640px; left:211px; height:27px; width:100px;'>Namen</span><span class='ocrx_word' style='position:absolute; top:1641px; left:340px; height:33px; width:46px;'>gab</span><span class='ocrx_word' style='position:absolute; top:1641px; left:413px; height:26px; width:46px;'>das</span><span class='ocrx_word' style='position:absolute; top:1640px; left:487px; height:32px; width:109px;'>romische</span><span class='ocrx_word' style='position:absolute; top:1640px; left:616px; height:27px; width:62px;'>Voll</span><span class='ocrx_word' style='position:absolute; top:1641px; left:706px; height:26px; width:52px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1641px; left:781px; height:31px; width:88px;'>Kaiser</span><span class='ocrx_word' style='position:absolute; top:1641px; left:887px; height:31px; width:143px;'>Octavian,</span><span class='ocrx_word' style='position:absolute; top:1642px; left:1058px; height:26px; width:50px;'>und</span><span class='ocr_par' style='position:absolute; top:1682px; left:93px; height:34px; width:1015px;' ></span><span class='ocr_line' style='position:absolute; top:1682px; left:93px; height:34px; width:1015px;' ></span><span class='ocrx_word' style='position:absolute; top:1683px; left:93px; height:27px; width:49px;'>alle</span><span class='ocrx_word' style='position:absolute; top:1683px; left:161px; height:32px; width:130px;'>romischen</span><span class='ocrx_word' style='position:absolute; top:1683px; left:310px; height:32px; width:86px;'>Kaiser</span><span class='ocrx_word' style='position:absolute; top:1683px; left:416px; height:30px; width:79px;'>haben</span><span class='ocrx_word' style='position:absolute; top:1682px; left:514px; height:32px; width:80px;'>diesen</span><span class='ocrx_word' style='position:absolute; top:1682px; left:614px; height:27px; width:95px;'>Namen</span><span class='ocrx_word' style='position:absolute; top:1683px; left:728px; height:33px; width:170px;'>beibehalten,</span><span class='ocrx_word' style='position:absolute; top:1682px; left:917px; height:33px; width:47px;'>daß</span><span class='ocrx_word' style='position:absolute; top:1682px; left:983px; height:33px; width:31px;'>sie</span><span class='ocrx_word' style='position:absolute; top:1692px; left:1033px; height:18px; width:75px;'>«au,-</span><span class='ocr_par' style='position:absolute; top:1724px; left:55px; height:119px; width:1052px;' ></span><span class='ocr_line' style='position:absolute; top:1724px; left:90px; height:35px; width:907px;' ></span><span class='ocrx_word' style='position:absolute; top:1733px; left:90px; height:25px; width:52px;'>per</span><span class='ocrx_word' style='position:absolute; top:1727px; left:160px; height:31px; width:124px;'>2ußr>«ti,</span><span class='ocrx_word' style='position:absolute; top:1726px; left:304px; height:25px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:1724px; left:345px; height:26px; width:15px;'>i,</span><span class='ocrx_word' style='position:absolute; top:1725px; left:382px; height:32px; width:80px;'>allzeit</span><span class='ocrx_word' style='position:absolute; top:1725px; left:482px; height:31px; width:99px;'>Mehrer</span><span class='ocrx_word' style='position:absolute; top:1725px; left:600px; height:26px; width:43px;'>des</span><span class='ocrx_word' style='position:absolute; top:1724px; left:664px; height:32px; width:86px;'>Reichs</span><span class='ocrx_word' style='position:absolute; top:1725px; left:770px; height:34px; width:115px;'>geheißen</span><span class='ocrx_word' style='position:absolute; top:1725px; left:904px; height:33px; width:93px;'>haben.</span><span class='ocr_line' style='position:absolute; top:1766px; left:55px; height:34px; width:897px;' ></span><span class='ocrx_word' style='position:absolute; top:1766px; left:55px; height:34px; width:121px;'>Avith.</span><span class='ocrx_word' style='position:absolute; top:1767px; left:212px; height:32px; width:112px;'>Haufe.</span><span class='ocrx_word' style='position:absolute; top:1766px; left:361px; height:27px; width:63px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:1766px; left:443px; height:28px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:1768px; left:542px; height:25px; width:27px;'>in</span><span class='ocrx_word' style='position:absolute; top:1767px; left:587px; height:32px; width:122px;'>Idumäa.</span><span class='ocrx_word' style='position:absolute; top:1769px; left:732px; height:24px; width:10px;'>1</span><span class='ocrx_word' style='position:absolute; top:1767px; left:763px; height:32px; width:68px;'>Mos.</span><span class='ocrx_word' style='position:absolute; top:1769px; left:849px; height:29px; width:43px;'>36,</span><span class='ocrx_word' style='position:absolute; top:1769px; left:910px; height:26px; width:42px;'>35.</span><span class='ocr_line' style='position:absolute; top:1809px; left:57px; height:34px; width:1050px;' ></span><span class='ocrx_word' style='position:absolute; top:1809px; left:57px; height:30px; width:125px;'>Aulon.</span><span class='ocrx_word' style='position:absolute; top:1809px; left:236px; height:34px; width:209px;'>Ausgehöhlt.</span><span class='ocrx_word' style='position:absolute; top:1809px; left:491px; height:27px; width:62px;'>Das</span><span class='ocrx_word' style='position:absolute; top:1809px; left:581px; height:34px; width:72px;'>große</span><span class='ocrx_word' style='position:absolute; top:1809px; left:681px; height:32px; width:76px;'>Thal,</span><span class='ocrx_word' style='position:absolute; top:1810px; left:791px; height:27px; width:80px;'>worin</span><span class='ocrx_word' style='position:absolute; top:1810px; left:897px; height:27px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1809px; left:962px; height:34px; width:145px;'>berühmten</span><span class='ocr_par' style='position:absolute; top:1851px; left:89px; height:36px; width:1017px;' ></span><span class='ocr_line' style='position:absolute; top:1851px; left:89px; height:36px; width:1017px;' ></span><span class='ocrx_word' style='position:absolute; top:1853px; left:89px; height:29px; width:97px;'>Städte</span><span class='ocrx_word' style='position:absolute; top:1852px; left:204px; height:34px; width:111px;'>Vethsan</span><span class='ocrx_word' style='position:absolute; top:1852px; left:334px; height:27px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:1852px; left:409px; height:34px; width:179px;'>Scythopolis,</span><span class='ocrx_word' style='position:absolute; top:1851px; left:605px; height:34px; width:127px;'>Tlberias,</span><span class='ocrx_word' style='position:absolute; top:1852px; left:751px; height:35px; width:111px;'>Iericho,</span><span class='ocrx_word' style='position:absolute; top:1851px; left:881px; height:29px; width:48px;'>das</span><span class='ocrx_word' style='position:absolute; top:1853px; left:949px; height:27px; width:64px;'>todte</span><span class='ocrx_word' style='position:absolute; top:1852px; left:1033px; height:28px; width:73px;'>Meer</span></div>
metadata CHANGED
@@ -1,82 +1,95 @@
1
- --- !ruby/object:Gem::Specification
1
+ --- !ruby/object:Gem::Specification
2
2
  name: rhocr
3
- version: !ruby/object:Gem::Version
3
+ version: !ruby/object:Gem::Version
4
+ version: '0.1'
4
5
  prerelease:
5
- version: 0.0.3
6
6
  platform: ruby
7
- authors:
7
+ authors:
8
8
  - Andreas Neumann
9
9
  autorequire:
10
10
  bindir: bin
11
11
  cert_chain: []
12
-
13
- date: 2011-07-03 00:00:00 +02:00
14
- default_executable:
15
- dependencies: []
16
-
12
+ date: 2011-09-08 00:00:00.000000000Z
13
+ dependencies:
14
+ - !ruby/object:Gem::Dependency
15
+ name: nokogiri
16
+ requirement: &70276550001820 !ruby/object:Gem::Requirement
17
+ none: false
18
+ requirements:
19
+ - - ! '>='
20
+ - !ruby/object:Gem::Version
21
+ version: '0'
22
+ type: :runtime
23
+ prerelease: false
24
+ version_requirements: *70276550001820
17
25
  description: Manipulate and use OCR data encode in HOCR
18
- email: info @nospam@ an-it.com
26
+ email: andreas@neumann.biz
19
27
  executables: []
20
-
21
28
  extensions: []
22
-
23
- extra_rdoc_files:
29
+ extra_rdoc_files:
24
30
  - README
25
- - lib/ocr_box.rb
31
+ - TODO.txt
32
+ - lib/hocr_box.rb
33
+ - lib/ocr_document.rb
34
+ - lib/ocr_element.rb
26
35
  - lib/ocr_page.rb
27
- - lib/ocrx_word.rb
28
36
  - lib/rhocr.rb
29
- files:
37
+ files:
30
38
  - Manifest
31
39
  - README
32
40
  - Rakefile
41
+ - TODO.txt
42
+ - data/Seite_Die_Gartenlaube_242.html
33
43
  - data/Seite_Tagebuch_H_C_Lang_08.html
44
+ - data/Seite_Tagebuch_H_C_Lang_08.jpg
45
+ - data/test.html
46
+ - data/test.png
34
47
  - example/example_server.rb
35
48
  - example/public/OCRTest.css
36
49
  - example/public/OCRTest.html
37
50
  - example/public/OCRTest_marker.js
38
- - example/public/img/Seite_Tagebuch_H_C_Lang_05.jpg
51
+ - example/public/Seite_Tagebuch_H_C_Lang_08.jpg
39
52
  - example/public/img/Seite_Tagebuch_H_C_Lang_08.jpg
40
- - lib/ocr_box.rb
53
+ - lib/hocr_box.rb
54
+ - lib/ocr_document.rb
55
+ - lib/ocr_element.rb
41
56
  - lib/ocr_page.rb
42
- - lib/ocrx_word.rb
43
57
  - lib/rhocr.rb
44
58
  - rhocr.gemspec
45
- - rspec/ocr_box_spec.rb
46
- - rspec/ocr_page_spec.rb
47
- - rspec/ocrx_word_spec.rb
48
- has_rdoc: true
59
+ - spec/hocr_box_spec.rb
60
+ - spec/ocr_document_spec.rb
61
+ - spec/ocr_element_spec.rb
62
+ - spec/ocr_page_spec.rb
63
+ - spec/rhocr_spec.rb
64
+ - test.html
49
65
  homepage: http://github.com/daandi/rhocr
50
66
  licenses: []
51
-
52
67
  post_install_message:
53
- rdoc_options:
68
+ rdoc_options:
54
69
  - --line-numbers
55
70
  - --inline-source
56
71
  - --title
57
72
  - Rhocr
58
73
  - --main
59
74
  - README
60
- require_paths:
75
+ require_paths:
61
76
  - lib
62
- required_ruby_version: !ruby/object:Gem::Requirement
77
+ required_ruby_version: !ruby/object:Gem::Requirement
63
78
  none: false
64
- requirements:
65
- - - ">="
66
- - !ruby/object:Gem::Version
67
- version: "0"
68
- required_rubygems_version: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - ! '>='
81
+ - !ruby/object:Gem::Version
82
+ version: '0'
83
+ required_rubygems_version: !ruby/object:Gem::Requirement
69
84
  none: false
70
- requirements:
71
- - - ">="
72
- - !ruby/object:Gem::Version
73
- version: "1.2"
85
+ requirements:
86
+ - - ! '>='
87
+ - !ruby/object:Gem::Version
88
+ version: '1.2'
74
89
  requirements: []
75
-
76
90
  rubyforge_project: rhocr
77
- rubygems_version: 1.6.2
91
+ rubygems_version: 1.8.6
78
92
  signing_key:
79
93
  specification_version: 3
80
94
  summary: Manipulate and use OCR data encode in HOCR
81
95
  test_files: []
82
-
data/lib/ocr_box.rb DELETED
@@ -1,43 +0,0 @@
1
- #coding: utf-8
2
-
3
- class OCRBox
4
-
5
- attr_reader :x1, :y1, :x2, :y2
6
-
7
- def initialize(x1, y1 , x2, y2)
8
- @x1 = x1
9
- @y1 = y1
10
- @x2 = x2
11
- @y2 = y2
12
- end
13
-
14
- def encloses?(element)
15
- @x1 <= element.x1 and
16
- @x2 >= element.x2 and
17
- @y1 <= element.y1 and
18
- @y2 >= element.y2
19
- end
20
-
21
- def enclosed_by?(element)
22
- return element.encloses? self
23
- end
24
-
25
- def to_s
26
- "tl->(x:#{@x1} y:#{@y1})/br->:(x:#{@x2} y:#{@y2})"
27
- end
28
-
29
- def to_css_style
30
- top = @y1
31
- left = @x1
32
- height = @y2 - @y1
33
- width = @x2 - @x1
34
-
35
- "position:absolute; top:#{top}px; left:#{left}px; height:#{height}px; width:#{width}px;"
36
- end
37
-
38
- def to_json
39
-
40
- end
41
-
42
- end
43
-
data/lib/ocrx_word.rb DELETED
@@ -1,23 +0,0 @@
1
- #coding: utf-8
2
-
3
- require 'cgi'
4
- require_relative 'ocr_box'
5
-
6
- class OCRXWord < OCRBox
7
-
8
- attr_reader :text
9
-
10
- def initialize(x1,y1,x2,y2,word)
11
- super(x1.to_i, y1.to_i, x2.to_i, y2.to_i)
12
- @text = word
13
- end
14
-
15
- def to_html(css_class = 'ocrx_word')
16
- "<span style='#{ to_css_style }' class='#{css_class}'><span class='word'>" + CGI::escapeHTML(@text) +"</span></span>"
17
- end
18
-
19
- def to_s
20
- "#{@text}\t#{super}"
21
- end
22
-
23
- end
@@ -1,48 +0,0 @@
1
- #coding: utf-8
2
-
3
- require_relative '../lib/ocr_box'
4
-
5
- describe OCRBox do
6
-
7
- before(:each) do
8
- @box ||= OCRBox.new(1,2,20,8)
9
- end
10
-
11
- describe "#to_s" do
12
- it "prints a human readable Box-Version with coordinates upper_left(x,y) bottom_right(x,y)" do
13
- @box.to_s.should == "tl->(x:1 y:2)/br->:(x:20 y:8)"
14
- end
15
- end
16
-
17
- describe '#encloses?(element)' do
18
- it "tests wather given OCRBox is enclosed by the current OCRBox" do
19
- @box.encloses?( OCRBox.new(0,3,19,7) ).should be_false
20
- @box.encloses?( OCRBox.new(2,3,19,7) ).should be_true
21
- end
22
- it "encloses also itself" do
23
- @box.encloses?( @box ).should be_true
24
- end
25
- end
26
-
27
- describe '#to_css_style' do
28
- it 'should create css-style attributes' do
29
- @box.to_css_style.should == 'position:absolute; top:2px; left:1px; height:6px; width:19px;'
30
- end
31
- end
32
-
33
- describe '#enclosed_by?(element)' do
34
- it 'should be enclosed by Boxes bigger than itself' do
35
- @box.enclosed_by?( OCRBox.new(0,1,21,9) ).should be_true
36
- end
37
- it 'should not be enclosed by Boxes smaller than itself' do
38
- @box.enclosed_by?( OCRBox.new(2,3,19,7) ).should be_false
39
- end
40
- it 'should be enclosed by Boxes of the same size' do
41
- @box.enclosed_by?( @box ).should be_true
42
- end
43
- end
44
-
45
-
46
-
47
-
48
- end
@@ -1,17 +0,0 @@
1
- #coding: utf-8
2
-
3
- require_relative '../lib/ocr_page'
4
-
5
- describe OCRPage do
6
-
7
- before(:each) do
8
- @ocr_page ||= OCRPage.new('../data/Seite_Tagebuch_H_C_Lang_08.html')
9
- end
10
-
11
- describe '' do
12
- it '' do
13
- p @ocr_page.enclosed_words( OCRBox.new(500,1703,1200,1800) )
14
- end
15
- end
16
-
17
- end
@@ -1,32 +0,0 @@
1
- #coding: utf-8
2
-
3
- require_relative '../lib/ocrx_word'
4
-
5
- describe OCRXWord do
6
-
7
- before(:each) do
8
- @ocrx_word = OCRXWord.new(10,15,20,20,'WORT')
9
- end
10
-
11
- describe '#to_s' do
12
- it 'should print the coordinates of the box and the textual information' do
13
- p @ocrx_word
14
- @ocrx_word.to_s.should == "WORT\ttl->(x:10 y:15)/br->:(x:20 y:20)"
15
- end
16
- end
17
-
18
- describe '#to_html(css_class)' do
19
- it 'should create an span elment to overlay an image on an html-page' do
20
- @ocrx_word.to_html.should == "<span style='position:absolute; top:15px; left:10px; height:5px; width:10px;' class='ocrx_word'><span class='word'>WORT</span></span>"
21
- end
22
-
23
- it 'no css_class_class given should default to ocrx_word' do
24
- @ocrx_word.to_html.should =~ /class='ocrx_word'/
25
- end
26
-
27
- it 'css_class given should be part of genearted html' do
28
- @ocrx_word.to_html('rosebud').should =~ /class='rosebud'/
29
- end
30
- end
31
-
32
- end