rhocr 0.0.3 → 0.1
Sign up to get free protection for your applications and to get access to all the features.
- data/Manifest +15 -6
- data/Rakefile +3 -3
- data/TODO.txt +42 -0
- data/data/Seite_Die_Gartenlaube_242.html +42 -0
- data/data/Seite_Tagebuch_H_C_Lang_08.jpg +0 -0
- data/data/test.html +71 -0
- data/data/test.png +0 -0
- data/example/example_server.rb +2 -2
- data/example/public/Seite_Tagebuch_H_C_Lang_08.jpg +0 -0
- data/lib/hocr_box.rb +67 -0
- data/lib/ocr_document.rb +50 -0
- data/lib/ocr_element.rb +149 -0
- data/lib/ocr_page.rb +80 -25
- data/lib/rhocr.rb +30 -1
- data/rhocr.gemspec +12 -9
- data/spec/hocr_box_spec.rb +94 -0
- data/spec/ocr_document_spec.rb +80 -0
- data/spec/ocr_element_spec.rb +86 -0
- data/spec/ocr_page_spec.rb +116 -0
- data/spec/rhocr_spec.rb +34 -0
- data/test.html +1 -0
- metadata +52 -39
- data/example/public/img/Seite_Tagebuch_H_C_Lang_05.jpg +0 -0
- data/lib/ocr_box.rb +0 -43
- data/lib/ocrx_word.rb +0 -23
- data/rspec/ocr_box_spec.rb +0 -48
- data/rspec/ocr_page_spec.rb +0 -17
- data/rspec/ocrx_word_spec.rb +0 -32
data/test.html
ADDED
@@ -0,0 +1 @@
|
|
1
|
+
<div class='ocr_page' style='position:absolute; top:0px; left:0px; height:1326px; width:1326px;;background-image: url(data/test.png); width:1326px; height:1326>px ;'><span class='ocrx_block' style='position:absolute; top:32px; left:55px; height:1855px; width:1080px;' ></span><span class='ocr_par' style='position:absolute; top:32px; left:432px; height:39px; width:685px;' ></span><span class='ocr_line' style='position:absolute; top:32px; left:432px; height:39px; width:685px;' ></span><span class='ocrx_word' style='position:absolute; top:32px; left:432px; height:35px; width:156px;'>Athenobius</span><span class='ocrx_word' style='position:absolute; top:48px; left:606px; height:6px; width:34px;'>—</span><span class='ocrx_word' style='position:absolute; top:34px; left:657px; height:28px; width:92px;'>Aulon.</span><span class='ocrx_word' style='position:absolute; top:37px; left:1074px; height:34px; width:43px;'>29</span><span class='ocr_par' style='position:absolute; top:109px; left:79px; height:80px; width:1040px;' ></span><span class='ocr_line' style='position:absolute; top:109px; left:79px; height:36px; width:1040px;' ></span><span class='ocrx_word' style='position:absolute; top:109px; left:79px; height:35px; width:215px;'>Athenobius,</span><span class='ocrx_word' style='position:absolute; top:112px; left:334px; height:27px; width:64px;'>Der</span><span class='ocrx_word' style='position:absolute; top:115px; left:417px; height:24px; width:59px;'>von</span><span class='ocrx_word' style='position:absolute; top:112px; left:494px; height:27px; width:51px;'>der</span><span class='ocrx_word' style='position:absolute; top:112px; left:565px; height:28px; width:122px;'>Göttin</span><span class='ocrx_word' style='position:absolute; top:112px; left:707px; height:28px; width:150px;'>Minerva</span><span class='ocrx_word' style='position:absolute; top:112px; left:876px; height:33px; width:78px;'>lebt,</span><span class='ocrx_word' style='position:absolute; top:112px; left:974px; height:28px; width:69px;'>oder:</span><span class='ocrx_word' style='position:absolute; top:112px; left:1062px; height:28px; width:57px;'>Mi»</span><span class='ocr_line' style='position:absolute; top:155px; left:108px; height:34px; width:192px;' ></span><span class='ocrx_word' style='position:absolute; top:159px; left:108px; height:23px; width:75px;'>nerva</span><span class='ocrx_word' style='position:absolute; top:155px; left:201px; height:34px; width:99px;'>Bogen.</span><span class='ocr_par' style='position:absolute; top:196px; left:74px; height:120px; width:1043px;' ></span><span class='ocr_line' style='position:absolute; top:196px; left:160px; height:36px; width:957px;' ></span><span class='ocrx_word' style='position:absolute; top:198px; left:160px; height:27px; width:54px;'>Des</span><span class='ocrx_word' style='position:absolute; top:197px; left:242px; height:33px; width:98px;'>Königs</span><span class='ocrx_word' style='position:absolute; top:196px; left:367px; height:34px; width:136px;'>Antiochus</span><span class='ocrx_word' style='position:absolute; top:197px; left:531px; height:33px; width:95px;'>Freund</span><span class='ocrx_word' style='position:absolute; top:197px; left:655px; height:28px; width:58px;'>oder</span><span class='ocrx_word' style='position:absolute; top:196px; left:739px; height:36px; width:119px;'>geheimer</span><span class='ocrx_word' style='position:absolute; top:196px; left:885px; height:34px; width:78px;'>Nath.</span><span class='ocrx_word' style='position:absolute; top:199px; left:994px; height:25px; width:11px;'>l</span><span class='ocrx_word' style='position:absolute; top:197px; left:1033px; height:29px; width:84px;'>Mack.</span><span class='ocr_line' style='position:absolute; top:241px; left:109px; height:33px; width:97px;' ></span><span class='ocrx_word' style='position:absolute; top:241px; left:109px; height:33px; width:38px;'>15,</span><span class='ocrx_word' style='position:absolute; top:242px; left:166px; height:25px; width:40px;'>28.</span><span class='ocr_line' style='position:absolute; top:281px; left:74px; height:35px; width:1042px;' ></span><span class='ocrx_word' style='position:absolute; top:281px; left:74px; height:34px; width:131px;'>Athlai.</span><span class='ocrx_word' style='position:absolute; top:284px; left:242px; height:26px; width:68px;'>Dee</span><span class='ocrx_word' style='position:absolute; top:282px; left:337px; height:33px; width:80px;'>Herr</span><span class='ocrx_word' style='position:absolute; top:281px; left:440px; height:34px; width:158px;'>zerreißet</span><span class='ocrx_word' style='position:absolute; top:282px; left:625px; height:28px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:282px; left:706px; height:34px; width:158px;'>zerbricht.</span><span class='ocrx_word' style='position:absolute; top:282px; left:898px; height:28px; width:77px;'>Einer</span><span class='ocrx_word' style='position:absolute; top:286px; left:999px; height:24px; width:51px;'>von</span><span class='ocrx_word' style='position:absolute; top:282px; left:1069px; height:28px; width:47px;'>den</span><span class='ocr_par' style='position:absolute; top:324px; left:74px; height:77px; width:1040px;' ></span><span class='ocr_line' style='position:absolute; top:324px; left:107px; height:33px; width:487px;' ></span><span class='ocrx_word' style='position:absolute; top:325px; left:107px; height:32px; width:174px;'>Nachlommen</span><span class='ocrx_word' style='position:absolute; top:324px; left:300px; height:28px; width:92px;'>Bebai.</span><span class='ocrx_word' style='position:absolute; top:324px; left:410px; height:32px; width:62px;'>Esra</span><span class='ocrx_word' style='position:absolute; top:327px; left:496px; height:28px; width:37px;'>10,</span><span class='ocrx_word' style='position:absolute; top:326px; left:553px; height:25px; width:41px;'>28.</span><span class='ocr_line' style='position:absolute; top:366px; left:74px; height:35px; width:1040px;' ></span><span class='ocrx_word' style='position:absolute; top:366px; left:74px; height:34px; width:115px;'>Athni.</span><span class='ocrx_word' style='position:absolute; top:368px; left:217px; height:27px; width:79px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:367px; left:315px; height:34px; width:135px;'>Trübsal</span><span class='ocrx_word' style='position:absolute; top:372px; left:469px; height:22px; width:59px;'>von</span><span class='ocrx_word' style='position:absolute; top:366px; left:548px; height:28px; width:90px;'>Gott.</span><span class='ocrx_word' style='position:absolute; top:366px; left:673px; height:28px; width:49px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:366px; left:742px; height:34px; width:77px;'>Sohn</span><span class='ocrx_word' style='position:absolute; top:366px; left:838px; height:34px; width:116px;'>Semaja.</span><span class='ocrx_word' style='position:absolute; top:369px; left:986px; height:25px; width:12px;'>1</span><span class='ocrx_word' style='position:absolute; top:368px; left:1018px; height:32px; width:96px;'>Chron.</span><span class='ocr_par' style='position:absolute; top:412px; left:71px; height:76px; width:1041px;' ></span><span class='ocr_line' style='position:absolute; top:412px; left:104px; height:28px; width:83px;' ></span><span class='ocrx_word' style='position:absolute; top:412px; left:104px; height:28px; width:40px;'>27.</span><span class='ocrx_word' style='position:absolute; top:413px; left:163px; height:25px; width:24px;'>7.</span><span class='ocr_line' style='position:absolute; top:451px; left:71px; height:37px; width:1041px;' ></span><span class='ocrx_word' style='position:absolute; top:451px; left:71px; height:34px; width:146px;'>Athniel.</span><span class='ocrx_word' style='position:absolute; top:452px; left:246px; height:27px; width:118px;'>Gottes</span><span class='ocrx_word' style='position:absolute; top:451px; left:384px; height:33px; width:147px;'>Trübsal,</span><span class='ocrx_word' style='position:absolute; top:451px; left:550px; height:28px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:451px; left:591px; height:28px; width:17px;'>i.</span><span class='ocrx_word' style='position:absolute; top:451px; left:627px; height:28px; width:54px;'>eine</span><span class='ocrx_word' style='position:absolute; top:451px; left:699px; height:33px; width:120px;'>Trübsal,</span><span class='ocrx_word' style='position:absolute; top:459px; left:839px; height:20px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:452px; left:908px; height:28px; width:62px;'>Gott</span><span class='ocrx_word' style='position:absolute; top:452px; left:990px; height:36px; width:122px;'>zugesügt.</span><span class='ocr_par' style='position:absolute; top:494px; left:102px; height:34px; width:1008px;' ></span><span class='ocr_line' style='position:absolute; top:494px; left:102px; height:34px; width:1008px;' ></span><span class='ocrx_word' style='position:absolute; top:496px; left:102px; height:27px; width:50px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:495px; left:172px; height:31px; width:76px;'>Sohn</span><span class='ocrx_word' style='position:absolute; top:495px; left:268px; height:30px; width:94px;'>Kenas,</span><span class='ocrx_word' style='position:absolute; top:495px; left:380px; height:26px; width:44px;'>des</span><span class='ocrx_word' style='position:absolute; top:494px; left:445px; height:27px; width:112px;'>Bruders</span><span class='ocrx_word' style='position:absolute; top:494px; left:576px; height:32px; width:89px;'>Kaleb;</span><span class='ocrx_word' style='position:absolute; top:500px; left:693px; height:28px; width:105px;'>gewann</span><span class='ocrx_word' style='position:absolute; top:495px; left:818px; height:33px; width:98px;'>Kiriath</span><span class='ocrx_word' style='position:absolute; top:495px; left:936px; height:33px; width:106px;'>Sepher,</span><span class='ocrx_word' style='position:absolute; top:495px; left:1061px; height:28px; width:49px;'>und</span><span class='ocr_par' style='position:absolute; top:535px; left:68px; height:79px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:535px; left:100px; height:35px; width:937px;' ></span><span class='ocrx_word' style='position:absolute; top:538px; left:100px; height:27px; width:80px;'>damit</span><span class='ocrx_word' style='position:absolute; top:537px; left:199px; height:33px; width:82px;'>Achsa.</span><span class='ocrx_word' style='position:absolute; top:538px; left:300px; height:26px; width:36px;'>die</span><span class='ocrx_word' style='position:absolute; top:537px; left:356px; height:32px; width:98px;'>Tochter</span><span class='ocrx_word' style='position:absolute; top:535px; left:472px; height:32px; width:81px;'>seines</span><span class='ocrx_word' style='position:absolute; top:537px; left:574px; height:27px; width:100px;'>Betters</span><span class='ocrx_word' style='position:absolute; top:537px; left:694px; height:27px; width:86px;'>Kaleb.</span><span class='ocrx_word' style='position:absolute; top:536px; left:800px; height:34px; width:77px;'>Nicht,</span><span class='ocrx_word' style='position:absolute; top:540px; left:899px; height:29px; width:20px;'>1.</span><span class='ocrx_word' style='position:absolute; top:539px; left:940px; height:26px; width:38px;'>12.</span><span class='ocrx_word' style='position:absolute; top:539px; left:1000px; height:25px; width:37px;'>13.</span><span class='ocr_line' style='position:absolute; top:576px; left:68px; height:38px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:578px; left:68px; height:36px; width:308px;'>Atroth-Sophan,</span><span class='ocrx_word' style='position:absolute; top:580px; left:396px; height:26px; width:37px;'>die</span><span class='ocrx_word' style='position:absolute; top:580px; left:454px; height:27px; width:101px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:580px; left:580px; height:26px; width:53px;'>oder</span><span class='ocrx_word' style='position:absolute; top:579px; left:658px; height:30px; width:102px;'>Decke,</span><span class='ocrx_word' style='position:absolute; top:580px; left:785px; height:26px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:580px; left:860px; height:34px; width:177px;'>Bedeckung</span><span class='ocrx_word' style='position:absolute; top:576px; left:1057px; height:32px; width:62px;'>des'</span><span class='ocr_par' style='position:absolute; top:621px; left:100px; height:36px; width:1011px;' ></span><span class='ocr_line' style='position:absolute; top:621px; left:100px; height:36px; width:1011px;' ></span><span class='ocrx_word' style='position:absolute; top:624px; left:100px; height:33px; width:135px;'>Hügels.</span><span class='ocrx_word' style='position:absolute; top:623px; left:273px; height:27px; width:62px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:623px; left:355px; height:26px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:623px; left:456px; height:26px; width:40px;'>der</span><span class='ocrx_word' style='position:absolute; top:621px; left:515px; height:28px; width:141px;'>Rubeniten</span><span class='ocrx_word' style='position:absolute; top:621px; left:680px; height:27px; width:35px;'>im</span><span class='ocrx_word' style='position:absolute; top:622px; left:734px; height:34px; width:141px;'>Königreich</span><span class='ocrx_word' style='position:absolute; top:622px; left:895px; height:32px; width:97px;'>Sthon.</span><span class='ocrx_word' style='position:absolute; top:624px; left:1008px; height:26px; width:16px;'>4</span><span class='ocrx_word' style='position:absolute; top:623px; left:1043px; height:34px; width:68px;'>Mos.</span><span class='ocr_par' style='position:absolute; top:668px; left:67px; height:74px; width:1045px;' ></span><span class='ocr_line' style='position:absolute; top:668px; left:98px; height:30px; width:102px;' ></span><span class='ocrx_word' style='position:absolute; top:669px; left:98px; height:29px; width:41px;'>32,</span><span class='ocrx_word' style='position:absolute; top:668px; left:158px; height:25px; width:42px;'>35.</span><span class='ocr_line' style='position:absolute; top:706px; left:67px; height:36px; width:1045px;' ></span><span class='ocrx_word' style='position:absolute; top:707px; left:67px; height:35px; width:274px;'>AtrothAddar:</span><span class='ocrx_word' style='position:absolute; top:706px; left:356px; height:29px; width:62px;'>Die</span><span class='ocrx_word' style='position:absolute; top:707px; left:432px; height:27px; width:105px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:706px; left:551px; height:27px; width:110px;'>Addar</span><span class='ocrx_word' style='position:absolute; top:706px; left:675px; height:31px; width:54px;'>(des</span><span class='ocrx_word' style='position:absolute; top:706px; left:744px; height:33px; width:105px;'>Sohnes</span><span class='ocrx_word' style='position:absolute; top:706px; left:861px; height:34px; width:155px;'>Benjamin).</span><span class='ocrx_word' style='position:absolute; top:708px; left:1037px; height:33px; width:75px;'>Diese</span><span class='ocr_par' style='position:absolute; top:748px; left:98px; height:37px; width:1013px;' ></span><span class='ocr_line' style='position:absolute; top:748px; left:98px; height:37px; width:1013px;' ></span><span class='ocrx_word' style='position:absolute; top:752px; left:98px; height:28px; width:86px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:751px; left:202px; height:34px; width:98px;'>gehörte</span><span class='ocrx_word' style='position:absolute; top:750px; left:322px; height:27px; width:47px;'>den</span><span class='ocrx_word' style='position:absolute; top:748px; left:395px; height:33px; width:216px;'>Benjaminitern,</span><span class='ocrx_word' style='position:absolute; top:749px; left:635px; height:33px; width:43px;'>lag</span><span class='ocrx_word' style='position:absolute; top:748px; left:702px; height:27px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:749px; left:753px; height:27px; width:45px;'>den</span><span class='ocrx_word' style='position:absolute; top:749px; left:826px; height:35px; width:112px;'>Grenzen</span><span class='ocrx_word' style='position:absolute; top:750px; left:962px; height:33px; width:71px;'>Iuda</span><span class='ocrx_word' style='position:absolute; top:750px; left:1057px; height:28px; width:54px;'>tmd</span><span class='ocr_par' style='position:absolute; top:794px; left:64px; height:76px; width:1048px;' ></span><span class='ocr_line' style='position:absolute; top:794px; left:98px; height:31px; width:134px;' ></span><span class='ocrx_word' style='position:absolute; top:794px; left:98px; height:31px; width:134px;'>Ephraim.</span><span class='ocr_line' style='position:absolute; top:833px; left:64px; height:37px; width:1048px;' ></span><span class='ocrx_word' style='position:absolute; top:834px; left:64px; height:36px; width:355px;'>Atroth.Beth-Ioab,</span><span class='ocrx_word' style='position:absolute; top:836px; left:438px; height:26px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:835px; left:480px; height:27px; width:17px;'>i.</span><span class='ocrx_word' style='position:absolute; top:834px; left:517px; height:27px; width:48px;'>die</span><span class='ocrx_word' style='position:absolute; top:834px; left:584px; height:27px; width:104px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:833px; left:712px; height:28px; width:52px;'>des</span><span class='ocrx_word' style='position:absolute; top:833px; left:784px; height:33px; width:125px;'>Hauses</span><span class='ocrx_word' style='position:absolute; top:834px; left:926px; height:32px; width:94px;'>Ioab.</span><span class='ocrx_word' style='position:absolute; top:835px; left:1050px; height:28px; width:62px;'>Eine</span><span class='ocr_par' style='position:absolute; top:876px; left:101px; height:35px; width:1012px;' ></span><span class='ocr_line' style='position:absolute; top:876px; left:101px; height:35px; width:1012px;' ></span><span class='ocrx_word' style='position:absolute; top:879px; left:101px; height:28px; width:86px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:879px; left:201px; height:27px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:879px; left:249px; height:32px; width:80px;'>Iuda,</span><span class='ocrx_word' style='position:absolute; top:883px; left:350px; height:22px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:878px; left:408px; height:27px; width:37px;'>die</span><span class='ocrx_word' style='position:absolute; top:877px; left:456px; height:32px; width:178px;'>Nachlommen</span><span class='ocrx_word' style='position:absolute; top:876px; left:645px; height:28px; width:97px;'>Salma</span><span class='ocrx_word' style='position:absolute; top:876px; left:762px; height:34px; width:114px;'>gewohnt</span><span class='ocrx_word' style='position:absolute; top:877px; left:887px; height:33px; width:85px;'>haben.</span><span class='ocrx_word' style='position:absolute; top:880px; left:992px; height:24px; width:10px;'>1</span><span class='ocrx_word' style='position:absolute; top:877px; left:1021px; height:34px; width:92px;'>Chron.</span><span class='ocr_par' style='position:absolute; top:923px; left:64px; height:73px; width:1048px;' ></span><span class='ocr_line' style='position:absolute; top:923px; left:96px; height:30px; width:89px;' ></span><span class='ocrx_word' style='position:absolute; top:923px; left:96px; height:30px; width:24px;'>2,</span><span class='ocrx_word' style='position:absolute; top:924px; left:141px; height:25px; width:44px;'>54.</span><span class='ocr_line' style='position:absolute; top:961px; left:64px; height:35px; width:1048px;' ></span><span class='ocrx_word' style='position:absolute; top:962px; left:64px; height:31px; width:148px;'>Attalia.</span><span class='ocrx_word' style='position:absolute; top:963px; left:249px; height:27px; width:63px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:963px; left:330px; height:27px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:962px; left:428px; height:26px; width:27px;'>in</span><span class='ocrx_word' style='position:absolute; top:961px; left:474px; height:33px; width:163px;'>Pamphilien</span><span class='ocrx_word' style='position:absolute; top:962px; left:665px; height:28px; width:36px;'>od.</span><span class='ocrx_word' style='position:absolute; top:961px; left:720px; height:33px; width:104px;'>Libyen,</span><span class='ocrx_word' style='position:absolute; top:967px; left:848px; height:22px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:962px; left:916px; height:27px; width:88px;'>Attala</span><span class='ocrx_word' style='position:absolute; top:962px; left:1023px; height:34px; width:89px;'>Phila.</span><span class='ocr_par' style='position:absolute; top:1005px; left:62px; height:77px; width:1073px;' ></span><span class='ocr_line' style='position:absolute; top:1005px; left:95px; height:34px; width:499px;' ></span><span class='ocrx_word' style='position:absolute; top:1006px; left:95px; height:33px; width:90px;'>delpho</span><span class='ocrx_word' style='position:absolute; top:1006px; left:206px; height:27px; width:96px;'>erbaut.</span><span class='ocrx_word' style='position:absolute; top:1006px; left:321px; height:31px; width:47px;'>Ap.</span><span class='ocrx_word' style='position:absolute; top:1005px; left:388px; height:33px; width:83px;'>Gesch.</span><span class='ocrx_word' style='position:absolute; top:1006px; left:494px; height:32px; width:39px;'>14,</span><span class='ocrx_word' style='position:absolute; top:1006px; left:553px; height:25px; width:41px;'>25.</span><span class='ocr_line' style='position:absolute; top:1046px; left:62px; height:36px; width:1073px;' ></span><span class='ocrx_word' style='position:absolute; top:1048px; left:62px; height:29px; width:146px;'>Attalus</span><span class='ocrx_word' style='position:absolute; top:1048px; left:255px; height:27px; width:51px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:1046px; left:330px; height:34px; width:81px;'>König</span><span class='ocrx_word' style='position:absolute; top:1047px; left:436px; height:26px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:1046px; left:482px; height:32px; width:112px;'>Mysien,</span><span class='ocrx_word' style='position:absolute; top:1046px; left:623px; height:32px; width:99px;'>welches</span><span class='ocrx_word' style='position:absolute; top:1047px; left:747px; height:26px; width:72px;'>unter</span><span class='ocrx_word' style='position:absolute; top:1046px; left:843px; height:35px; width:129px;'>Phrygien</span><span class='ocrx_word' style='position:absolute; top:1047px; left:997px; height:35px; width:115px;'>gehörte;</span><span class='ocrx_word' style='position:absolute; top:1058px; left:1128px; height:9px; width:7px;'>,</span><span class='ocr_par' style='position:absolute; top:1089px; left:95px; height:36px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1089px; left:95px; height:36px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1093px; left:95px; height:32px; width:112px;'>genannt</span><span class='ocrx_word' style='position:absolute; top:1095px; left:227px; height:22px; width:47px;'>von</span><span class='ocrx_word' style='position:absolute; top:1090px; left:294px; height:29px; width:122px;'>Attale,</span><span class='ocrx_word' style='position:absolute; top:1090px; left:435px; height:30px; width:99px;'>welches</span><span class='ocrx_word' style='position:absolute; top:1089px; left:553px; height:27px; width:38px;'>bei</span><span class='ocrx_word' style='position:absolute; top:1089px; left:610px; height:26px; width:47px;'>den</span><span class='ocrx_word' style='position:absolute; top:1089px; left:676px; height:33px; width:143px;'>Phrygiern</span><span class='ocrx_word' style='position:absolute; top:1089px; left:838px; height:32px; width:79px;'>Kropf</span><span class='ocrx_word' style='position:absolute; top:1090px; left:935px; height:26px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:1090px; left:1012px; height:34px; width:99px;'>Gurgel</span><span class='ocr_par' style='position:absolute; top:1131px; left:94px; height:37px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1131px; left:94px; height:37px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1133px; left:94px; height:35px; width:119px;'>geheißen</span><span class='ocrx_word' style='position:absolute; top:1133px; left:233px; height:32px; width:77px;'>haben</span><span class='ocrx_word' style='position:absolute; top:1131px; left:329px; height:30px; width:51px;'>soll.</span><span class='ocrx_word' style='position:absolute; top:1157px; left:393px; height:4px; width:4px;'>,</span><span class='ocrx_word' style='position:absolute; top:1131px; left:417px; height:28px; width:62px;'>War</span><span class='ocrx_word' style='position:absolute; top:1132px; left:497px; height:26px; width:39px;'>ein</span><span class='ocrx_word' style='position:absolute; top:1132px; left:555px; height:33px; width:82px;'>König</span><span class='ocrx_word' style='position:absolute; top:1132px; left:660px; height:26px; width:40px;'>der</span><span class='ocrx_word' style='position:absolute; top:1132px; left:719px; height:33px; width:170px;'>Pergamener</span><span class='ocrx_word' style='position:absolute; top:1133px; left:907px; height:25px; width:49px;'>und</span><span class='ocrx_word' style='position:absolute; top:1131px; left:976px; height:34px; width:134px;'>Phrvgier.</span><span class='ocr_par' style='position:absolute; top:1175px; left:59px; height:75px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:1175px; left:95px; height:32px; width:237px;' ></span><span class='ocrx_word' style='position:absolute; top:1177px; left:95px; height:24px; width:11px;'>l</span><span class='ocrx_word' style='position:absolute; top:1175px; left:130px; height:27px; width:81px;'>Mack.</span><span class='ocrx_word' style='position:absolute; top:1176px; left:233px; height:31px; width:39px;'>15,</span><span class='ocrx_word' style='position:absolute; top:1176px; left:292px; height:25px; width:40px;'>22.</span><span class='ocr_line' style='position:absolute; top:1216px; left:59px; height:34px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:1217px; left:59px; height:29px; width:87px;'>Ava.</span><span class='ocrx_word' style='position:absolute; top:1217px; left:184px; height:33px; width:40px;'>Ist</span><span class='ocrx_word' style='position:absolute; top:1217px; left:242px; height:26px; width:38px;'>bei</span><span class='ocrx_word' style='position:absolute; top:1218px; left:299px; height:25px; width:45px;'>den</span><span class='ocrx_word' style='position:absolute; top:1217px; left:364px; height:26px; width:68px;'>alten</span><span class='ocrx_word' style='position:absolute; top:1216px; left:453px; height:32px; width:115px;'>Griechen</span><span class='ocrx_word' style='position:absolute; top:1216px; left:587px; height:26px; width:49px;'>Aia</span><span class='ocrx_word' style='position:absolute; top:1216px; left:655px; height:26px; width:36px;'>od.</span><span class='ocrx_word' style='position:absolute; top:1216px; left:711px; height:31px; width:60px;'>Aea,</span><span class='ocrx_word' style='position:absolute; top:1216px; left:790px; height:26px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1216px; left:842px; height:33px; width:151px;'>Hauptstadt</span><span class='ocrx_word' style='position:absolute; top:1217px; left:1010px; height:26px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:1216px; left:1051px; height:29px; width:59px;'>Col»</span><span class='ocr_par' style='position:absolute; top:1258px; left:92px; height:35px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1258px; left:92px; height:35px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1261px; left:92px; height:32px; width:73px;'>chide,</span><span class='ocrx_word' style='position:absolute; top:1265px; left:186px; height:21px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:1260px; left:244px; height:25px; width:79px;'>Aetas</span><span class='ocrx_word' style='position:absolute; top:1258px; left:341px; height:34px; width:110px;'>regierte.</span><span class='ocrx_word' style='position:absolute; top:1258px; left:494px; height:33px; width:99px;'>Colchis</span><span class='ocrx_word' style='position:absolute; top:1258px; left:612px; height:33px; width:66px;'>heißt</span><span class='ocrx_word' style='position:absolute; top:1258px; left:697px; height:34px; width:115px;'>heutiges</span><span class='ocrx_word' style='position:absolute; top:1258px; left:833px; height:34px; width:83px;'>Tages</span><span class='ocrx_word' style='position:absolute; top:1258px; left:938px; height:35px; width:170px;'>Mengrelicn,</span><span class='ocr_par' style='position:absolute; top:1300px; left:92px; height:35px; width:1017px;' ></span><span class='ocr_line' style='position:absolute; top:1300px; left:92px; height:35px; width:1017px;' ></span><span class='ocrx_word' style='position:absolute; top:1303px; left:92px; height:27px; width:39px;'>die</span><span class='ocrx_word' style='position:absolute; top:1303px; left:160px; height:32px; width:98px;'>meisten</span><span class='ocrx_word' style='position:absolute; top:1302px; left:277px; height:30px; width:153px;'>Einwohner</span><span class='ocrx_word' style='position:absolute; top:1300px; left:455px; height:33px; width:50px;'>sind</span><span class='ocrx_word' style='position:absolute; top:1300px; left:531px; height:34px; width:122px;'>Christen.</span><span class='ocrx_word' style='position:absolute; top:1300px; left:698px; height:28px; width:57px;'>Von</span><span class='ocrx_word' style='position:absolute; top:1300px; left:780px; height:32px; width:51px;'>hier</span><span class='ocrx_word' style='position:absolute; top:1302px; left:855px; height:26px; width:101px;'>wurden</span><span class='ocrx_word' style='position:absolute; top:1302px; left:980px; height:26px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1301px; left:1037px; height:28px; width:72px;'>Leute</span><span class='ocr_par' style='position:absolute; top:1342px; left:92px; height:36px; width:1018px;' ></span><span class='ocr_line' style='position:absolute; top:1342px; left:92px; height:36px; width:1018px;' ></span><span class='ocrx_word' style='position:absolute; top:1349px; left:92px; height:22px; width:52px;'>von</span><span class='ocrx_word' style='position:absolute; top:1344px; left:165px; height:32px; width:182px;'>Salmanasscr</span><span class='ocrx_word' style='position:absolute; top:1344px; left:371px; height:31px; width:57px;'>nach</span><span class='ocrx_word' style='position:absolute; top:1343px; left:454px; height:27px; width:128px;'>Samaria</span><span class='ocrx_word' style='position:absolute; top:1343px; left:606px; height:35px; width:110px;'>gesührt,</span><span class='ocrx_word' style='position:absolute; top:1347px; left:741px; height:22px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:1342px; left:804px; height:33px; width:31px;'>sie</span><span class='ocrx_word' style='position:absolute; top:1343px; left:859px; height:32px; width:58px;'>noch</span><span class='ocrx_word' style='position:absolute; top:1343px; left:942px; height:33px; width:51px;'>ihre</span><span class='ocrx_word' style='position:absolute; top:1344px; left:1019px; height:27px; width:91px;'>Götter</span><span class='ocr_par' style='position:absolute; top:1386px; left:58px; height:76px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:1386px; left:93px; height:33px; width:782px;' ></span><span class='ocrx_word' style='position:absolute; top:1387px; left:93px; height:32px; width:118px;'>Nibehas</span><span class='ocrx_word' style='position:absolute; top:1387px; left:231px; height:26px; width:48px;'>und</span><span class='ocrx_word' style='position:absolute; top:1386px; left:298px; height:32px; width:123px;'>Tharthac</span><span class='ocrx_word' style='position:absolute; top:1386px; left:440px; height:27px; width:138px;'>anbeteten.</span><span class='ocrx_word' style='position:absolute; top:1388px; left:597px; height:24px; width:15px;'>2</span><span class='ocrx_word' style='position:absolute; top:1387px; left:630px; height:26px; width:64px;'>Kön.</span><span class='ocrx_word' style='position:absolute; top:1388px; left:716px; height:28px; width:38px;'>l7,</span><span class='ocrx_word' style='position:absolute; top:1386px; left:775px; height:27px; width:41px;'>24.</span><span class='ocrx_word' style='position:absolute; top:1387px; left:835px; height:26px; width:40px;'>31.</span><span class='ocr_line' style='position:absolute; top:1428px; left:58px; height:34px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:1428px; left:58px; height:30px; width:117px;'>Aven.</span><span class='ocrx_word' style='position:absolute; top:1429px; left:213px; height:33px; width:101px;'>Götze,</span><span class='ocrx_word' style='position:absolute; top:1428px; left:339px; height:27px; width:163px;'>Eitelleit.</span><span class='ocrx_word' style='position:absolute; top:1428px; left:538px; height:27px; width:42px;'>So</span><span class='ocrx_word' style='position:absolute; top:1429px; left:605px; height:26px; width:60px;'>wird</span><span class='ocrx_word' style='position:absolute; top:1428px; left:690px; height:33px; width:88px;'>Bethel</span><span class='ocrx_word' style='position:absolute; top:1429px; left:802px; height:33px; width:118px;'>genannt.</span><span class='ocrx_word' style='position:absolute; top:1428px; left:939px; height:34px; width:56px;'>Hos.</span><span class='ocrx_word' style='position:absolute; top:1431px; left:1023px; height:29px; width:38px;'>10,</span><span class='ocrx_word' style='position:absolute; top:1431px; left:1086px; height:25px; width:23px;'>8.</span><span class='ocr_par' style='position:absolute; top:1471px; left:92px; height:34px; width:1018px;' ></span><span class='ocr_line' style='position:absolute; top:1471px; left:92px; height:34px; width:1018px;' ></span><span class='ocrx_word' style='position:absolute; top:1478px; left:92px; height:27px; width:88px;'>wegen</span><span class='ocrx_word' style='position:absolute; top:1472px; left:199px; height:26px; width:42px;'>der</span><span class='ocrx_word' style='position:absolute; top:1471px; left:261px; height:33px; width:104px;'>Götzen,</span><span class='ocrx_word' style='position:absolute; top:1471px; left:390px; height:26px; width:39px;'>die</span><span class='ocrx_word' style='position:absolute; top:1471px; left:456px; height:32px; width:100px;'>daselbst</span><span class='ocrx_word' style='position:absolute; top:1476px; left:579px; height:21px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:1472px; left:651px; height:25px; width:43px;'>den</span><span class='ocrx_word' style='position:absolute; top:1471px; left:715px; height:32px; width:137px;'>Israeliten</span><span class='ocrx_word' style='position:absolute; top:1471px; left:877px; height:32px; width:96px;'>verehrt</span><span class='ocrx_word' style='position:absolute; top:1472px; left:1000px; height:26px; width:110px;'>wurden.</span><span class='ocr_par' style='position:absolute; top:1513px; left:91px; height:35px; width:1019px;' ></span><span class='ocr_line' style='position:absolute; top:1513px; left:91px; height:35px; width:1019px;' ></span><span class='ocrx_word' style='position:absolute; top:1515px; left:91px; height:26px; width:58px;'>Mit</span><span class='ocrx_word' style='position:absolute; top:1515px; left:167px; height:26px; width:53px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1520px; left:240px; height:28px; width:92px;'>ganzen</span><span class='ocrx_word' style='position:absolute; top:1513px; left:352px; height:27px; width:109px;'>Namen:</span><span class='ocrx_word' style='position:absolute; top:1513px; left:482px; height:31px; width:158px;'>Beth»Aven,</span><span class='ocrx_word' style='position:absolute; top:1513px; left:658px; height:27px; width:50px;'>das</span><span class='ocrx_word' style='position:absolute; top:1513px; left:726px; height:35px; width:167px;'>Götzenhaus,</span><span class='ocrx_word' style='position:absolute; top:1513px; left:914px; height:33px; width:65px;'>oder,</span><span class='ocrx_word' style='position:absolute; top:1514px; left:997px; height:26px; width:32px;'>da</span><span class='ocrx_word' style='position:absolute; top:1520px; left:1048px; height:21px; width:62px;'>man</span><span class='ocr_par' style='position:absolute; top:1555px; left:56px; height:78px; width:1054px;' ></span><span class='ocr_line' style='position:absolute; top:1555px; left:91px; height:33px; width:540px;' ></span><span class='ocrx_word' style='position:absolute; top:1558px; left:91px; height:26px; width:58px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1557px; left:169px; height:26px; width:85px;'>Eiteln</span><span class='ocrx_word' style='position:absolute; top:1556px; left:275px; height:31px; width:178px;'>nachwandelt.</span><span class='ocrx_word' style='position:absolute; top:1555px; left:473px; height:33px; width:59px;'>Hos.</span><span class='ocrx_word' style='position:absolute; top:1558px; left:549px; height:26px; width:22px;'>4,</span><span class='ocrx_word' style='position:absolute; top:1558px; left:593px; height:23px; width:38px;'>15.</span><span class='ocr_line' style='position:absolute; top:1597px; left:56px; height:36px; width:1054px;' ></span><span class='ocrx_word' style='position:absolute; top:1597px; left:56px; height:36px; width:186px;'>Augustus.</span><span class='ocrx_word' style='position:absolute; top:1597px; left:287px; height:34px; width:132px;'>Würdig</span><span class='ocrx_word' style='position:absolute; top:1598px; left:448px; height:32px; width:129px;'>verehrt</span><span class='ocrx_word' style='position:absolute; top:1598px; left:608px; height:26px; width:60px;'>und</span><span class='ocrx_word' style='position:absolute; top:1599px; left:704px; height:33px; width:172px;'>angebetet</span><span class='ocrx_word' style='position:absolute; top:1605px; left:908px; height:27px; width:36px;'>zu</span><span class='ocrx_word' style='position:absolute; top:1599px; left:978px; height:28px; width:132px;'>werden.</span><span class='ocr_par' style='position:absolute; top:1640px; left:92px; height:34px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1640px; left:92px; height:34px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1640px; left:92px; height:34px; width:97px;'>Diesen</span><span class='ocrx_word' style='position:absolute; top:1640px; left:211px; height:27px; width:100px;'>Namen</span><span class='ocrx_word' style='position:absolute; top:1641px; left:340px; height:33px; width:46px;'>gab</span><span class='ocrx_word' style='position:absolute; top:1641px; left:413px; height:26px; width:46px;'>das</span><span class='ocrx_word' style='position:absolute; top:1640px; left:487px; height:32px; width:109px;'>romische</span><span class='ocrx_word' style='position:absolute; top:1640px; left:616px; height:27px; width:62px;'>Voll</span><span class='ocrx_word' style='position:absolute; top:1641px; left:706px; height:26px; width:52px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1641px; left:781px; height:31px; width:88px;'>Kaiser</span><span class='ocrx_word' style='position:absolute; top:1641px; left:887px; height:31px; width:143px;'>Octavian,</span><span class='ocrx_word' style='position:absolute; top:1642px; left:1058px; height:26px; width:50px;'>und</span><span class='ocr_par' style='position:absolute; top:1682px; left:93px; height:34px; width:1015px;' ></span><span class='ocr_line' style='position:absolute; top:1682px; left:93px; height:34px; width:1015px;' ></span><span class='ocrx_word' style='position:absolute; top:1683px; left:93px; height:27px; width:49px;'>alle</span><span class='ocrx_word' style='position:absolute; top:1683px; left:161px; height:32px; width:130px;'>romischen</span><span class='ocrx_word' style='position:absolute; top:1683px; left:310px; height:32px; width:86px;'>Kaiser</span><span class='ocrx_word' style='position:absolute; top:1683px; left:416px; height:30px; width:79px;'>haben</span><span class='ocrx_word' style='position:absolute; top:1682px; left:514px; height:32px; width:80px;'>diesen</span><span class='ocrx_word' style='position:absolute; top:1682px; left:614px; height:27px; width:95px;'>Namen</span><span class='ocrx_word' style='position:absolute; top:1683px; left:728px; height:33px; width:170px;'>beibehalten,</span><span class='ocrx_word' style='position:absolute; top:1682px; left:917px; height:33px; width:47px;'>daß</span><span class='ocrx_word' style='position:absolute; top:1682px; left:983px; height:33px; width:31px;'>sie</span><span class='ocrx_word' style='position:absolute; top:1692px; left:1033px; height:18px; width:75px;'>«au,-</span><span class='ocr_par' style='position:absolute; top:1724px; left:55px; height:119px; width:1052px;' ></span><span class='ocr_line' style='position:absolute; top:1724px; left:90px; height:35px; width:907px;' ></span><span class='ocrx_word' style='position:absolute; top:1733px; left:90px; height:25px; width:52px;'>per</span><span class='ocrx_word' style='position:absolute; top:1727px; left:160px; height:31px; width:124px;'>2ußr>«ti,</span><span class='ocrx_word' style='position:absolute; top:1726px; left:304px; height:25px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:1724px; left:345px; height:26px; width:15px;'>i,</span><span class='ocrx_word' style='position:absolute; top:1725px; left:382px; height:32px; width:80px;'>allzeit</span><span class='ocrx_word' style='position:absolute; top:1725px; left:482px; height:31px; width:99px;'>Mehrer</span><span class='ocrx_word' style='position:absolute; top:1725px; left:600px; height:26px; width:43px;'>des</span><span class='ocrx_word' style='position:absolute; top:1724px; left:664px; height:32px; width:86px;'>Reichs</span><span class='ocrx_word' style='position:absolute; top:1725px; left:770px; height:34px; width:115px;'>geheißen</span><span class='ocrx_word' style='position:absolute; top:1725px; left:904px; height:33px; width:93px;'>haben.</span><span class='ocr_line' style='position:absolute; top:1766px; left:55px; height:34px; width:897px;' ></span><span class='ocrx_word' style='position:absolute; top:1766px; left:55px; height:34px; width:121px;'>Avith.</span><span class='ocrx_word' style='position:absolute; top:1767px; left:212px; height:32px; width:112px;'>Haufe.</span><span class='ocrx_word' style='position:absolute; top:1766px; left:361px; height:27px; width:63px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:1766px; left:443px; height:28px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:1768px; left:542px; height:25px; width:27px;'>in</span><span class='ocrx_word' style='position:absolute; top:1767px; left:587px; height:32px; width:122px;'>Idumäa.</span><span class='ocrx_word' style='position:absolute; top:1769px; left:732px; height:24px; width:10px;'>1</span><span class='ocrx_word' style='position:absolute; top:1767px; left:763px; height:32px; width:68px;'>Mos.</span><span class='ocrx_word' style='position:absolute; top:1769px; left:849px; height:29px; width:43px;'>36,</span><span class='ocrx_word' style='position:absolute; top:1769px; left:910px; height:26px; width:42px;'>35.</span><span class='ocr_line' style='position:absolute; top:1809px; left:57px; height:34px; width:1050px;' ></span><span class='ocrx_word' style='position:absolute; top:1809px; left:57px; height:30px; width:125px;'>Aulon.</span><span class='ocrx_word' style='position:absolute; top:1809px; left:236px; height:34px; width:209px;'>Ausgehöhlt.</span><span class='ocrx_word' style='position:absolute; top:1809px; left:491px; height:27px; width:62px;'>Das</span><span class='ocrx_word' style='position:absolute; top:1809px; left:581px; height:34px; width:72px;'>große</span><span class='ocrx_word' style='position:absolute; top:1809px; left:681px; height:32px; width:76px;'>Thal,</span><span class='ocrx_word' style='position:absolute; top:1810px; left:791px; height:27px; width:80px;'>worin</span><span class='ocrx_word' style='position:absolute; top:1810px; left:897px; height:27px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1809px; left:962px; height:34px; width:145px;'>berühmten</span><span class='ocr_par' style='position:absolute; top:1851px; left:89px; height:36px; width:1017px;' ></span><span class='ocr_line' style='position:absolute; top:1851px; left:89px; height:36px; width:1017px;' ></span><span class='ocrx_word' style='position:absolute; top:1853px; left:89px; height:29px; width:97px;'>Städte</span><span class='ocrx_word' style='position:absolute; top:1852px; left:204px; height:34px; width:111px;'>Vethsan</span><span class='ocrx_word' style='position:absolute; top:1852px; left:334px; height:27px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:1852px; left:409px; height:34px; width:179px;'>Scythopolis,</span><span class='ocrx_word' style='position:absolute; top:1851px; left:605px; height:34px; width:127px;'>Tlberias,</span><span class='ocrx_word' style='position:absolute; top:1852px; left:751px; height:35px; width:111px;'>Iericho,</span><span class='ocrx_word' style='position:absolute; top:1851px; left:881px; height:29px; width:48px;'>das</span><span class='ocrx_word' style='position:absolute; top:1853px; left:949px; height:27px; width:64px;'>todte</span><span class='ocrx_word' style='position:absolute; top:1852px; left:1033px; height:28px; width:73px;'>Meer</span></div>
|
metadata
CHANGED
@@ -1,82 +1,95 @@
|
|
1
|
-
--- !ruby/object:Gem::Specification
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
2
|
name: rhocr
|
3
|
-
version: !ruby/object:Gem::Version
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: '0.1'
|
4
5
|
prerelease:
|
5
|
-
version: 0.0.3
|
6
6
|
platform: ruby
|
7
|
-
authors:
|
7
|
+
authors:
|
8
8
|
- Andreas Neumann
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
|
13
|
-
|
14
|
-
|
15
|
-
|
16
|
-
|
12
|
+
date: 2011-09-08 00:00:00.000000000Z
|
13
|
+
dependencies:
|
14
|
+
- !ruby/object:Gem::Dependency
|
15
|
+
name: nokogiri
|
16
|
+
requirement: &70276550001820 !ruby/object:Gem::Requirement
|
17
|
+
none: false
|
18
|
+
requirements:
|
19
|
+
- - ! '>='
|
20
|
+
- !ruby/object:Gem::Version
|
21
|
+
version: '0'
|
22
|
+
type: :runtime
|
23
|
+
prerelease: false
|
24
|
+
version_requirements: *70276550001820
|
17
25
|
description: Manipulate and use OCR data encode in HOCR
|
18
|
-
email:
|
26
|
+
email: andreas@neumann.biz
|
19
27
|
executables: []
|
20
|
-
|
21
28
|
extensions: []
|
22
|
-
|
23
|
-
extra_rdoc_files:
|
29
|
+
extra_rdoc_files:
|
24
30
|
- README
|
25
|
-
-
|
31
|
+
- TODO.txt
|
32
|
+
- lib/hocr_box.rb
|
33
|
+
- lib/ocr_document.rb
|
34
|
+
- lib/ocr_element.rb
|
26
35
|
- lib/ocr_page.rb
|
27
|
-
- lib/ocrx_word.rb
|
28
36
|
- lib/rhocr.rb
|
29
|
-
files:
|
37
|
+
files:
|
30
38
|
- Manifest
|
31
39
|
- README
|
32
40
|
- Rakefile
|
41
|
+
- TODO.txt
|
42
|
+
- data/Seite_Die_Gartenlaube_242.html
|
33
43
|
- data/Seite_Tagebuch_H_C_Lang_08.html
|
44
|
+
- data/Seite_Tagebuch_H_C_Lang_08.jpg
|
45
|
+
- data/test.html
|
46
|
+
- data/test.png
|
34
47
|
- example/example_server.rb
|
35
48
|
- example/public/OCRTest.css
|
36
49
|
- example/public/OCRTest.html
|
37
50
|
- example/public/OCRTest_marker.js
|
38
|
-
- example/public/
|
51
|
+
- example/public/Seite_Tagebuch_H_C_Lang_08.jpg
|
39
52
|
- example/public/img/Seite_Tagebuch_H_C_Lang_08.jpg
|
40
|
-
- lib/
|
53
|
+
- lib/hocr_box.rb
|
54
|
+
- lib/ocr_document.rb
|
55
|
+
- lib/ocr_element.rb
|
41
56
|
- lib/ocr_page.rb
|
42
|
-
- lib/ocrx_word.rb
|
43
57
|
- lib/rhocr.rb
|
44
58
|
- rhocr.gemspec
|
45
|
-
-
|
46
|
-
-
|
47
|
-
-
|
48
|
-
|
59
|
+
- spec/hocr_box_spec.rb
|
60
|
+
- spec/ocr_document_spec.rb
|
61
|
+
- spec/ocr_element_spec.rb
|
62
|
+
- spec/ocr_page_spec.rb
|
63
|
+
- spec/rhocr_spec.rb
|
64
|
+
- test.html
|
49
65
|
homepage: http://github.com/daandi/rhocr
|
50
66
|
licenses: []
|
51
|
-
|
52
67
|
post_install_message:
|
53
|
-
rdoc_options:
|
68
|
+
rdoc_options:
|
54
69
|
- --line-numbers
|
55
70
|
- --inline-source
|
56
71
|
- --title
|
57
72
|
- Rhocr
|
58
73
|
- --main
|
59
74
|
- README
|
60
|
-
require_paths:
|
75
|
+
require_paths:
|
61
76
|
- lib
|
62
|
-
required_ruby_version: !ruby/object:Gem::Requirement
|
77
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
63
78
|
none: false
|
64
|
-
requirements:
|
65
|
-
- -
|
66
|
-
- !ruby/object:Gem::Version
|
67
|
-
version:
|
68
|
-
required_rubygems_version: !ruby/object:Gem::Requirement
|
79
|
+
requirements:
|
80
|
+
- - ! '>='
|
81
|
+
- !ruby/object:Gem::Version
|
82
|
+
version: '0'
|
83
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
69
84
|
none: false
|
70
|
-
requirements:
|
71
|
-
- -
|
72
|
-
- !ruby/object:Gem::Version
|
73
|
-
version:
|
85
|
+
requirements:
|
86
|
+
- - ! '>='
|
87
|
+
- !ruby/object:Gem::Version
|
88
|
+
version: '1.2'
|
74
89
|
requirements: []
|
75
|
-
|
76
90
|
rubyforge_project: rhocr
|
77
|
-
rubygems_version: 1.6
|
91
|
+
rubygems_version: 1.8.6
|
78
92
|
signing_key:
|
79
93
|
specification_version: 3
|
80
94
|
summary: Manipulate and use OCR data encode in HOCR
|
81
95
|
test_files: []
|
82
|
-
|
Binary file
|
data/lib/ocr_box.rb
DELETED
@@ -1,43 +0,0 @@
|
|
1
|
-
#coding: utf-8
|
2
|
-
|
3
|
-
class OCRBox
|
4
|
-
|
5
|
-
attr_reader :x1, :y1, :x2, :y2
|
6
|
-
|
7
|
-
def initialize(x1, y1 , x2, y2)
|
8
|
-
@x1 = x1
|
9
|
-
@y1 = y1
|
10
|
-
@x2 = x2
|
11
|
-
@y2 = y2
|
12
|
-
end
|
13
|
-
|
14
|
-
def encloses?(element)
|
15
|
-
@x1 <= element.x1 and
|
16
|
-
@x2 >= element.x2 and
|
17
|
-
@y1 <= element.y1 and
|
18
|
-
@y2 >= element.y2
|
19
|
-
end
|
20
|
-
|
21
|
-
def enclosed_by?(element)
|
22
|
-
return element.encloses? self
|
23
|
-
end
|
24
|
-
|
25
|
-
def to_s
|
26
|
-
"tl->(x:#{@x1} y:#{@y1})/br->:(x:#{@x2} y:#{@y2})"
|
27
|
-
end
|
28
|
-
|
29
|
-
def to_css_style
|
30
|
-
top = @y1
|
31
|
-
left = @x1
|
32
|
-
height = @y2 - @y1
|
33
|
-
width = @x2 - @x1
|
34
|
-
|
35
|
-
"position:absolute; top:#{top}px; left:#{left}px; height:#{height}px; width:#{width}px;"
|
36
|
-
end
|
37
|
-
|
38
|
-
def to_json
|
39
|
-
|
40
|
-
end
|
41
|
-
|
42
|
-
end
|
43
|
-
|
data/lib/ocrx_word.rb
DELETED
@@ -1,23 +0,0 @@
|
|
1
|
-
#coding: utf-8
|
2
|
-
|
3
|
-
require 'cgi'
|
4
|
-
require_relative 'ocr_box'
|
5
|
-
|
6
|
-
class OCRXWord < OCRBox
|
7
|
-
|
8
|
-
attr_reader :text
|
9
|
-
|
10
|
-
def initialize(x1,y1,x2,y2,word)
|
11
|
-
super(x1.to_i, y1.to_i, x2.to_i, y2.to_i)
|
12
|
-
@text = word
|
13
|
-
end
|
14
|
-
|
15
|
-
def to_html(css_class = 'ocrx_word')
|
16
|
-
"<span style='#{ to_css_style }' class='#{css_class}'><span class='word'>" + CGI::escapeHTML(@text) +"</span></span>"
|
17
|
-
end
|
18
|
-
|
19
|
-
def to_s
|
20
|
-
"#{@text}\t#{super}"
|
21
|
-
end
|
22
|
-
|
23
|
-
end
|
data/rspec/ocr_box_spec.rb
DELETED
@@ -1,48 +0,0 @@
|
|
1
|
-
#coding: utf-8
|
2
|
-
|
3
|
-
require_relative '../lib/ocr_box'
|
4
|
-
|
5
|
-
describe OCRBox do
|
6
|
-
|
7
|
-
before(:each) do
|
8
|
-
@box ||= OCRBox.new(1,2,20,8)
|
9
|
-
end
|
10
|
-
|
11
|
-
describe "#to_s" do
|
12
|
-
it "prints a human readable Box-Version with coordinates upper_left(x,y) bottom_right(x,y)" do
|
13
|
-
@box.to_s.should == "tl->(x:1 y:2)/br->:(x:20 y:8)"
|
14
|
-
end
|
15
|
-
end
|
16
|
-
|
17
|
-
describe '#encloses?(element)' do
|
18
|
-
it "tests wather given OCRBox is enclosed by the current OCRBox" do
|
19
|
-
@box.encloses?( OCRBox.new(0,3,19,7) ).should be_false
|
20
|
-
@box.encloses?( OCRBox.new(2,3,19,7) ).should be_true
|
21
|
-
end
|
22
|
-
it "encloses also itself" do
|
23
|
-
@box.encloses?( @box ).should be_true
|
24
|
-
end
|
25
|
-
end
|
26
|
-
|
27
|
-
describe '#to_css_style' do
|
28
|
-
it 'should create css-style attributes' do
|
29
|
-
@box.to_css_style.should == 'position:absolute; top:2px; left:1px; height:6px; width:19px;'
|
30
|
-
end
|
31
|
-
end
|
32
|
-
|
33
|
-
describe '#enclosed_by?(element)' do
|
34
|
-
it 'should be enclosed by Boxes bigger than itself' do
|
35
|
-
@box.enclosed_by?( OCRBox.new(0,1,21,9) ).should be_true
|
36
|
-
end
|
37
|
-
it 'should not be enclosed by Boxes smaller than itself' do
|
38
|
-
@box.enclosed_by?( OCRBox.new(2,3,19,7) ).should be_false
|
39
|
-
end
|
40
|
-
it 'should be enclosed by Boxes of the same size' do
|
41
|
-
@box.enclosed_by?( @box ).should be_true
|
42
|
-
end
|
43
|
-
end
|
44
|
-
|
45
|
-
|
46
|
-
|
47
|
-
|
48
|
-
end
|
data/rspec/ocr_page_spec.rb
DELETED
@@ -1,17 +0,0 @@
|
|
1
|
-
#coding: utf-8
|
2
|
-
|
3
|
-
require_relative '../lib/ocr_page'
|
4
|
-
|
5
|
-
describe OCRPage do
|
6
|
-
|
7
|
-
before(:each) do
|
8
|
-
@ocr_page ||= OCRPage.new('../data/Seite_Tagebuch_H_C_Lang_08.html')
|
9
|
-
end
|
10
|
-
|
11
|
-
describe '' do
|
12
|
-
it '' do
|
13
|
-
p @ocr_page.enclosed_words( OCRBox.new(500,1703,1200,1800) )
|
14
|
-
end
|
15
|
-
end
|
16
|
-
|
17
|
-
end
|
data/rspec/ocrx_word_spec.rb
DELETED
@@ -1,32 +0,0 @@
|
|
1
|
-
#coding: utf-8
|
2
|
-
|
3
|
-
require_relative '../lib/ocrx_word'
|
4
|
-
|
5
|
-
describe OCRXWord do
|
6
|
-
|
7
|
-
before(:each) do
|
8
|
-
@ocrx_word = OCRXWord.new(10,15,20,20,'WORT')
|
9
|
-
end
|
10
|
-
|
11
|
-
describe '#to_s' do
|
12
|
-
it 'should print the coordinates of the box and the textual information' do
|
13
|
-
p @ocrx_word
|
14
|
-
@ocrx_word.to_s.should == "WORT\ttl->(x:10 y:15)/br->:(x:20 y:20)"
|
15
|
-
end
|
16
|
-
end
|
17
|
-
|
18
|
-
describe '#to_html(css_class)' do
|
19
|
-
it 'should create an span elment to overlay an image on an html-page' do
|
20
|
-
@ocrx_word.to_html.should == "<span style='position:absolute; top:15px; left:10px; height:5px; width:10px;' class='ocrx_word'><span class='word'>WORT</span></span>"
|
21
|
-
end
|
22
|
-
|
23
|
-
it 'no css_class_class given should default to ocrx_word' do
|
24
|
-
@ocrx_word.to_html.should =~ /class='ocrx_word'/
|
25
|
-
end
|
26
|
-
|
27
|
-
it 'css_class given should be part of genearted html' do
|
28
|
-
@ocrx_word.to_html('rosebud').should =~ /class='rosebud'/
|
29
|
-
end
|
30
|
-
end
|
31
|
-
|
32
|
-
end
|