rhocr 0.0.3 → 0.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/Manifest +15 -6
- data/Rakefile +3 -3
- data/TODO.txt +42 -0
- data/data/Seite_Die_Gartenlaube_242.html +42 -0
- data/data/Seite_Tagebuch_H_C_Lang_08.jpg +0 -0
- data/data/test.html +71 -0
- data/data/test.png +0 -0
- data/example/example_server.rb +2 -2
- data/example/public/Seite_Tagebuch_H_C_Lang_08.jpg +0 -0
- data/lib/hocr_box.rb +67 -0
- data/lib/ocr_document.rb +50 -0
- data/lib/ocr_element.rb +149 -0
- data/lib/ocr_page.rb +80 -25
- data/lib/rhocr.rb +30 -1
- data/rhocr.gemspec +12 -9
- data/spec/hocr_box_spec.rb +94 -0
- data/spec/ocr_document_spec.rb +80 -0
- data/spec/ocr_element_spec.rb +86 -0
- data/spec/ocr_page_spec.rb +116 -0
- data/spec/rhocr_spec.rb +34 -0
- data/test.html +1 -0
- metadata +52 -39
- data/example/public/img/Seite_Tagebuch_H_C_Lang_05.jpg +0 -0
- data/lib/ocr_box.rb +0 -43
- data/lib/ocrx_word.rb +0 -23
- data/rspec/ocr_box_spec.rb +0 -48
- data/rspec/ocr_page_spec.rb +0 -17
- data/rspec/ocrx_word_spec.rb +0 -32
data/test.html
ADDED
@@ -0,0 +1 @@
|
|
1
|
+
<div class='ocr_page' style='position:absolute; top:0px; left:0px; height:1326px; width:1326px;;background-image: url(data/test.png); width:1326px; height:1326>px ;'><span class='ocrx_block' style='position:absolute; top:32px; left:55px; height:1855px; width:1080px;' ></span><span class='ocr_par' style='position:absolute; top:32px; left:432px; height:39px; width:685px;' ></span><span class='ocr_line' style='position:absolute; top:32px; left:432px; height:39px; width:685px;' ></span><span class='ocrx_word' style='position:absolute; top:32px; left:432px; height:35px; width:156px;'>Athenobius</span><span class='ocrx_word' style='position:absolute; top:48px; left:606px; height:6px; width:34px;'>—</span><span class='ocrx_word' style='position:absolute; top:34px; left:657px; height:28px; width:92px;'>Aulon.</span><span class='ocrx_word' style='position:absolute; top:37px; left:1074px; height:34px; width:43px;'>29</span><span class='ocr_par' style='position:absolute; top:109px; left:79px; height:80px; width:1040px;' ></span><span class='ocr_line' style='position:absolute; top:109px; left:79px; height:36px; width:1040px;' ></span><span class='ocrx_word' style='position:absolute; top:109px; left:79px; height:35px; width:215px;'>Athenobius,</span><span class='ocrx_word' style='position:absolute; top:112px; left:334px; height:27px; width:64px;'>Der</span><span class='ocrx_word' style='position:absolute; top:115px; left:417px; height:24px; width:59px;'>von</span><span class='ocrx_word' style='position:absolute; top:112px; left:494px; height:27px; width:51px;'>der</span><span class='ocrx_word' style='position:absolute; top:112px; left:565px; height:28px; width:122px;'>Göttin</span><span class='ocrx_word' style='position:absolute; top:112px; left:707px; height:28px; width:150px;'>Minerva</span><span class='ocrx_word' style='position:absolute; top:112px; left:876px; height:33px; width:78px;'>lebt,</span><span class='ocrx_word' style='position:absolute; top:112px; left:974px; height:28px; width:69px;'>oder:</span><span class='ocrx_word' style='position:absolute; top:112px; left:1062px; height:28px; width:57px;'>Mi»</span><span class='ocr_line' style='position:absolute; top:155px; left:108px; height:34px; width:192px;' ></span><span class='ocrx_word' style='position:absolute; top:159px; left:108px; height:23px; width:75px;'>nerva</span><span class='ocrx_word' style='position:absolute; top:155px; left:201px; height:34px; width:99px;'>Bogen.</span><span class='ocr_par' style='position:absolute; top:196px; left:74px; height:120px; width:1043px;' ></span><span class='ocr_line' style='position:absolute; top:196px; left:160px; height:36px; width:957px;' ></span><span class='ocrx_word' style='position:absolute; top:198px; left:160px; height:27px; width:54px;'>Des</span><span class='ocrx_word' style='position:absolute; top:197px; left:242px; height:33px; width:98px;'>Königs</span><span class='ocrx_word' style='position:absolute; top:196px; left:367px; height:34px; width:136px;'>Antiochus</span><span class='ocrx_word' style='position:absolute; top:197px; left:531px; height:33px; width:95px;'>Freund</span><span class='ocrx_word' style='position:absolute; top:197px; left:655px; height:28px; width:58px;'>oder</span><span class='ocrx_word' style='position:absolute; top:196px; left:739px; height:36px; width:119px;'>geheimer</span><span class='ocrx_word' style='position:absolute; top:196px; left:885px; height:34px; width:78px;'>Nath.</span><span class='ocrx_word' style='position:absolute; top:199px; left:994px; height:25px; width:11px;'>l</span><span class='ocrx_word' style='position:absolute; top:197px; left:1033px; height:29px; width:84px;'>Mack.</span><span class='ocr_line' style='position:absolute; top:241px; left:109px; height:33px; width:97px;' ></span><span class='ocrx_word' style='position:absolute; top:241px; left:109px; height:33px; width:38px;'>15,</span><span class='ocrx_word' style='position:absolute; top:242px; left:166px; height:25px; width:40px;'>28.</span><span class='ocr_line' style='position:absolute; top:281px; left:74px; height:35px; width:1042px;' ></span><span class='ocrx_word' style='position:absolute; top:281px; left:74px; height:34px; width:131px;'>Athlai.</span><span class='ocrx_word' style='position:absolute; top:284px; left:242px; height:26px; width:68px;'>Dee</span><span class='ocrx_word' style='position:absolute; top:282px; left:337px; height:33px; width:80px;'>Herr</span><span class='ocrx_word' style='position:absolute; top:281px; left:440px; height:34px; width:158px;'>zerreißet</span><span class='ocrx_word' style='position:absolute; top:282px; left:625px; height:28px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:282px; left:706px; height:34px; width:158px;'>zerbricht.</span><span class='ocrx_word' style='position:absolute; top:282px; left:898px; height:28px; width:77px;'>Einer</span><span class='ocrx_word' style='position:absolute; top:286px; left:999px; height:24px; width:51px;'>von</span><span class='ocrx_word' style='position:absolute; top:282px; left:1069px; height:28px; width:47px;'>den</span><span class='ocr_par' style='position:absolute; top:324px; left:74px; height:77px; width:1040px;' ></span><span class='ocr_line' style='position:absolute; top:324px; left:107px; height:33px; width:487px;' ></span><span class='ocrx_word' style='position:absolute; top:325px; left:107px; height:32px; width:174px;'>Nachlommen</span><span class='ocrx_word' style='position:absolute; top:324px; left:300px; height:28px; width:92px;'>Bebai.</span><span class='ocrx_word' style='position:absolute; top:324px; left:410px; height:32px; width:62px;'>Esra</span><span class='ocrx_word' style='position:absolute; top:327px; left:496px; height:28px; width:37px;'>10,</span><span class='ocrx_word' style='position:absolute; top:326px; left:553px; height:25px; width:41px;'>28.</span><span class='ocr_line' style='position:absolute; top:366px; left:74px; height:35px; width:1040px;' ></span><span class='ocrx_word' style='position:absolute; top:366px; left:74px; height:34px; width:115px;'>Athni.</span><span class='ocrx_word' style='position:absolute; top:368px; left:217px; height:27px; width:79px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:367px; left:315px; height:34px; width:135px;'>Trübsal</span><span class='ocrx_word' style='position:absolute; top:372px; left:469px; height:22px; width:59px;'>von</span><span class='ocrx_word' style='position:absolute; top:366px; left:548px; height:28px; width:90px;'>Gott.</span><span class='ocrx_word' style='position:absolute; top:366px; left:673px; height:28px; width:49px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:366px; left:742px; height:34px; width:77px;'>Sohn</span><span class='ocrx_word' style='position:absolute; top:366px; left:838px; height:34px; width:116px;'>Semaja.</span><span class='ocrx_word' style='position:absolute; top:369px; left:986px; height:25px; width:12px;'>1</span><span class='ocrx_word' style='position:absolute; top:368px; left:1018px; height:32px; width:96px;'>Chron.</span><span class='ocr_par' style='position:absolute; top:412px; left:71px; height:76px; width:1041px;' ></span><span class='ocr_line' style='position:absolute; top:412px; left:104px; height:28px; width:83px;' ></span><span class='ocrx_word' style='position:absolute; top:412px; left:104px; height:28px; width:40px;'>27.</span><span class='ocrx_word' style='position:absolute; top:413px; left:163px; height:25px; width:24px;'>7.</span><span class='ocr_line' style='position:absolute; top:451px; left:71px; height:37px; width:1041px;' ></span><span class='ocrx_word' style='position:absolute; top:451px; left:71px; height:34px; width:146px;'>Athniel.</span><span class='ocrx_word' style='position:absolute; top:452px; left:246px; height:27px; width:118px;'>Gottes</span><span class='ocrx_word' style='position:absolute; top:451px; left:384px; height:33px; width:147px;'>Trübsal,</span><span class='ocrx_word' style='position:absolute; top:451px; left:550px; height:28px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:451px; left:591px; height:28px; width:17px;'>i.</span><span class='ocrx_word' style='position:absolute; top:451px; left:627px; height:28px; width:54px;'>eine</span><span class='ocrx_word' style='position:absolute; top:451px; left:699px; height:33px; width:120px;'>Trübsal,</span><span class='ocrx_word' style='position:absolute; top:459px; left:839px; height:20px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:452px; left:908px; height:28px; width:62px;'>Gott</span><span class='ocrx_word' style='position:absolute; top:452px; left:990px; height:36px; width:122px;'>zugesügt.</span><span class='ocr_par' style='position:absolute; top:494px; left:102px; height:34px; width:1008px;' ></span><span class='ocr_line' style='position:absolute; top:494px; left:102px; height:34px; width:1008px;' ></span><span class='ocrx_word' style='position:absolute; top:496px; left:102px; height:27px; width:50px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:495px; left:172px; height:31px; width:76px;'>Sohn</span><span class='ocrx_word' style='position:absolute; top:495px; left:268px; height:30px; width:94px;'>Kenas,</span><span class='ocrx_word' style='position:absolute; top:495px; left:380px; height:26px; width:44px;'>des</span><span class='ocrx_word' style='position:absolute; top:494px; left:445px; height:27px; width:112px;'>Bruders</span><span class='ocrx_word' style='position:absolute; top:494px; left:576px; height:32px; width:89px;'>Kaleb;</span><span class='ocrx_word' style='position:absolute; top:500px; left:693px; height:28px; width:105px;'>gewann</span><span class='ocrx_word' style='position:absolute; top:495px; left:818px; height:33px; width:98px;'>Kiriath</span><span class='ocrx_word' style='position:absolute; top:495px; left:936px; height:33px; width:106px;'>Sepher,</span><span class='ocrx_word' style='position:absolute; top:495px; left:1061px; height:28px; width:49px;'>und</span><span class='ocr_par' style='position:absolute; top:535px; left:68px; height:79px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:535px; left:100px; height:35px; width:937px;' ></span><span class='ocrx_word' style='position:absolute; top:538px; left:100px; height:27px; width:80px;'>damit</span><span class='ocrx_word' style='position:absolute; top:537px; left:199px; height:33px; width:82px;'>Achsa.</span><span class='ocrx_word' style='position:absolute; top:538px; left:300px; height:26px; width:36px;'>die</span><span class='ocrx_word' style='position:absolute; top:537px; left:356px; height:32px; width:98px;'>Tochter</span><span class='ocrx_word' style='position:absolute; top:535px; left:472px; height:32px; width:81px;'>seines</span><span class='ocrx_word' style='position:absolute; top:537px; left:574px; height:27px; width:100px;'>Betters</span><span class='ocrx_word' style='position:absolute; top:537px; left:694px; height:27px; width:86px;'>Kaleb.</span><span class='ocrx_word' style='position:absolute; top:536px; left:800px; height:34px; width:77px;'>Nicht,</span><span class='ocrx_word' style='position:absolute; top:540px; left:899px; height:29px; width:20px;'>1.</span><span class='ocrx_word' style='position:absolute; top:539px; left:940px; height:26px; width:38px;'>12.</span><span class='ocrx_word' style='position:absolute; top:539px; left:1000px; height:25px; width:37px;'>13.</span><span class='ocr_line' style='position:absolute; top:576px; left:68px; height:38px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:578px; left:68px; height:36px; width:308px;'>Atroth-Sophan,</span><span class='ocrx_word' style='position:absolute; top:580px; left:396px; height:26px; width:37px;'>die</span><span class='ocrx_word' style='position:absolute; top:580px; left:454px; height:27px; width:101px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:580px; left:580px; height:26px; width:53px;'>oder</span><span class='ocrx_word' style='position:absolute; top:579px; left:658px; height:30px; width:102px;'>Decke,</span><span class='ocrx_word' style='position:absolute; top:580px; left:785px; height:26px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:580px; left:860px; height:34px; width:177px;'>Bedeckung</span><span class='ocrx_word' style='position:absolute; top:576px; left:1057px; height:32px; width:62px;'>des'</span><span class='ocr_par' style='position:absolute; top:621px; left:100px; height:36px; width:1011px;' ></span><span class='ocr_line' style='position:absolute; top:621px; left:100px; height:36px; width:1011px;' ></span><span class='ocrx_word' style='position:absolute; top:624px; left:100px; height:33px; width:135px;'>Hügels.</span><span class='ocrx_word' style='position:absolute; top:623px; left:273px; height:27px; width:62px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:623px; left:355px; height:26px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:623px; left:456px; height:26px; width:40px;'>der</span><span class='ocrx_word' style='position:absolute; top:621px; left:515px; height:28px; width:141px;'>Rubeniten</span><span class='ocrx_word' style='position:absolute; top:621px; left:680px; height:27px; width:35px;'>im</span><span class='ocrx_word' style='position:absolute; top:622px; left:734px; height:34px; width:141px;'>Königreich</span><span class='ocrx_word' style='position:absolute; top:622px; left:895px; height:32px; width:97px;'>Sthon.</span><span class='ocrx_word' style='position:absolute; top:624px; left:1008px; height:26px; width:16px;'>4</span><span class='ocrx_word' style='position:absolute; top:623px; left:1043px; height:34px; width:68px;'>Mos.</span><span class='ocr_par' style='position:absolute; top:668px; left:67px; height:74px; width:1045px;' ></span><span class='ocr_line' style='position:absolute; top:668px; left:98px; height:30px; width:102px;' ></span><span class='ocrx_word' style='position:absolute; top:669px; left:98px; height:29px; width:41px;'>32,</span><span class='ocrx_word' style='position:absolute; top:668px; left:158px; height:25px; width:42px;'>35.</span><span class='ocr_line' style='position:absolute; top:706px; left:67px; height:36px; width:1045px;' ></span><span class='ocrx_word' style='position:absolute; top:707px; left:67px; height:35px; width:274px;'>AtrothAddar:</span><span class='ocrx_word' style='position:absolute; top:706px; left:356px; height:29px; width:62px;'>Die</span><span class='ocrx_word' style='position:absolute; top:707px; left:432px; height:27px; width:105px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:706px; left:551px; height:27px; width:110px;'>Addar</span><span class='ocrx_word' style='position:absolute; top:706px; left:675px; height:31px; width:54px;'>(des</span><span class='ocrx_word' style='position:absolute; top:706px; left:744px; height:33px; width:105px;'>Sohnes</span><span class='ocrx_word' style='position:absolute; top:706px; left:861px; height:34px; width:155px;'>Benjamin).</span><span class='ocrx_word' style='position:absolute; top:708px; left:1037px; height:33px; width:75px;'>Diese</span><span class='ocr_par' style='position:absolute; top:748px; left:98px; height:37px; width:1013px;' ></span><span class='ocr_line' style='position:absolute; top:748px; left:98px; height:37px; width:1013px;' ></span><span class='ocrx_word' style='position:absolute; top:752px; left:98px; height:28px; width:86px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:751px; left:202px; height:34px; width:98px;'>gehörte</span><span class='ocrx_word' style='position:absolute; top:750px; left:322px; height:27px; width:47px;'>den</span><span class='ocrx_word' style='position:absolute; top:748px; left:395px; height:33px; width:216px;'>Benjaminitern,</span><span class='ocrx_word' style='position:absolute; top:749px; left:635px; height:33px; width:43px;'>lag</span><span class='ocrx_word' style='position:absolute; top:748px; left:702px; height:27px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:749px; left:753px; height:27px; width:45px;'>den</span><span class='ocrx_word' style='position:absolute; top:749px; left:826px; height:35px; width:112px;'>Grenzen</span><span class='ocrx_word' style='position:absolute; top:750px; left:962px; height:33px; width:71px;'>Iuda</span><span class='ocrx_word' style='position:absolute; top:750px; left:1057px; height:28px; width:54px;'>tmd</span><span class='ocr_par' style='position:absolute; top:794px; left:64px; height:76px; width:1048px;' ></span><span class='ocr_line' style='position:absolute; top:794px; left:98px; height:31px; width:134px;' ></span><span class='ocrx_word' style='position:absolute; top:794px; left:98px; height:31px; width:134px;'>Ephraim.</span><span class='ocr_line' style='position:absolute; top:833px; left:64px; height:37px; width:1048px;' ></span><span class='ocrx_word' style='position:absolute; top:834px; left:64px; height:36px; width:355px;'>Atroth.Beth-Ioab,</span><span class='ocrx_word' style='position:absolute; top:836px; left:438px; height:26px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:835px; left:480px; height:27px; width:17px;'>i.</span><span class='ocrx_word' style='position:absolute; top:834px; left:517px; height:27px; width:48px;'>die</span><span class='ocrx_word' style='position:absolute; top:834px; left:584px; height:27px; width:104px;'>Krone</span><span class='ocrx_word' style='position:absolute; top:833px; left:712px; height:28px; width:52px;'>des</span><span class='ocrx_word' style='position:absolute; top:833px; left:784px; height:33px; width:125px;'>Hauses</span><span class='ocrx_word' style='position:absolute; top:834px; left:926px; height:32px; width:94px;'>Ioab.</span><span class='ocrx_word' style='position:absolute; top:835px; left:1050px; height:28px; width:62px;'>Eine</span><span class='ocr_par' style='position:absolute; top:876px; left:101px; height:35px; width:1012px;' ></span><span class='ocr_line' style='position:absolute; top:876px; left:101px; height:35px; width:1012px;' ></span><span class='ocrx_word' style='position:absolute; top:879px; left:101px; height:28px; width:86px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:879px; left:201px; height:27px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:879px; left:249px; height:32px; width:80px;'>Iuda,</span><span class='ocrx_word' style='position:absolute; top:883px; left:350px; height:22px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:878px; left:408px; height:27px; width:37px;'>die</span><span class='ocrx_word' style='position:absolute; top:877px; left:456px; height:32px; width:178px;'>Nachlommen</span><span class='ocrx_word' style='position:absolute; top:876px; left:645px; height:28px; width:97px;'>Salma</span><span class='ocrx_word' style='position:absolute; top:876px; left:762px; height:34px; width:114px;'>gewohnt</span><span class='ocrx_word' style='position:absolute; top:877px; left:887px; height:33px; width:85px;'>haben.</span><span class='ocrx_word' style='position:absolute; top:880px; left:992px; height:24px; width:10px;'>1</span><span class='ocrx_word' style='position:absolute; top:877px; left:1021px; height:34px; width:92px;'>Chron.</span><span class='ocr_par' style='position:absolute; top:923px; left:64px; height:73px; width:1048px;' ></span><span class='ocr_line' style='position:absolute; top:923px; left:96px; height:30px; width:89px;' ></span><span class='ocrx_word' style='position:absolute; top:923px; left:96px; height:30px; width:24px;'>2,</span><span class='ocrx_word' style='position:absolute; top:924px; left:141px; height:25px; width:44px;'>54.</span><span class='ocr_line' style='position:absolute; top:961px; left:64px; height:35px; width:1048px;' ></span><span class='ocrx_word' style='position:absolute; top:962px; left:64px; height:31px; width:148px;'>Attalia.</span><span class='ocrx_word' style='position:absolute; top:963px; left:249px; height:27px; width:63px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:963px; left:330px; height:27px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:962px; left:428px; height:26px; width:27px;'>in</span><span class='ocrx_word' style='position:absolute; top:961px; left:474px; height:33px; width:163px;'>Pamphilien</span><span class='ocrx_word' style='position:absolute; top:962px; left:665px; height:28px; width:36px;'>od.</span><span class='ocrx_word' style='position:absolute; top:961px; left:720px; height:33px; width:104px;'>Libyen,</span><span class='ocrx_word' style='position:absolute; top:967px; left:848px; height:22px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:962px; left:916px; height:27px; width:88px;'>Attala</span><span class='ocrx_word' style='position:absolute; top:962px; left:1023px; height:34px; width:89px;'>Phila.</span><span class='ocr_par' style='position:absolute; top:1005px; left:62px; height:77px; width:1073px;' ></span><span class='ocr_line' style='position:absolute; top:1005px; left:95px; height:34px; width:499px;' ></span><span class='ocrx_word' style='position:absolute; top:1006px; left:95px; height:33px; width:90px;'>delpho</span><span class='ocrx_word' style='position:absolute; top:1006px; left:206px; height:27px; width:96px;'>erbaut.</span><span class='ocrx_word' style='position:absolute; top:1006px; left:321px; height:31px; width:47px;'>Ap.</span><span class='ocrx_word' style='position:absolute; top:1005px; left:388px; height:33px; width:83px;'>Gesch.</span><span class='ocrx_word' style='position:absolute; top:1006px; left:494px; height:32px; width:39px;'>14,</span><span class='ocrx_word' style='position:absolute; top:1006px; left:553px; height:25px; width:41px;'>25.</span><span class='ocr_line' style='position:absolute; top:1046px; left:62px; height:36px; width:1073px;' ></span><span class='ocrx_word' style='position:absolute; top:1048px; left:62px; height:29px; width:146px;'>Attalus</span><span class='ocrx_word' style='position:absolute; top:1048px; left:255px; height:27px; width:51px;'>Ein</span><span class='ocrx_word' style='position:absolute; top:1046px; left:330px; height:34px; width:81px;'>König</span><span class='ocrx_word' style='position:absolute; top:1047px; left:436px; height:26px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:1046px; left:482px; height:32px; width:112px;'>Mysien,</span><span class='ocrx_word' style='position:absolute; top:1046px; left:623px; height:32px; width:99px;'>welches</span><span class='ocrx_word' style='position:absolute; top:1047px; left:747px; height:26px; width:72px;'>unter</span><span class='ocrx_word' style='position:absolute; top:1046px; left:843px; height:35px; width:129px;'>Phrygien</span><span class='ocrx_word' style='position:absolute; top:1047px; left:997px; height:35px; width:115px;'>gehörte;</span><span class='ocrx_word' style='position:absolute; top:1058px; left:1128px; height:9px; width:7px;'>,</span><span class='ocr_par' style='position:absolute; top:1089px; left:95px; height:36px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1089px; left:95px; height:36px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1093px; left:95px; height:32px; width:112px;'>genannt</span><span class='ocrx_word' style='position:absolute; top:1095px; left:227px; height:22px; width:47px;'>von</span><span class='ocrx_word' style='position:absolute; top:1090px; left:294px; height:29px; width:122px;'>Attale,</span><span class='ocrx_word' style='position:absolute; top:1090px; left:435px; height:30px; width:99px;'>welches</span><span class='ocrx_word' style='position:absolute; top:1089px; left:553px; height:27px; width:38px;'>bei</span><span class='ocrx_word' style='position:absolute; top:1089px; left:610px; height:26px; width:47px;'>den</span><span class='ocrx_word' style='position:absolute; top:1089px; left:676px; height:33px; width:143px;'>Phrygiern</span><span class='ocrx_word' style='position:absolute; top:1089px; left:838px; height:32px; width:79px;'>Kropf</span><span class='ocrx_word' style='position:absolute; top:1090px; left:935px; height:26px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:1090px; left:1012px; height:34px; width:99px;'>Gurgel</span><span class='ocr_par' style='position:absolute; top:1131px; left:94px; height:37px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1131px; left:94px; height:37px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1133px; left:94px; height:35px; width:119px;'>geheißen</span><span class='ocrx_word' style='position:absolute; top:1133px; left:233px; height:32px; width:77px;'>haben</span><span class='ocrx_word' style='position:absolute; top:1131px; left:329px; height:30px; width:51px;'>soll.</span><span class='ocrx_word' style='position:absolute; top:1157px; left:393px; height:4px; width:4px;'>,</span><span class='ocrx_word' style='position:absolute; top:1131px; left:417px; height:28px; width:62px;'>War</span><span class='ocrx_word' style='position:absolute; top:1132px; left:497px; height:26px; width:39px;'>ein</span><span class='ocrx_word' style='position:absolute; top:1132px; left:555px; height:33px; width:82px;'>König</span><span class='ocrx_word' style='position:absolute; top:1132px; left:660px; height:26px; width:40px;'>der</span><span class='ocrx_word' style='position:absolute; top:1132px; left:719px; height:33px; width:170px;'>Pergamener</span><span class='ocrx_word' style='position:absolute; top:1133px; left:907px; height:25px; width:49px;'>und</span><span class='ocrx_word' style='position:absolute; top:1131px; left:976px; height:34px; width:134px;'>Phrvgier.</span><span class='ocr_par' style='position:absolute; top:1175px; left:59px; height:75px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:1175px; left:95px; height:32px; width:237px;' ></span><span class='ocrx_word' style='position:absolute; top:1177px; left:95px; height:24px; width:11px;'>l</span><span class='ocrx_word' style='position:absolute; top:1175px; left:130px; height:27px; width:81px;'>Mack.</span><span class='ocrx_word' style='position:absolute; top:1176px; left:233px; height:31px; width:39px;'>15,</span><span class='ocrx_word' style='position:absolute; top:1176px; left:292px; height:25px; width:40px;'>22.</span><span class='ocr_line' style='position:absolute; top:1216px; left:59px; height:34px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:1217px; left:59px; height:29px; width:87px;'>Ava.</span><span class='ocrx_word' style='position:absolute; top:1217px; left:184px; height:33px; width:40px;'>Ist</span><span class='ocrx_word' style='position:absolute; top:1217px; left:242px; height:26px; width:38px;'>bei</span><span class='ocrx_word' style='position:absolute; top:1218px; left:299px; height:25px; width:45px;'>den</span><span class='ocrx_word' style='position:absolute; top:1217px; left:364px; height:26px; width:68px;'>alten</span><span class='ocrx_word' style='position:absolute; top:1216px; left:453px; height:32px; width:115px;'>Griechen</span><span class='ocrx_word' style='position:absolute; top:1216px; left:587px; height:26px; width:49px;'>Aia</span><span class='ocrx_word' style='position:absolute; top:1216px; left:655px; height:26px; width:36px;'>od.</span><span class='ocrx_word' style='position:absolute; top:1216px; left:711px; height:31px; width:60px;'>Aea,</span><span class='ocrx_word' style='position:absolute; top:1216px; left:790px; height:26px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1216px; left:842px; height:33px; width:151px;'>Hauptstadt</span><span class='ocrx_word' style='position:absolute; top:1217px; left:1010px; height:26px; width:26px;'>in</span><span class='ocrx_word' style='position:absolute; top:1216px; left:1051px; height:29px; width:59px;'>Col»</span><span class='ocr_par' style='position:absolute; top:1258px; left:92px; height:35px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1258px; left:92px; height:35px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1261px; left:92px; height:32px; width:73px;'>chide,</span><span class='ocrx_word' style='position:absolute; top:1265px; left:186px; height:21px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:1260px; left:244px; height:25px; width:79px;'>Aetas</span><span class='ocrx_word' style='position:absolute; top:1258px; left:341px; height:34px; width:110px;'>regierte.</span><span class='ocrx_word' style='position:absolute; top:1258px; left:494px; height:33px; width:99px;'>Colchis</span><span class='ocrx_word' style='position:absolute; top:1258px; left:612px; height:33px; width:66px;'>heißt</span><span class='ocrx_word' style='position:absolute; top:1258px; left:697px; height:34px; width:115px;'>heutiges</span><span class='ocrx_word' style='position:absolute; top:1258px; left:833px; height:34px; width:83px;'>Tages</span><span class='ocrx_word' style='position:absolute; top:1258px; left:938px; height:35px; width:170px;'>Mengrelicn,</span><span class='ocr_par' style='position:absolute; top:1300px; left:92px; height:35px; width:1017px;' ></span><span class='ocr_line' style='position:absolute; top:1300px; left:92px; height:35px; width:1017px;' ></span><span class='ocrx_word' style='position:absolute; top:1303px; left:92px; height:27px; width:39px;'>die</span><span class='ocrx_word' style='position:absolute; top:1303px; left:160px; height:32px; width:98px;'>meisten</span><span class='ocrx_word' style='position:absolute; top:1302px; left:277px; height:30px; width:153px;'>Einwohner</span><span class='ocrx_word' style='position:absolute; top:1300px; left:455px; height:33px; width:50px;'>sind</span><span class='ocrx_word' style='position:absolute; top:1300px; left:531px; height:34px; width:122px;'>Christen.</span><span class='ocrx_word' style='position:absolute; top:1300px; left:698px; height:28px; width:57px;'>Von</span><span class='ocrx_word' style='position:absolute; top:1300px; left:780px; height:32px; width:51px;'>hier</span><span class='ocrx_word' style='position:absolute; top:1302px; left:855px; height:26px; width:101px;'>wurden</span><span class='ocrx_word' style='position:absolute; top:1302px; left:980px; height:26px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1301px; left:1037px; height:28px; width:72px;'>Leute</span><span class='ocr_par' style='position:absolute; top:1342px; left:92px; height:36px; width:1018px;' ></span><span class='ocr_line' style='position:absolute; top:1342px; left:92px; height:36px; width:1018px;' ></span><span class='ocrx_word' style='position:absolute; top:1349px; left:92px; height:22px; width:52px;'>von</span><span class='ocrx_word' style='position:absolute; top:1344px; left:165px; height:32px; width:182px;'>Salmanasscr</span><span class='ocrx_word' style='position:absolute; top:1344px; left:371px; height:31px; width:57px;'>nach</span><span class='ocrx_word' style='position:absolute; top:1343px; left:454px; height:27px; width:128px;'>Samaria</span><span class='ocrx_word' style='position:absolute; top:1343px; left:606px; height:35px; width:110px;'>gesührt,</span><span class='ocrx_word' style='position:absolute; top:1347px; left:741px; height:22px; width:38px;'>wo</span><span class='ocrx_word' style='position:absolute; top:1342px; left:804px; height:33px; width:31px;'>sie</span><span class='ocrx_word' style='position:absolute; top:1343px; left:859px; height:32px; width:58px;'>noch</span><span class='ocrx_word' style='position:absolute; top:1343px; left:942px; height:33px; width:51px;'>ihre</span><span class='ocrx_word' style='position:absolute; top:1344px; left:1019px; height:27px; width:91px;'>Götter</span><span class='ocr_par' style='position:absolute; top:1386px; left:58px; height:76px; width:1051px;' ></span><span class='ocr_line' style='position:absolute; top:1386px; left:93px; height:33px; width:782px;' ></span><span class='ocrx_word' style='position:absolute; top:1387px; left:93px; height:32px; width:118px;'>Nibehas</span><span class='ocrx_word' style='position:absolute; top:1387px; left:231px; height:26px; width:48px;'>und</span><span class='ocrx_word' style='position:absolute; top:1386px; left:298px; height:32px; width:123px;'>Tharthac</span><span class='ocrx_word' style='position:absolute; top:1386px; left:440px; height:27px; width:138px;'>anbeteten.</span><span class='ocrx_word' style='position:absolute; top:1388px; left:597px; height:24px; width:15px;'>2</span><span class='ocrx_word' style='position:absolute; top:1387px; left:630px; height:26px; width:64px;'>Kön.</span><span class='ocrx_word' style='position:absolute; top:1388px; left:716px; height:28px; width:38px;'>l7,</span><span class='ocrx_word' style='position:absolute; top:1386px; left:775px; height:27px; width:41px;'>24.</span><span class='ocrx_word' style='position:absolute; top:1387px; left:835px; height:26px; width:40px;'>31.</span><span class='ocr_line' style='position:absolute; top:1428px; left:58px; height:34px; width:1051px;' ></span><span class='ocrx_word' style='position:absolute; top:1428px; left:58px; height:30px; width:117px;'>Aven.</span><span class='ocrx_word' style='position:absolute; top:1429px; left:213px; height:33px; width:101px;'>Götze,</span><span class='ocrx_word' style='position:absolute; top:1428px; left:339px; height:27px; width:163px;'>Eitelleit.</span><span class='ocrx_word' style='position:absolute; top:1428px; left:538px; height:27px; width:42px;'>So</span><span class='ocrx_word' style='position:absolute; top:1429px; left:605px; height:26px; width:60px;'>wird</span><span class='ocrx_word' style='position:absolute; top:1428px; left:690px; height:33px; width:88px;'>Bethel</span><span class='ocrx_word' style='position:absolute; top:1429px; left:802px; height:33px; width:118px;'>genannt.</span><span class='ocrx_word' style='position:absolute; top:1428px; left:939px; height:34px; width:56px;'>Hos.</span><span class='ocrx_word' style='position:absolute; top:1431px; left:1023px; height:29px; width:38px;'>10,</span><span class='ocrx_word' style='position:absolute; top:1431px; left:1086px; height:25px; width:23px;'>8.</span><span class='ocr_par' style='position:absolute; top:1471px; left:92px; height:34px; width:1018px;' ></span><span class='ocr_line' style='position:absolute; top:1471px; left:92px; height:34px; width:1018px;' ></span><span class='ocrx_word' style='position:absolute; top:1478px; left:92px; height:27px; width:88px;'>wegen</span><span class='ocrx_word' style='position:absolute; top:1472px; left:199px; height:26px; width:42px;'>der</span><span class='ocrx_word' style='position:absolute; top:1471px; left:261px; height:33px; width:104px;'>Götzen,</span><span class='ocrx_word' style='position:absolute; top:1471px; left:390px; height:26px; width:39px;'>die</span><span class='ocrx_word' style='position:absolute; top:1471px; left:456px; height:32px; width:100px;'>daselbst</span><span class='ocrx_word' style='position:absolute; top:1476px; left:579px; height:21px; width:49px;'>von</span><span class='ocrx_word' style='position:absolute; top:1472px; left:651px; height:25px; width:43px;'>den</span><span class='ocrx_word' style='position:absolute; top:1471px; left:715px; height:32px; width:137px;'>Israeliten</span><span class='ocrx_word' style='position:absolute; top:1471px; left:877px; height:32px; width:96px;'>verehrt</span><span class='ocrx_word' style='position:absolute; top:1472px; left:1000px; height:26px; width:110px;'>wurden.</span><span class='ocr_par' style='position:absolute; top:1513px; left:91px; height:35px; width:1019px;' ></span><span class='ocr_line' style='position:absolute; top:1513px; left:91px; height:35px; width:1019px;' ></span><span class='ocrx_word' style='position:absolute; top:1515px; left:91px; height:26px; width:58px;'>Mit</span><span class='ocrx_word' style='position:absolute; top:1515px; left:167px; height:26px; width:53px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1520px; left:240px; height:28px; width:92px;'>ganzen</span><span class='ocrx_word' style='position:absolute; top:1513px; left:352px; height:27px; width:109px;'>Namen:</span><span class='ocrx_word' style='position:absolute; top:1513px; left:482px; height:31px; width:158px;'>Beth»Aven,</span><span class='ocrx_word' style='position:absolute; top:1513px; left:658px; height:27px; width:50px;'>das</span><span class='ocrx_word' style='position:absolute; top:1513px; left:726px; height:35px; width:167px;'>Götzenhaus,</span><span class='ocrx_word' style='position:absolute; top:1513px; left:914px; height:33px; width:65px;'>oder,</span><span class='ocrx_word' style='position:absolute; top:1514px; left:997px; height:26px; width:32px;'>da</span><span class='ocrx_word' style='position:absolute; top:1520px; left:1048px; height:21px; width:62px;'>man</span><span class='ocr_par' style='position:absolute; top:1555px; left:56px; height:78px; width:1054px;' ></span><span class='ocr_line' style='position:absolute; top:1555px; left:91px; height:33px; width:540px;' ></span><span class='ocrx_word' style='position:absolute; top:1558px; left:91px; height:26px; width:58px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1557px; left:169px; height:26px; width:85px;'>Eiteln</span><span class='ocrx_word' style='position:absolute; top:1556px; left:275px; height:31px; width:178px;'>nachwandelt.</span><span class='ocrx_word' style='position:absolute; top:1555px; left:473px; height:33px; width:59px;'>Hos.</span><span class='ocrx_word' style='position:absolute; top:1558px; left:549px; height:26px; width:22px;'>4,</span><span class='ocrx_word' style='position:absolute; top:1558px; left:593px; height:23px; width:38px;'>15.</span><span class='ocr_line' style='position:absolute; top:1597px; left:56px; height:36px; width:1054px;' ></span><span class='ocrx_word' style='position:absolute; top:1597px; left:56px; height:36px; width:186px;'>Augustus.</span><span class='ocrx_word' style='position:absolute; top:1597px; left:287px; height:34px; width:132px;'>Würdig</span><span class='ocrx_word' style='position:absolute; top:1598px; left:448px; height:32px; width:129px;'>verehrt</span><span class='ocrx_word' style='position:absolute; top:1598px; left:608px; height:26px; width:60px;'>und</span><span class='ocrx_word' style='position:absolute; top:1599px; left:704px; height:33px; width:172px;'>angebetet</span><span class='ocrx_word' style='position:absolute; top:1605px; left:908px; height:27px; width:36px;'>zu</span><span class='ocrx_word' style='position:absolute; top:1599px; left:978px; height:28px; width:132px;'>werden.</span><span class='ocr_par' style='position:absolute; top:1640px; left:92px; height:34px; width:1016px;' ></span><span class='ocr_line' style='position:absolute; top:1640px; left:92px; height:34px; width:1016px;' ></span><span class='ocrx_word' style='position:absolute; top:1640px; left:92px; height:34px; width:97px;'>Diesen</span><span class='ocrx_word' style='position:absolute; top:1640px; left:211px; height:27px; width:100px;'>Namen</span><span class='ocrx_word' style='position:absolute; top:1641px; left:340px; height:33px; width:46px;'>gab</span><span class='ocrx_word' style='position:absolute; top:1641px; left:413px; height:26px; width:46px;'>das</span><span class='ocrx_word' style='position:absolute; top:1640px; left:487px; height:32px; width:109px;'>romische</span><span class='ocrx_word' style='position:absolute; top:1640px; left:616px; height:27px; width:62px;'>Voll</span><span class='ocrx_word' style='position:absolute; top:1641px; left:706px; height:26px; width:52px;'>dem</span><span class='ocrx_word' style='position:absolute; top:1641px; left:781px; height:31px; width:88px;'>Kaiser</span><span class='ocrx_word' style='position:absolute; top:1641px; left:887px; height:31px; width:143px;'>Octavian,</span><span class='ocrx_word' style='position:absolute; top:1642px; left:1058px; height:26px; width:50px;'>und</span><span class='ocr_par' style='position:absolute; top:1682px; left:93px; height:34px; width:1015px;' ></span><span class='ocr_line' style='position:absolute; top:1682px; left:93px; height:34px; width:1015px;' ></span><span class='ocrx_word' style='position:absolute; top:1683px; left:93px; height:27px; width:49px;'>alle</span><span class='ocrx_word' style='position:absolute; top:1683px; left:161px; height:32px; width:130px;'>romischen</span><span class='ocrx_word' style='position:absolute; top:1683px; left:310px; height:32px; width:86px;'>Kaiser</span><span class='ocrx_word' style='position:absolute; top:1683px; left:416px; height:30px; width:79px;'>haben</span><span class='ocrx_word' style='position:absolute; top:1682px; left:514px; height:32px; width:80px;'>diesen</span><span class='ocrx_word' style='position:absolute; top:1682px; left:614px; height:27px; width:95px;'>Namen</span><span class='ocrx_word' style='position:absolute; top:1683px; left:728px; height:33px; width:170px;'>beibehalten,</span><span class='ocrx_word' style='position:absolute; top:1682px; left:917px; height:33px; width:47px;'>daß</span><span class='ocrx_word' style='position:absolute; top:1682px; left:983px; height:33px; width:31px;'>sie</span><span class='ocrx_word' style='position:absolute; top:1692px; left:1033px; height:18px; width:75px;'>«au,-</span><span class='ocr_par' style='position:absolute; top:1724px; left:55px; height:119px; width:1052px;' ></span><span class='ocr_line' style='position:absolute; top:1724px; left:90px; height:35px; width:907px;' ></span><span class='ocrx_word' style='position:absolute; top:1733px; left:90px; height:25px; width:52px;'>per</span><span class='ocrx_word' style='position:absolute; top:1727px; left:160px; height:31px; width:124px;'>2ußr>«ti,</span><span class='ocrx_word' style='position:absolute; top:1726px; left:304px; height:25px; width:22px;'>d.</span><span class='ocrx_word' style='position:absolute; top:1724px; left:345px; height:26px; width:15px;'>i,</span><span class='ocrx_word' style='position:absolute; top:1725px; left:382px; height:32px; width:80px;'>allzeit</span><span class='ocrx_word' style='position:absolute; top:1725px; left:482px; height:31px; width:99px;'>Mehrer</span><span class='ocrx_word' style='position:absolute; top:1725px; left:600px; height:26px; width:43px;'>des</span><span class='ocrx_word' style='position:absolute; top:1724px; left:664px; height:32px; width:86px;'>Reichs</span><span class='ocrx_word' style='position:absolute; top:1725px; left:770px; height:34px; width:115px;'>geheißen</span><span class='ocrx_word' style='position:absolute; top:1725px; left:904px; height:33px; width:93px;'>haben.</span><span class='ocr_line' style='position:absolute; top:1766px; left:55px; height:34px; width:897px;' ></span><span class='ocrx_word' style='position:absolute; top:1766px; left:55px; height:34px; width:121px;'>Avith.</span><span class='ocrx_word' style='position:absolute; top:1767px; left:212px; height:32px; width:112px;'>Haufe.</span><span class='ocrx_word' style='position:absolute; top:1766px; left:361px; height:27px; width:63px;'>Eine</span><span class='ocrx_word' style='position:absolute; top:1766px; left:443px; height:28px; width:81px;'>Stadt</span><span class='ocrx_word' style='position:absolute; top:1768px; left:542px; height:25px; width:27px;'>in</span><span class='ocrx_word' style='position:absolute; top:1767px; left:587px; height:32px; width:122px;'>Idumäa.</span><span class='ocrx_word' style='position:absolute; top:1769px; left:732px; height:24px; width:10px;'>1</span><span class='ocrx_word' style='position:absolute; top:1767px; left:763px; height:32px; width:68px;'>Mos.</span><span class='ocrx_word' style='position:absolute; top:1769px; left:849px; height:29px; width:43px;'>36,</span><span class='ocrx_word' style='position:absolute; top:1769px; left:910px; height:26px; width:42px;'>35.</span><span class='ocr_line' style='position:absolute; top:1809px; left:57px; height:34px; width:1050px;' ></span><span class='ocrx_word' style='position:absolute; top:1809px; left:57px; height:30px; width:125px;'>Aulon.</span><span class='ocrx_word' style='position:absolute; top:1809px; left:236px; height:34px; width:209px;'>Ausgehöhlt.</span><span class='ocrx_word' style='position:absolute; top:1809px; left:491px; height:27px; width:62px;'>Das</span><span class='ocrx_word' style='position:absolute; top:1809px; left:581px; height:34px; width:72px;'>große</span><span class='ocrx_word' style='position:absolute; top:1809px; left:681px; height:32px; width:76px;'>Thal,</span><span class='ocrx_word' style='position:absolute; top:1810px; left:791px; height:27px; width:80px;'>worin</span><span class='ocrx_word' style='position:absolute; top:1810px; left:897px; height:27px; width:38px;'>die</span><span class='ocrx_word' style='position:absolute; top:1809px; left:962px; height:34px; width:145px;'>berühmten</span><span class='ocr_par' style='position:absolute; top:1851px; left:89px; height:36px; width:1017px;' ></span><span class='ocr_line' style='position:absolute; top:1851px; left:89px; height:36px; width:1017px;' ></span><span class='ocrx_word' style='position:absolute; top:1853px; left:89px; height:29px; width:97px;'>Städte</span><span class='ocrx_word' style='position:absolute; top:1852px; left:204px; height:34px; width:111px;'>Vethsan</span><span class='ocrx_word' style='position:absolute; top:1852px; left:334px; height:27px; width:56px;'>oder</span><span class='ocrx_word' style='position:absolute; top:1852px; left:409px; height:34px; width:179px;'>Scythopolis,</span><span class='ocrx_word' style='position:absolute; top:1851px; left:605px; height:34px; width:127px;'>Tlberias,</span><span class='ocrx_word' style='position:absolute; top:1852px; left:751px; height:35px; width:111px;'>Iericho,</span><span class='ocrx_word' style='position:absolute; top:1851px; left:881px; height:29px; width:48px;'>das</span><span class='ocrx_word' style='position:absolute; top:1853px; left:949px; height:27px; width:64px;'>todte</span><span class='ocrx_word' style='position:absolute; top:1852px; left:1033px; height:28px; width:73px;'>Meer</span></div>
|
metadata
CHANGED
@@ -1,82 +1,95 @@
|
|
1
|
-
--- !ruby/object:Gem::Specification
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
2
|
name: rhocr
|
3
|
-
version: !ruby/object:Gem::Version
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: '0.1'
|
4
5
|
prerelease:
|
5
|
-
version: 0.0.3
|
6
6
|
platform: ruby
|
7
|
-
authors:
|
7
|
+
authors:
|
8
8
|
- Andreas Neumann
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
|
13
|
-
|
14
|
-
|
15
|
-
|
16
|
-
|
12
|
+
date: 2011-09-08 00:00:00.000000000Z
|
13
|
+
dependencies:
|
14
|
+
- !ruby/object:Gem::Dependency
|
15
|
+
name: nokogiri
|
16
|
+
requirement: &70276550001820 !ruby/object:Gem::Requirement
|
17
|
+
none: false
|
18
|
+
requirements:
|
19
|
+
- - ! '>='
|
20
|
+
- !ruby/object:Gem::Version
|
21
|
+
version: '0'
|
22
|
+
type: :runtime
|
23
|
+
prerelease: false
|
24
|
+
version_requirements: *70276550001820
|
17
25
|
description: Manipulate and use OCR data encode in HOCR
|
18
|
-
email:
|
26
|
+
email: andreas@neumann.biz
|
19
27
|
executables: []
|
20
|
-
|
21
28
|
extensions: []
|
22
|
-
|
23
|
-
extra_rdoc_files:
|
29
|
+
extra_rdoc_files:
|
24
30
|
- README
|
25
|
-
-
|
31
|
+
- TODO.txt
|
32
|
+
- lib/hocr_box.rb
|
33
|
+
- lib/ocr_document.rb
|
34
|
+
- lib/ocr_element.rb
|
26
35
|
- lib/ocr_page.rb
|
27
|
-
- lib/ocrx_word.rb
|
28
36
|
- lib/rhocr.rb
|
29
|
-
files:
|
37
|
+
files:
|
30
38
|
- Manifest
|
31
39
|
- README
|
32
40
|
- Rakefile
|
41
|
+
- TODO.txt
|
42
|
+
- data/Seite_Die_Gartenlaube_242.html
|
33
43
|
- data/Seite_Tagebuch_H_C_Lang_08.html
|
44
|
+
- data/Seite_Tagebuch_H_C_Lang_08.jpg
|
45
|
+
- data/test.html
|
46
|
+
- data/test.png
|
34
47
|
- example/example_server.rb
|
35
48
|
- example/public/OCRTest.css
|
36
49
|
- example/public/OCRTest.html
|
37
50
|
- example/public/OCRTest_marker.js
|
38
|
-
- example/public/
|
51
|
+
- example/public/Seite_Tagebuch_H_C_Lang_08.jpg
|
39
52
|
- example/public/img/Seite_Tagebuch_H_C_Lang_08.jpg
|
40
|
-
- lib/
|
53
|
+
- lib/hocr_box.rb
|
54
|
+
- lib/ocr_document.rb
|
55
|
+
- lib/ocr_element.rb
|
41
56
|
- lib/ocr_page.rb
|
42
|
-
- lib/ocrx_word.rb
|
43
57
|
- lib/rhocr.rb
|
44
58
|
- rhocr.gemspec
|
45
|
-
-
|
46
|
-
-
|
47
|
-
-
|
48
|
-
|
59
|
+
- spec/hocr_box_spec.rb
|
60
|
+
- spec/ocr_document_spec.rb
|
61
|
+
- spec/ocr_element_spec.rb
|
62
|
+
- spec/ocr_page_spec.rb
|
63
|
+
- spec/rhocr_spec.rb
|
64
|
+
- test.html
|
49
65
|
homepage: http://github.com/daandi/rhocr
|
50
66
|
licenses: []
|
51
|
-
|
52
67
|
post_install_message:
|
53
|
-
rdoc_options:
|
68
|
+
rdoc_options:
|
54
69
|
- --line-numbers
|
55
70
|
- --inline-source
|
56
71
|
- --title
|
57
72
|
- Rhocr
|
58
73
|
- --main
|
59
74
|
- README
|
60
|
-
require_paths:
|
75
|
+
require_paths:
|
61
76
|
- lib
|
62
|
-
required_ruby_version: !ruby/object:Gem::Requirement
|
77
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
63
78
|
none: false
|
64
|
-
requirements:
|
65
|
-
- -
|
66
|
-
- !ruby/object:Gem::Version
|
67
|
-
version:
|
68
|
-
required_rubygems_version: !ruby/object:Gem::Requirement
|
79
|
+
requirements:
|
80
|
+
- - ! '>='
|
81
|
+
- !ruby/object:Gem::Version
|
82
|
+
version: '0'
|
83
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
69
84
|
none: false
|
70
|
-
requirements:
|
71
|
-
- -
|
72
|
-
- !ruby/object:Gem::Version
|
73
|
-
version:
|
85
|
+
requirements:
|
86
|
+
- - ! '>='
|
87
|
+
- !ruby/object:Gem::Version
|
88
|
+
version: '1.2'
|
74
89
|
requirements: []
|
75
|
-
|
76
90
|
rubyforge_project: rhocr
|
77
|
-
rubygems_version: 1.6
|
91
|
+
rubygems_version: 1.8.6
|
78
92
|
signing_key:
|
79
93
|
specification_version: 3
|
80
94
|
summary: Manipulate and use OCR data encode in HOCR
|
81
95
|
test_files: []
|
82
|
-
|
Binary file
|
data/lib/ocr_box.rb
DELETED
@@ -1,43 +0,0 @@
|
|
1
|
-
#coding: utf-8
|
2
|
-
|
3
|
-
class OCRBox
|
4
|
-
|
5
|
-
attr_reader :x1, :y1, :x2, :y2
|
6
|
-
|
7
|
-
def initialize(x1, y1 , x2, y2)
|
8
|
-
@x1 = x1
|
9
|
-
@y1 = y1
|
10
|
-
@x2 = x2
|
11
|
-
@y2 = y2
|
12
|
-
end
|
13
|
-
|
14
|
-
def encloses?(element)
|
15
|
-
@x1 <= element.x1 and
|
16
|
-
@x2 >= element.x2 and
|
17
|
-
@y1 <= element.y1 and
|
18
|
-
@y2 >= element.y2
|
19
|
-
end
|
20
|
-
|
21
|
-
def enclosed_by?(element)
|
22
|
-
return element.encloses? self
|
23
|
-
end
|
24
|
-
|
25
|
-
def to_s
|
26
|
-
"tl->(x:#{@x1} y:#{@y1})/br->:(x:#{@x2} y:#{@y2})"
|
27
|
-
end
|
28
|
-
|
29
|
-
def to_css_style
|
30
|
-
top = @y1
|
31
|
-
left = @x1
|
32
|
-
height = @y2 - @y1
|
33
|
-
width = @x2 - @x1
|
34
|
-
|
35
|
-
"position:absolute; top:#{top}px; left:#{left}px; height:#{height}px; width:#{width}px;"
|
36
|
-
end
|
37
|
-
|
38
|
-
def to_json
|
39
|
-
|
40
|
-
end
|
41
|
-
|
42
|
-
end
|
43
|
-
|
data/lib/ocrx_word.rb
DELETED
@@ -1,23 +0,0 @@
|
|
1
|
-
#coding: utf-8
|
2
|
-
|
3
|
-
require 'cgi'
|
4
|
-
require_relative 'ocr_box'
|
5
|
-
|
6
|
-
class OCRXWord < OCRBox
|
7
|
-
|
8
|
-
attr_reader :text
|
9
|
-
|
10
|
-
def initialize(x1,y1,x2,y2,word)
|
11
|
-
super(x1.to_i, y1.to_i, x2.to_i, y2.to_i)
|
12
|
-
@text = word
|
13
|
-
end
|
14
|
-
|
15
|
-
def to_html(css_class = 'ocrx_word')
|
16
|
-
"<span style='#{ to_css_style }' class='#{css_class}'><span class='word'>" + CGI::escapeHTML(@text) +"</span></span>"
|
17
|
-
end
|
18
|
-
|
19
|
-
def to_s
|
20
|
-
"#{@text}\t#{super}"
|
21
|
-
end
|
22
|
-
|
23
|
-
end
|
data/rspec/ocr_box_spec.rb
DELETED
@@ -1,48 +0,0 @@
|
|
1
|
-
#coding: utf-8
|
2
|
-
|
3
|
-
require_relative '../lib/ocr_box'
|
4
|
-
|
5
|
-
describe OCRBox do
|
6
|
-
|
7
|
-
before(:each) do
|
8
|
-
@box ||= OCRBox.new(1,2,20,8)
|
9
|
-
end
|
10
|
-
|
11
|
-
describe "#to_s" do
|
12
|
-
it "prints a human readable Box-Version with coordinates upper_left(x,y) bottom_right(x,y)" do
|
13
|
-
@box.to_s.should == "tl->(x:1 y:2)/br->:(x:20 y:8)"
|
14
|
-
end
|
15
|
-
end
|
16
|
-
|
17
|
-
describe '#encloses?(element)' do
|
18
|
-
it "tests wather given OCRBox is enclosed by the current OCRBox" do
|
19
|
-
@box.encloses?( OCRBox.new(0,3,19,7) ).should be_false
|
20
|
-
@box.encloses?( OCRBox.new(2,3,19,7) ).should be_true
|
21
|
-
end
|
22
|
-
it "encloses also itself" do
|
23
|
-
@box.encloses?( @box ).should be_true
|
24
|
-
end
|
25
|
-
end
|
26
|
-
|
27
|
-
describe '#to_css_style' do
|
28
|
-
it 'should create css-style attributes' do
|
29
|
-
@box.to_css_style.should == 'position:absolute; top:2px; left:1px; height:6px; width:19px;'
|
30
|
-
end
|
31
|
-
end
|
32
|
-
|
33
|
-
describe '#enclosed_by?(element)' do
|
34
|
-
it 'should be enclosed by Boxes bigger than itself' do
|
35
|
-
@box.enclosed_by?( OCRBox.new(0,1,21,9) ).should be_true
|
36
|
-
end
|
37
|
-
it 'should not be enclosed by Boxes smaller than itself' do
|
38
|
-
@box.enclosed_by?( OCRBox.new(2,3,19,7) ).should be_false
|
39
|
-
end
|
40
|
-
it 'should be enclosed by Boxes of the same size' do
|
41
|
-
@box.enclosed_by?( @box ).should be_true
|
42
|
-
end
|
43
|
-
end
|
44
|
-
|
45
|
-
|
46
|
-
|
47
|
-
|
48
|
-
end
|
data/rspec/ocr_page_spec.rb
DELETED
@@ -1,17 +0,0 @@
|
|
1
|
-
#coding: utf-8
|
2
|
-
|
3
|
-
require_relative '../lib/ocr_page'
|
4
|
-
|
5
|
-
describe OCRPage do
|
6
|
-
|
7
|
-
before(:each) do
|
8
|
-
@ocr_page ||= OCRPage.new('../data/Seite_Tagebuch_H_C_Lang_08.html')
|
9
|
-
end
|
10
|
-
|
11
|
-
describe '' do
|
12
|
-
it '' do
|
13
|
-
p @ocr_page.enclosed_words( OCRBox.new(500,1703,1200,1800) )
|
14
|
-
end
|
15
|
-
end
|
16
|
-
|
17
|
-
end
|
data/rspec/ocrx_word_spec.rb
DELETED
@@ -1,32 +0,0 @@
|
|
1
|
-
#coding: utf-8
|
2
|
-
|
3
|
-
require_relative '../lib/ocrx_word'
|
4
|
-
|
5
|
-
describe OCRXWord do
|
6
|
-
|
7
|
-
before(:each) do
|
8
|
-
@ocrx_word = OCRXWord.new(10,15,20,20,'WORT')
|
9
|
-
end
|
10
|
-
|
11
|
-
describe '#to_s' do
|
12
|
-
it 'should print the coordinates of the box and the textual information' do
|
13
|
-
p @ocrx_word
|
14
|
-
@ocrx_word.to_s.should == "WORT\ttl->(x:10 y:15)/br->:(x:20 y:20)"
|
15
|
-
end
|
16
|
-
end
|
17
|
-
|
18
|
-
describe '#to_html(css_class)' do
|
19
|
-
it 'should create an span elment to overlay an image on an html-page' do
|
20
|
-
@ocrx_word.to_html.should == "<span style='position:absolute; top:15px; left:10px; height:5px; width:10px;' class='ocrx_word'><span class='word'>WORT</span></span>"
|
21
|
-
end
|
22
|
-
|
23
|
-
it 'no css_class_class given should default to ocrx_word' do
|
24
|
-
@ocrx_word.to_html.should =~ /class='ocrx_word'/
|
25
|
-
end
|
26
|
-
|
27
|
-
it 'css_class given should be part of genearted html' do
|
28
|
-
@ocrx_word.to_html('rosebud').should =~ /class='rosebud'/
|
29
|
-
end
|
30
|
-
end
|
31
|
-
|
32
|
-
end
|