ocrd 3.1.0__py3-none-any.whl → 3.1.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ocrd/ocrd-all-tool.json +43 -19
- {ocrd-3.1.0.dist-info → ocrd-3.1.1.dist-info}/METADATA +1 -1
- {ocrd-3.1.0.dist-info → ocrd-3.1.1.dist-info}/RECORD +7 -7
- {ocrd-3.1.0.dist-info → ocrd-3.1.1.dist-info}/LICENSE +0 -0
- {ocrd-3.1.0.dist-info → ocrd-3.1.1.dist-info}/WHEEL +0 -0
- {ocrd-3.1.0.dist-info → ocrd-3.1.1.dist-info}/entry_points.txt +0 -0
- {ocrd-3.1.0.dist-info → ocrd-3.1.1.dist-info}/top_level.txt +0 -0
ocrd/ocrd-all-tool.json
CHANGED
|
@@ -1,21 +1,45 @@
|
|
|
1
1
|
{
|
|
2
|
-
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
|
|
14
|
-
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
}
|
|
2
|
+
"ocrd-dummy": {
|
|
3
|
+
"executable": "ocrd-dummy",
|
|
4
|
+
"description": "Bare-bones processor creates PAGE-XML and optionally copies file from input group to output group",
|
|
5
|
+
"steps": [
|
|
6
|
+
"preprocessing/optimization"
|
|
7
|
+
],
|
|
8
|
+
"categories": [
|
|
9
|
+
"Image preprocessing"
|
|
10
|
+
],
|
|
11
|
+
"input_file_grp_cardinality": 1,
|
|
12
|
+
"output_file_grp_cardinality": 1,
|
|
13
|
+
"parameters": {
|
|
14
|
+
"copy_files": {
|
|
15
|
+
"type": "boolean",
|
|
16
|
+
"default": false,
|
|
17
|
+
"description": "Whether to actually copy files (true) or just create PAGE-XML as a side effect (false)"
|
|
18
|
+
}
|
|
20
19
|
}
|
|
21
|
-
}
|
|
20
|
+
},
|
|
21
|
+
"ocrd-filter": {
|
|
22
|
+
"executable": "ocrd-filter",
|
|
23
|
+
"description": "Bare-bones processor can be dynamically configured to remove segments based on XPath queries",
|
|
24
|
+
"steps": [
|
|
25
|
+
"recognition/post-correction"
|
|
26
|
+
],
|
|
27
|
+
"categories": [
|
|
28
|
+
"Quality assurance"
|
|
29
|
+
],
|
|
30
|
+
"input_file_grp_cardinality": 1,
|
|
31
|
+
"output_file_grp_cardinality": 1,
|
|
32
|
+
"parameters": {
|
|
33
|
+
"select": {
|
|
34
|
+
"type": "string",
|
|
35
|
+
"default": "//*[ends-with(local-name(),'Region')]",
|
|
36
|
+
"description": "Which segments to select for removal. An XPath 2.0 query expression (path and optional predicates), with 'pc' as namespace prefix for PAGE-XML and our extension functions (see help text). Only selection of segment hierarchy elements is allowed (so e.g. `*` would be equivalent to `pc:NoiseRegion|pc:LineDrawingRegion|pc:AdvertRegion|pc:ImageRegion|pc:ChartRegion|pc:MusicRegion|pc:GraphicRegion|pc:UnknownRegion|pc:CustomRegion|pc:SeparatorRegion|pc:MathsRegion|pc:TextRegion|pc:MapRegion|pc:ChemRegion|pc:TableRegion|pc:TextLine|pc:Word|pc:Glyph`, but `pc:MetadataItem` or `pc:Border` or `pc:Coords` would not match).\nFor example, to remove words or glyphs with low text confidence, select '(pc:Word|pc:Glyph)[pc:TextEquiv/@conf < 0.7]'. Or low layout confidence, '*[pc:Coords/@conf < 0.7]'.\nTo remove high pixel-to-character rate, select '*[pc:pixelarea(.) div string-length(pc:textequiv(.)) > 10000]'."
|
|
37
|
+
},
|
|
38
|
+
"plot": {
|
|
39
|
+
"type": "boolean",
|
|
40
|
+
"default": false,
|
|
41
|
+
"description": "Whether to extract an image for each filtered segment and write to the output fileGrp."
|
|
42
|
+
}
|
|
43
|
+
}
|
|
44
|
+
}
|
|
45
|
+
}
|
|
@@ -2,7 +2,7 @@ ocrd/__init__.py,sha256=ZswMVmlqFhAEIzMR3my6IKPq9XLH21aDPC_m_8Jh4dA,1076
|
|
|
2
2
|
ocrd/constants.py,sha256=6dn3mG54WqHsKInmLZp4kJjNqqPtBoFoSuLUuRbOps0,740
|
|
3
3
|
ocrd/lib.bash,sha256=le6XqAOEacdjP3JNSlPkxwRH1y0oVjNQM2tX5d6QFO4,10901
|
|
4
4
|
ocrd/mets_server.py,sha256=EL6CMtVjmVPs9--3Vn-JyhU2VDMNw-6QN_XWRKFp6uk,22451
|
|
5
|
-
ocrd/ocrd-all-tool.json,sha256=
|
|
5
|
+
ocrd/ocrd-all-tool.json,sha256=EYXmMzP68p3KzL8nUZ16TCX2chQzKkAeISvuXqI_yIw,2094
|
|
6
6
|
ocrd/resolver.py,sha256=Ba9ALQbTXz6_mla4VqN9tAfHoj6aKuNJAU4tIDnjcHE,14952
|
|
7
7
|
ocrd/resource_list.yml,sha256=82-PiqkZnka1kTj3MQqNn4wXWKHHtoFchsQuetWuqFs,2633
|
|
8
8
|
ocrd/resource_manager.py,sha256=kIWDoKxWH4IJE1gcoTcCRQjYjieCqiQclyuyF6Y9b8A,16813
|
|
@@ -120,9 +120,9 @@ ocrd_validators/xlink.xsd,sha256=8fW7YAMWXN2PbB_MMvj9H5ZeFoEBDzuYBtlGC8_6ijw,318
|
|
|
120
120
|
ocrd_validators/xsd_mets_validator.py,sha256=4GWfLyqkmca0x7osDuXuExYuM0HWVrKoqn0S35sFhHU,467
|
|
121
121
|
ocrd_validators/xsd_page_validator.py,sha256=BNz_9u-Ek4UCeyZu3KxSQoolfW9lvuaSR9nIu1XXxeE,467
|
|
122
122
|
ocrd_validators/xsd_validator.py,sha256=6HrVAf6SzCvfUIuQdIzz9bOq4V-zhyii9yrUPoK2Uvo,2094
|
|
123
|
-
ocrd-3.1.
|
|
124
|
-
ocrd-3.1.
|
|
125
|
-
ocrd-3.1.
|
|
126
|
-
ocrd-3.1.
|
|
127
|
-
ocrd-3.1.
|
|
128
|
-
ocrd-3.1.
|
|
123
|
+
ocrd-3.1.1.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
|
124
|
+
ocrd-3.1.1.dist-info/METADATA,sha256=athV-jzUTYFDjcbykQcSH6JXva7mNDVyHJgf3LCof8s,10442
|
|
125
|
+
ocrd-3.1.1.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
|
|
126
|
+
ocrd-3.1.1.dist-info/entry_points.txt,sha256=4hcJ2LkK_OlIabHnKgFit35Ap7b5Lz1Gb4hzkxV0Kiw,152
|
|
127
|
+
ocrd-3.1.1.dist-info/top_level.txt,sha256=pUgiN42t4KXC5rvpi6V8atza31XP4SCznXpXlVlvomM,75
|
|
128
|
+
ocrd-3.1.1.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|