-
Notifications
You must be signed in to change notification settings - Fork 6
/
ocrd-tool.json
89 lines (89 loc) · 2.74 KB
/
ocrd-tool.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
{
"version": "0.0.2",
"git_url": "https://github.com/jkamlah/ocrd_pagetopdf",
"tools": {
"ocrd-pagetopdf": {
"executable": "ocrd-pagetopdf",
"description": "Convert text and layout annotations to PDF format (overlaying original image with text layer and polygon outlines)",
"categories": [
"Long-term preservation"
],
"steps": [
"postprocessing/format-conversion"
],
"input_file_grp": [
"OCR-D-OCR-PAGE"
],
"output_file_grp": [
"OCR-D-OCR-PDF"
],
"parameters": {
"font": {
"description": "Font file to be used in PDF file. If unset, AletheiaSans.ttf is used. (Make sure to pick a font which covers all glyphs!)",
"type": "string",
"format": "uri",
"content-type": "application/x-font-ttf",
"default": ""
},
"outlines": {
"description": "What segment hierarchy to draw coordinate outlines for. If unset, no outlines are drawn.",
"type": "string",
"default": "",
"enum": [
"",
"region",
"line",
"word",
"glyph"
]
},
"textequiv_level": {
"description": "What segment hierarchy level to render text output from. If unset, no text is rendered.",
"type": "string",
"default": "",
"enum": [
"",
"region",
"line",
"word",
"glyph"
]
},
"negative2zero": {
"description": "Set all negative box values to 0",
"type": "boolean",
"default": false
},
"ext": {
"description": "Output filename extension",
"type": "string",
"default": ".pdf"
},
"multipage": {
"description": "Merge all PDFs into one multipage file. The value is used as filename for the pdf.",
"type": "string",
"default": ""
},
"pagelabel": {
"description": "Parameter for 'multipage': Set the page information, which will be used as pagelabel. Default is 'pageId', e.g. the option 'pagenumber' will create numbered pagelabel consecutively",
"type": "string",
"default": "pageId",
"enum": [
"pagenumber",
"pageId",
"basename",
"basename_without_extension",
"local_filename",
"ID",
"url"
]
},
"script-args": {
"description": "Extra arguments to PageToPdf (see https://github.com/PRImA-Research-Lab/prima-page-to-pdf)",
"type": "string",
"default": ""
}
}
}
}
}