forked from czcorpus/xmlanntools
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathveld_xml2vrt.yaml
87 lines (82 loc) · 2.23 KB
/
veld_xml2vrt.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
# VELD metadata for this code veld. Keys prefixed with "x-" are Compose
# extension fields, so this section is descriptive only and does not define
# any service.
x-veld:
  code:
    description: >-
      A demo code veld, integrating the xml2vrt script. For more documentation,
      see: https://github.com/czcorpus/xmlanntools?tab=readme-ov-file#xml2vrt
    topic:
      - NLP
      - ETL

    # Input mounts; each entry pairs a container path with the environment
    # variable declared for it in the service below.
    input:
      - volume: /veld/input/data/
        environment_var: in_ann_xml_file
        file_type: xml
      - volume: /veld/input/config/
        environment_var: in_ann2standoff_ini_file
        file_type: ini

    # Output mount.
    # NOTE(review): the variable name says "conlluish" although this veld wraps
    # xml2vrt -- presumably carried over from a sibling veld; confirm before
    # renaming, since the wrapper script may read it by this exact name.
    output:
      - volume: /veld/output/
        environment_var: out_conlluish_xml_file
        file_type: xml

    # Optional settings, all supplied as environment variables.
    # NOTE(review): they appear to mirror xml2vrt command-line options; verify
    # against veld_xml2vrt.sh.
    config:
      # String-valued settings (no default declared).
      - environment_var: attributes
        var_type: str
        optional: true
      - environment_var: token_element
        var_type: str
        optional: true
      - environment_var: include_elements
        var_type: str
        optional: true
      - environment_var: exclude_elements
        var_type: str
        optional: true

      # Boolean switches, off by default.
      - environment_var: keep_token_tags
        var_type: bool
        default: false
        optional: true
      - environment_var: keep_empty
        var_type: bool
        default: false
        optional: true
      - environment_var: discard_freetext
        var_type: bool
        default: false
        optional: true
      - environment_var: no_glue
        var_type: bool
        default: false
        optional: true

      - environment_var: glue
        var_type: str
        optional: true

      - environment_var: fragment
        var_type: bool
        default: false
        optional: true
      - environment_var: no_flattening
        var_type: bool
        default: false
        optional: true
# Compose service that builds the image from this directory and runs the
# xml2vrt wrapper script with the repository and data folders bind-mounted.
services:
  veld_xml2vrt:
    build: .
    volumes:
      # The repository itself, so the wrapper script is available in the
      # container under /veld/code/.
      - ./:/veld/code/
      # Host data folders mapped onto the input/output paths used by the veld.
      - ./data/xml2vrt/in/data/:/veld/input/data/
      - ./data/xml2vrt/in/config/:/veld/input/config/
      - ./data/xml2vrt/out/:/veld/output/
    command: bash /veld/code/veld_xml2vrt.sh
    environment:
      # Entries set to null carry no value in this file; per the Compose file
      # reference such variables are resolved from the environment Compose is
      # started in, and stay unset in the container when not defined there.
      in_ann_xml_file: null
      in_ann2standoff_ini_file: null
      out_conlluish_xml_file: null
      attributes: null
      token_element: null
      include_elements: null
      exclude_elements: null
      # Boolean-like values are quoted so they reach the container as the
      # literal string "false" instead of being retyped by the YAML parser
      # (legacy docker-compose rejects bare booleans in `environment`).
      keep_token_tags: "false"
      keep_empty: "false"
      discard_freetext: "false"
      no_glue: "false"
      glue: null
      fragment: "false"
      no_flattening: "false"