-
Notifications
You must be signed in to change notification settings - Fork 2
/
exemple.xml
36 lines (36 loc) · 1.23 KB
/
exemple.xml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
<?xml version="1.0" encoding="UTF-8"?>
<?xml-model href="protogenie/schema.rng" schematypens="http://relaxng.org/ns/structure/1.0"?>
<config>
  <!-- Output settings: column_marker is set to TAB.
       NOTE(review): the output header contains a single empty key; confirm
       against the schema that an empty key is intended here. -->
  <output column_marker="TAB">
    <header>
      <key/>
    </header>
  </output>

  <!-- NOTE(review): presumably the CSV file in which the tool records its
       state between runs; confirm against the schema. -->
  <memory path="memory.csv"/>

  <!-- Shared header definition of type "order". Each key carries a map-to
       name (token, lemma, POS, morph) and a numeric value from 0 to 3.
       NOTE(review): the values look like zero-based column positions, and
       this block is presumably what a corpus selects with
       header type="default"; verify both assumptions. -->
  <default-header>
    <header type="order">
      <key map-to="token">0</key>
      <key map-to="lemma">1</key>
      <key map-to="POS">2</key>
      <key map-to="morph">3</key>
    </header>
  </default-header>

  <!-- Four TAB-delimited corpora. Each one names its own splitter and uses
       the "default" header type. -->
  <corpora>
    <!-- Splitter "token_window" with a window of 20.
         NOTE(review): presumably groups rows in windows of 20 tokens. -->
    <corpus path="datasets/chrestien.tsv" column_marker="TAB">
      <splitter name="token_window" window="20"/>
      <header type="default"/>
    </corpus>

    <!-- Splitter "punctuation"; the configured sentence markers are the
         four characters ; ? ! and . -->
    <corpus path="datasets/dotmarkers.tsv" column_marker="TAB">
      <splitter name="punctuation" sentence_markers=";?!."/>
      <header type="default"/>
    </corpus>

    <!-- Splitter "empty_line", configured without further attributes.
         NOTE(review): presumably treats blank lines as unit boundaries. -->
    <corpus path="datasets/empty_line.tsv" column_marker="TAB">
      <splitter name="empty_line"/>
      <header type="default"/>
    </corpus>

    <!-- Splitter "file_split", configured without further attributes.
         NOTE(review): presumably assigns the file as a whole; confirm. -->
    <corpus path="datasets/flow.tsv" column_marker="TAB">
      <splitter name="file_split"/>
      <header type="default"/>
    </corpus>
  </corpora>
</config>