-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathconfig-fi.json
30 lines (30 loc) · 1.02 KB
/
config-fi.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
{
"LANGUAGE": "finnish",
"FASTTEXT_PATH": "./fasttext",
"BIN_FILE": "cc.fi.300.bin",
"VEC_FILE": "cc.fi.300.vec",
"OUT_FILE": "cc.fi.300.filtered.vec",
"VOCAB_FILE": "cc.fi.300.filtered.vocab",
"_comment_regex_positive": "C, Q, W, X or Z excluded",
"REGEX_POSITIVE": "([abd-pr-vyABD-PR-VYÄäÖöÅ劚Žž\\-\\']+$)",
"_comment_regex_negative_1": "Exclude words beginning with dash",
"_comment_regex_negative_2": "and containing consecutive dashes",
"REGEX_NEGATIVE": "^-|--",
"_comment_regex_foreign": "Exclude if matches and doesn't pass spell check",
"REGEX_FOREIGN": "[Å劚Žž]",
"_comment_regex_repeat": "Exclude if 3 or more consecutive repeated letters",
"REGEX_REPEAT": "(\\w)\\1{2,}",
"RANDOM_CONSONANTS": "bdfghjklmnprstv",
"RANDOM_MIN_LENGTH": "4",
"RANDOM_MAX_LENGTH": "20",
"NN_LOOP_CUTOFF": "100",
"NN_LOOP_WORDS": "1000",
"DATABASE": {
"dbname": "decrapper",
"table": "garbwords",
"user": "root",
"password": "",
"host": "localhost",
"port": "3306"
}
}