-
Notifications
You must be signed in to change notification settings - Fork 0
/
config.yaml
50 lines (44 loc) · 1.01 KB
/
config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
# File paths
# NOTE(review): the nesting in this section is reconstructed; the reviewed
# copy had lost its indentation. Confirm the key layout against the code
# that loads this config.

# Pickled datasets under data/processed/.
data:
  cleaned: data/processed/cleaned.pkl
  features: data/processed/features.pkl
  targets: data/processed/targets.pkl

# Pickled lookup maps under data/reference/.
reference:
  features_map: data/reference/features_map.pkl
  targets_map: data/reference/targets_map.pkl

# Treebank inputs (data/raw/) and intermediate pickles (data/interim/).
perseus:
  # NOTE(review): raw_dir points into v1.6/greek while tagset points into
  # v2.0/Greek (different version, different case) — confirm both are
  # intentional; the case difference matters on case-sensitive filesystems.
  raw_dir: data/raw/treebank_data-master/v1.6/greek/data
  tagset: data/raw/treebank_data-master/v2.0/Greek/TAGSETS.xml
  raw: data/interim/perseus_raw.pkl
  normalized: data/interim/perseus_normalized.pkl
# Training configs
# NOTE(review): nesting reconstructed; the reviewed copy had lost its
# indentation. Confirm against the code that loads this config.
runs:
  # Directory that holds run output (relative path).
  runs_dir: runs
  # The original gave `run` no value. It is written as an explicit null so
  # the empty value is visibly deliberate; the parsed value is unchanged.
  # NOTE(review): presumably filled in at runtime or left unset — confirm.
  run: null
# Training settings.
# test_split and tune_split must be nested mappings: they share the keys
# n_splits / train_size / random_state, which would otherwise be duplicate
# keys where the last value silently wins.
# NOTE(review): placing the remaining keys under `train` is reconstructed
# from a copy that had lost its indentation — confirm against the loader.
train:
  # Presumably a dotted Python module path that provides the classifiers
  # listed in `clfs` — verify against the training code.
  clf_module: cgpos.model.multinomial_naive_bayes
  # Classifier names; the same names appear as keys of `param_grid`.
  clfs: [MultinomialNaiveBayes, StupidBayes]
  test_split:
    n_splits: 1
    train_size: 0.98
    random_state: 30
  tune_split:
    n_splits: 5
    train_size: 0.96
    random_state: 20
  f1_average: "macro"
  # Canonical lowercase boolean (was `False`); parses to the same value.
  export_pred: false
# Best model path. Note the value is a pickle file under models/, not a
# directory.
# NOTE(review): whether this key belongs at the top level or under `train`
# is not visible from the reviewed copy — confirm against the loader.
model: models/pos_tagger.pkl
# Hyper-parameter grid, keyed by classifier name.
# The start/stop(/step) triples must be nested under their parameter name:
# left flat, `start` and `stop` are duplicate keys and the last value
# silently wins.
# NOTE(review): presumably each start/stop/step mapping is expanded into a
# range of candidate values by the tuning code; whether `stop` is inclusive
# is not visible here — TODO confirm.
param_grid:
  MultinomialNaiveBayes:
    alpha:
      start: 0.1
      stop: 1
      step: 0.1
    ngram_range:
      depth: 6
  StupidBayes:
    ngram_depth:
      start: 4
      stop: 9