-
Notifications
You must be signed in to change notification settings - Fork 73
/
twpos.json
71 lines (71 loc) · 1.51 KB
/
twpos.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
{
"task": "tagger",
"basedir": "./twpos",
"conll_output": "twposresults.conll",
"charsz": 16,
"unif": 0.1,
"preproc": {
},
"backend": "tensorflow",
"dataset": "twpos",
"loader": {
"reader_type": "default",
"named_fields": {
"0": "text",
"-1": "y"
}
},
"features": [
{
"name": "word",
"vectorizer": {
"type": "dict1d",
"fields": "text",
"transform": "baseline.lowercase"
},
"embeddings": { "label": "glove-twitter-27B" }
},
{
"name": "word2",
"vectorizer": {
"type": "dict1d",
"fields": "text",
"transform": "baseline.lowercase"
},
"embeddings": { "label": "glove-42B" }
},
{
"name": "word3",
"vectorizer": {
"type": "dict1d",
"fields": "text",
"transform": "baseline.web_cleanup"
},
"embeddings": { "label": "w2v-twitter-30M" }
},
{
"name": "char",
"vectorizer": { "type": "dict2d" },
"embeddings": { "dsz": 30, "wsz": 30, "type": "char-conv" }
}
],
"model": {
"model_type": "default",
"hsz": 200,
"dropout": 0.5,
"rnntype": "blstm",
"layers": 1,
"crf": true
},
"train": {
"batchsz": 20,
"epochs": 40,
"optim": "sgd",
"eta": 0.01,
"mom": 0.9,
"patience": 20,
"early_stopping_metric": "acc",
"span_type": "token",
"clip": 5.0
}
}