yanaiela committed on
Commit
8745e78
1 Parent(s): 03af4fc

decomposable_attention elmo snli

Browse files
.gitattributes CHANGED
@@ -29,3 +29,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
29
  *.zip filter=lfs diff=lfs merge=lfs -text
30
  *.zst filter=lfs diff=lfs merge=lfs -text
31
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
29
  *.zip filter=lfs diff=lfs merge=lfs -text
30
  *.zst filter=lfs diff=lfs merge=lfs -text
31
  *tfevents* filter=lfs diff=lfs merge=lfs -text
32
+ *.th filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - allennlp
4
+ ---
5
+
6
+ # TODO: Fill this model card
config.json ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_reader": {
3
+ "type": "snli",
4
+ "token_indexers": {
5
+ "elmo": {
6
+ "type": "elmo_characters"
7
+ }
8
+ },
9
+ "tokenizer": {
10
+ "end_tokens": [
11
+ "@@NULL@@"
12
+ ]
13
+ }
14
+ },
15
+ "train_data_path": "https://s3-us-west-2.amazonaws.com/allennlp/datasets/snli/snli_1.0_train.jsonl",
16
+ "validation_data_path": "https://s3-us-west-2.amazonaws.com/allennlp/datasets/snli/snli_1.0_dev.jsonl",
17
+ "model": {
18
+ "type": "decomposable_attention",
19
+ "text_field_embedder": {
20
+ "token_embedders": {
21
+ "elmo": {
22
+ "type": "elmo_token_embedder",
23
+ "do_layer_norm": false,
24
+ "dropout": 0.2
25
+ }
26
+ }
27
+ },
28
+ "attend_feedforward": {
29
+ "input_dim": 1024,
30
+ "num_layers": 2,
31
+ "hidden_dims": 200,
32
+ "activations": "relu",
33
+ "dropout": 0.2
34
+ },
35
+ "matrix_attention": {
36
+ "type": "dot_product"
37
+ },
38
+ "compare_feedforward": {
39
+ "input_dim": 2048,
40
+ "num_layers": 2,
41
+ "hidden_dims": 200,
42
+ "activations": "relu",
43
+ "dropout": 0.2
44
+ },
45
+ "aggregate_feedforward": {
46
+ "input_dim": 400,
47
+ "num_layers": 2,
48
+ "hidden_dims": [
49
+ 200,
50
+ 3
51
+ ],
52
+ "activations": [
53
+ "relu",
54
+ "linear"
55
+ ],
56
+ "dropout": [
57
+ 0.2,
58
+ 0.0
59
+ ]
60
+ },
61
+ "initializer": {
62
+ "regexes": [
63
+ [
64
+ ".*linear_layers.*weight",
65
+ {
66
+ "type": "xavier_normal"
67
+ }
68
+ ],
69
+ [
70
+ ".*token_embedder_tokens\\._projection.*weight",
71
+ {
72
+ "type": "xavier_normal"
73
+ }
74
+ ]
75
+ ]
76
+ }
77
+ },
78
+ "iterator": {
79
+ "type": "bucket",
80
+ "sorting_keys": [
81
+ [
82
+ "premise",
83
+ "num_tokens"
84
+ ],
85
+ [
86
+ "hypothesis",
87
+ "num_tokens"
88
+ ]
89
+ ],
90
+ "batch_size": 64
91
+ },
92
+ "trainer": {
93
+ "num_epochs": 140,
94
+ "patience": 20,
95
+ "cuda_device": 0,
96
+ "grad_clipping": 5.0,
97
+ "validation_metric": "+accuracy",
98
+ "optimizer": {
99
+ "type": "adagrad"
100
+ }
101
+ }
102
+ }
vocabulary/labels.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ entailment
2
+ contradiction
3
+ neutral
vocabulary/non_padded_namespaces.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ *tags
2
+ *labels
weights.th ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97c2e5073fedecd62e12ef2e65731379978cfcf917bb23cdf0d833053ab34c79
3
+ size 377518648