Sanatbek committed on
Commit
443fde0
1 Parent(s): bc54271

Upload config.yaml

Browse files
Files changed (1) hide show
  1. config.yaml +119 -0
config.yaml ADDED
@@ -0,0 +1,119 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ name: "uzbek_kazakh_deen_sp"
3
+ joeynmt_version: "2.0.0"
4
+
5
+ data:
6
+ train: "/content/drive/MyDrive/uzbek_kazakh/train"
7
+ dev: "/content/drive/MyDrive/uzbek_kazakh/validation"
8
+ test: "/content/drive/MyDrive/uzbek_kazakh/test"
9
+ dataset_type: "huggingface"
10
+ #dataset_cfg: # not necessary for a manually saved pyarrow dataset
11
+ # name: "uz-kz"
12
+ sample_dev_subset: 200
13
+ src:
14
+ lang: "uz"
15
+ max_length: 100
16
+ lowercase: False
17
+ normalize: False
18
+ level: "bpe"
19
+ voc_limit: 10000
20
+ voc_min_freq: 1
21
+ voc_file: "/content/drive/MyDrive/uzbek_kazakh/vocab.txt"
22
+ tokenizer_type: "sentencepiece"
23
+ tokenizer_cfg:
24
+ model_file: "/content/drive/MyDrive/uzbek_kazakh/sp.model"
25
+
26
+ trg:
27
+ lang: "kz"
28
+ max_length: 100
29
+ lowercase: False
30
+ normalize: False
31
+ level: "bpe"
32
+ voc_limit: 10000
33
+ voc_min_freq: 1
34
+ voc_file: "/content/drive/MyDrive/uzbek_kazakh/vocab.txt"
35
+ tokenizer_type: "sentencepiece"
36
+ tokenizer_cfg:
37
+ model_file: "/content/drive/MyDrive/uzbek_kazakh/sp.model"
38
+
39
+
40
+ testing:
41
+ n_best: 1
42
+ beam_size: 5
43
+ beam_alpha: 1.0
44
+ batch_size: 256
45
+ batch_type: "token"
46
+ max_output_length: 100
47
+ eval_metrics: ["bleu"]
48
+ #return_prob: "hyp"
49
+ #return_attention: False
50
+ sacrebleu_cfg:
51
+ tokenize: "13a"
52
+
53
+ training:
54
+ load_model: "/content/drive/MyDrive/models/uzbek_kazakh/latest.ckpt"
55
+ reset_best_ckpt: False
56
+ reset_scheduler: False
57
+ reset_optimizer: False
58
+ reset_iter_state: False
59
+ random_seed: 42
60
+ optimizer: "adam"
61
+ normalization: "tokens"
62
+ adam_betas: [0.9, 0.999]
63
+ scheduling: "warmupinversesquareroot"
64
+ learning_rate_warmup: 2000
65
+ learning_rate: 0.0002
66
+ learning_rate_min: 0.00000001
67
+ weight_decay: 0.0
68
+ label_smoothing: 0.1
69
+ loss: "crossentropy"
70
+ batch_size: 512
71
+ batch_type: "token"
72
+ batch_multiplier: 4
73
+ early_stopping_metric: "bleu"
74
+ epochs: 10
75
+ updates: 20000
76
+ validation_freq: 1000
77
+ logging_freq: 100
78
+ model_dir: "/content/drive/MyDrive/models/uzbek_kazakh_resume"
79
+ overwrite: True
80
+ shuffle: True
81
+ use_cuda: True
82
+ print_valid_sents: [0, 1, 2, 3]
83
+ keep_best_ckpts: 3
84
+
85
+ model:
86
+ initializer: "xavier"
87
+ bias_initializer: "zeros"
88
+ init_gain: 1.0
89
+ embed_initializer: "xavier"
90
+ embed_init_gain: 1.0
91
+ tied_embeddings: True
92
+ tied_softmax: True
93
+ encoder:
94
+ type: "transformer"
95
+ num_layers: 6
96
+ num_heads: 4
97
+ embeddings:
98
+ embedding_dim: 256
99
+ scale: True
100
+ dropout: 0.0
101
+ # typically ff_size = 4 x hidden_size
102
+ hidden_size: 256
103
+ ff_size: 1024
104
+ dropout: 0.1
105
+ layer_norm: "pre"
106
+ decoder:
107
+ type: "transformer"
108
+ num_layers: 6
109
+ num_heads: 8
110
+ embeddings:
111
+ embedding_dim: 256
112
+ scale: True
113
+ dropout: 0.0
114
+ # typically ff_size = 4 x hidden_size
115
+ hidden_size: 256
116
+ ff_size: 1024
117
+ dropout: 0.1
118
+ layer_norm: "pre"
119
+