ad019el committed on
Commit
420eaed
1 Parent(s): 6d61fab

Training in progress, step 300

Browse files
Files changed (3) hide show
  1. config.json +6 -7
  2. pytorch_model.bin +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -1,6 +1,5 @@
1
  {
2
  "_name_or_path": "ad019el/Kabyle_xlsr-finetuned-tamasheq.en",
3
- "gradient_checkpointing": true,
4
  "activation_dropout": 0.05,
5
  "adapter_attn_dim": null,
6
  "adapter_kernel_size": 3,
@@ -10,7 +9,7 @@
10
  "architectures": [
11
  "Wav2Vec2ForCTC"
12
  ],
13
- "attention_dropout": 0.1,
14
  "bos_token_id": 1,
15
  "classifier_proj_size": 256,
16
  "codevector_dim": 768,
@@ -51,16 +50,16 @@
51
  "feat_extract_activation": "gelu",
52
  "feat_extract_dropout": 0.0,
53
  "feat_extract_norm": "layer",
54
- "feat_proj_dropout": 0.0,
55
  "feat_quantizer_dropout": 0.0,
56
  "final_dropout": 0.0,
57
  "hidden_act": "gelu",
58
- "hidden_dropout": 0.1,
59
  "hidden_size": 1024,
60
  "initializer_range": 0.02,
61
  "intermediate_size": 4096,
62
  "layer_norm_eps": 1e-05,
63
- "layerdrop": 0.2,
64
  "mask_feature_length": 10,
65
  "mask_feature_min_masks": 0,
66
  "mask_feature_prob": 0.0,
@@ -78,7 +77,7 @@
78
  "num_hidden_layers": 24,
79
  "num_negatives": 100,
80
  "output_hidden_size": 1024,
81
- "pad_token_id": 29,
82
  "proj_codevector_dim": 768,
83
  "tdnn_dilation": [
84
  1,
@@ -104,6 +103,6 @@
104
  "torch_dtype": "float32",
105
  "transformers_version": "4.33.0",
106
  "use_weighted_layer_sum": false,
107
- "vocab_size": 30,
108
  "xvector_output_dim": 512
109
  }
 
1
  {
2
  "_name_or_path": "ad019el/Kabyle_xlsr-finetuned-tamasheq.en",
 
3
  "activation_dropout": 0.05,
4
  "adapter_attn_dim": null,
5
  "adapter_kernel_size": 3,
 
9
  "architectures": [
10
  "Wav2Vec2ForCTC"
11
  ],
12
+ "attention_dropout": 0.2,
13
  "bos_token_id": 1,
14
  "classifier_proj_size": 256,
15
  "codevector_dim": 768,
 
50
  "feat_extract_activation": "gelu",
51
  "feat_extract_dropout": 0.0,
52
  "feat_extract_norm": "layer",
53
+ "feat_proj_dropout": 0.1,
54
  "feat_quantizer_dropout": 0.0,
55
  "final_dropout": 0.0,
56
  "hidden_act": "gelu",
57
+ "hidden_dropout": 0.2,
58
  "hidden_size": 1024,
59
  "initializer_range": 0.02,
60
  "intermediate_size": 4096,
61
  "layer_norm_eps": 1e-05,
62
+ "layerdrop": 0.4,
63
  "mask_feature_length": 10,
64
  "mask_feature_min_masks": 0,
65
  "mask_feature_prob": 0.0,
 
77
  "num_hidden_layers": 24,
78
  "num_negatives": 100,
79
  "output_hidden_size": 1024,
80
+ "pad_token_id": 31,
81
  "proj_codevector_dim": 768,
82
  "tdnn_dilation": [
83
  1,
 
103
  "torch_dtype": "float32",
104
  "transformers_version": "4.33.0",
105
  "use_weighted_layer_sum": false,
106
+ "vocab_size": 32,
107
  "xvector_output_dim": 512
108
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b126ad797b0635deb678753911532f0d4779b545d8b03f6b8b8a5aa01c82dbf
3
- size 1262024813
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9241009547bda1ca1601c79ba7d1e84b11d2e2db1ef8f245de563fa7029d6a0
3
+ size 1262033069
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a572e40d9f760e26ad5c68b12aca2f753f6ae4394cddfb369c5e0ef220fd51a8
3
  size 4027
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d3a0ab3e996c2bd91c1438deb204abcd6599fa6c2af500d250ae9d18fd61fdb
3
  size 4027