Minata committed on
Commit
47c303e
1 Parent(s): 0492367

Training in progress, step 500

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "uclanlp/plbart-large",
3
+ "activation_dropout": 0.0,
4
+ "activation_function": "gelu",
5
+ "architectures": [
6
+ "PLBartForConditionalGeneration"
7
+ ],
8
+ "attention_dropout": 0.1,
9
+ "bos_token_id": 0,
10
+ "classifier_dropout": 0.0,
11
+ "d_model": 1024,
12
+ "decoder_attention_heads": 16,
13
+ "decoder_ffn_dim": 4096,
14
+ "decoder_layerdrop": 0.0,
15
+ "decoder_layers": 12,
16
+ "dropout": 0.1,
17
+ "encoder_attention_heads": 16,
18
+ "encoder_ffn_dim": 4096,
19
+ "encoder_layerdrop": 0.0,
20
+ "encoder_layers": 12,
21
+ "eos_token_id": 2,
22
+ "forced_eos_token_id": 2,
23
+ "gradient_checkpointing": false,
24
+ "init_std": 0.02,
25
+ "is_encoder_decoder": true,
26
+ "max_position_embeddings": 1024,
27
+ "model_type": "plbart",
28
+ "num_hidden_layers": 12,
29
+ "pad_token_id": 1,
30
+ "scale_embedding": true,
31
+ "torch_dtype": "float32",
32
+ "transformers_version": "4.26.1",
33
+ "use_cache": true,
34
+ "vocab_size": 50005
35
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ce3e949bccd072e4edcd336891736dc34e97311501cde8b47629d38ecd7c73a
3
+ size 1624475405
runs/Feb20_12-36-46_db6f5b0c4128/1676896617.4634156/events.out.tfevents.1676896617.db6f5b0c4128.22230.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d636537f199d679b1e34d77e56c664e3764f89c3b74361ff63593d6c73dcc6d
3
+ size 5972
runs/Feb20_12-36-46_db6f5b0c4128/events.out.tfevents.1676896617.db6f5b0c4128.22230.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:762be842691d6187fa2156bf95463135c0bef8f35aa668aaa7d2b4ed9ffe3feb
3
+ size 4250
runs/Feb20_12-43-09_db6f5b0c4128/1676896995.434722/events.out.tfevents.1676896995.db6f5b0c4128.25241.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52190e24268a345fb1981f2f8a5a13c459c0726ca2fde71c6c4c4c55f5b7ff91
3
+ size 5972
runs/Feb20_12-43-09_db6f5b0c4128/events.out.tfevents.1676896995.db6f5b0c4128.25241.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98fc3e3c06d6ffcdefb15bbbb281bfc16e705662a613280fb5c6e4844cb9f384
3
+ size 4250
runs/Feb20_12-44-33_db6f5b0c4128/1676897079.907183/events.out.tfevents.1676897079.db6f5b0c4128.25732.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4678c83762b7335b655b881fa55f6de2106b80113a40d3694ffa82e864b9045d
3
+ size 5972
runs/Feb20_12-44-33_db6f5b0c4128/events.out.tfevents.1676897079.db6f5b0c4128.25732.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f67f9fcf58c3b55e566de338883ccc03f4439176a2d912611e22904e94c12b0
3
+ size 4250
runs/Feb20_12-46-02_db6f5b0c4128/1676897168.7182176/events.out.tfevents.1676897168.db6f5b0c4128.26288.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29ad77de8f29f767f3740fd29d21964a2871090c4612f51ae8ed21d918687569
3
+ size 5972
runs/Feb20_12-46-02_db6f5b0c4128/events.out.tfevents.1676897168.db6f5b0c4128.26288.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e74bff4c3cebe77fee8bc8f1c7e17c08919b0c1de3e100e43965bae4f3af35de
3
+ size 4250
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f72f5d040a176945623a255484d24066f8c0da89a294359154e226efbe494b80
3
+ size 985833
special_tokens_map.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "__java__",
4
+ "__python__",
5
+ "__en_XX__"
6
+ ],
7
+ "bos_token": "<s>",
8
+ "cls_token": "<s>",
9
+ "eos_token": "</s>",
10
+ "mask_token": {
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "pad_token": "<pad>",
18
+ "sep_token": "</s>",
19
+ "unk_token": "<unk>"
20
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": null,
3
+ "bos_token": "<s>",
4
+ "cls_token": "<s>",
5
+ "eos_token": "</s>",
6
+ "language_codes": "base",
7
+ "mask_token": {
8
+ "__type": "AddedToken",
9
+ "content": "<mask>",
10
+ "lstrip": true,
11
+ "normalized": true,
12
+ "rstrip": false,
13
+ "single_word": false
14
+ },
15
+ "model_max_length": 1000000000000000019884624838656,
16
+ "name_or_path": "uclanlp/plbart-large",
17
+ "pad_token": "<pad>",
18
+ "sep_token": "</s>",
19
+ "sp_model_kwargs": {},
20
+ "special_tokens_map_file": null,
21
+ "src_lang": null,
22
+ "tgt_lang": null,
23
+ "tokenizer_class": "PLBartTokenizer",
24
+ "unk_token": "<unk>"
25
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4686666161c7a14888fbddeaa3fb6628c030dcff444097fd9890ab5c0cfdbf1
3
+ size 3643