Sandiago21 committed on
Commit
77e5520
1 Parent(s): 45ea4a5

End of training

Browse files
README.md CHANGED
@@ -1,12 +1,11 @@
1
  ---
2
  language:
3
  - multilingual
4
- license: apache-2.0
5
- base_model: mistralai/Mistral-7B-v0.1
6
  tags:
7
  - generated_from_trainer
8
  datasets:
9
- - arc
10
  model-index:
11
  - name: mistral-7b-llm-science-exam
12
  results: []
@@ -17,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  # mistral-7b-llm-science-exam
19
 
20
- This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the ARC dataset.
21
 
22
  ## Model description
23
 
@@ -36,13 +35,13 @@ More information needed
36
  ### Training hyperparameters
37
 
38
  The following hyperparameters were used during training:
39
- - learning_rate: 2e-05
40
- - train_batch_size: 1
41
- - eval_batch_size: 8
42
  - seed: 42
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
- - lr_scheduler_type: linear
45
- - lr_scheduler_warmup_steps: 50
46
  - num_epochs: 1
47
 
48
  ### Framework versions
 
1
  ---
2
  language:
3
  - multilingual
4
+ base_model: /kaggle/input/mistral-7b/Mistral-7B-v0.1
 
5
  tags:
6
  - generated_from_trainer
7
  datasets:
8
+ - STEM
9
  model-index:
10
  - name: mistral-7b-llm-science-exam
11
  results: []
 
16
 
17
  # mistral-7b-llm-science-exam
18
 
19
+ This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the llm-science-exam dataset.
20
 
21
  ## Model description
22
 
 
35
  ### Training hyperparameters
36
 
37
  The following hyperparameters were used during training:
38
+ - learning_rate: 1e-05
39
+ - train_batch_size: 2
40
+ - eval_batch_size: 2
41
  - seed: 42
42
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
43
+ - lr_scheduler_type: cosine
44
+ - lr_scheduler_warmup_steps: 25
45
  - num_epochs: 1
46
 
47
  ### Framework versions
adapter_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "auto_mapping": null,
3
- "base_model_name_or_path": "mistralai/Mistral-7B-v0.1",
4
  "bias": "none",
5
  "fan_in_fan_out": false,
6
  "inference_mode": true,
 
1
  {
2
  "auto_mapping": null,
3
+ "base_model_name_or_path": "/kaggle/input/mistral-7b/Mistral-7B-v0.1",
4
  "bias": "none",
5
  "fan_in_fan_out": false,
6
  "inference_mode": true,
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d6e48c63cb54dc17c542358f7fe252e7e537c2c5e741089b07cdbf2222fc9c75
3
  size 109097933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3ea89ea4b4b01471867e342833f3182664bc5d9667c08cfd651220831cf2991
3
  size 109097933
special_tokens_map.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<unk>",
4
+ "<s>",
5
+ "</s>"
6
+ ],
7
+ "bos_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "pad_token": "</s>",
10
+ "unk_token": "<unk>"
11
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
3
+ size 493443
tokenizer_config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<unk>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<s>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ }
27
+ },
28
+ "additional_special_tokens": [
29
+ "<unk>",
30
+ "<s>",
31
+ "</s>"
32
+ ],
33
+ "bos_token": "<s>",
34
+ "clean_up_tokenization_spaces": false,
35
+ "eos_token": "</s>",
36
+ "legacy": true,
37
+ "model_max_length": 1000000000000000019884624838656,
38
+ "pad_token": null,
39
+ "sp_model_kwargs": {},
40
+ "spaces_between_special_tokens": false,
41
+ "tokenizer_class": "LlamaTokenizer",
42
+ "unk_token": "<unk>",
43
+ "use_default_system_prompt": true
44
+ }
train_with_llm_answers.csv CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aaad09104310eaaa7ee2ee7c10fd465ddad8907d7d54abaaff45ad31161f8f2c
3
  size 4091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85286bab714706443a5a98be9bb777ca67e3f6827f1200c9309f35e64a95e885
3
  size 4091