Minbyul committed on
Commit
c55047f
1 Parent(s): c96f885

Model save

Browse files
README.md CHANGED
@@ -1,15 +1,12 @@
1
  ---
2
  base_model: dmis-lab/selfbiorag_7b
3
  tags:
4
- - alignment-handbook
5
- - trl
6
- - sft
7
- - generated_from_trainer
8
  - trl
9
  - sft
 
10
  - generated_from_trainer
11
  datasets:
12
- - HuggingFaceH4/deita-10k-v0-sft
13
  model-index:
14
  - name: selfbiorag-7b-1e-6-wo-medication_qa-iter-sft-step1_lr
15
  results: []
@@ -20,9 +17,9 @@ should probably proofread and complete it, then remove this comment. -->
20
 
21
  # selfbiorag-7b-1e-6-wo-medication_qa-iter-sft-step1_lr
22
 
23
- This model is a fine-tuned version of [dmis-lab/selfbiorag_7b](https://huggingface.co/dmis-lab/selfbiorag_7b) on the HuggingFaceH4/deita-10k-v0-sft dataset.
24
  It achieves the following results on the evaluation set:
25
- - Loss: 1.4498
26
 
27
  ## Model description
28
 
@@ -59,9 +56,9 @@ The following hyperparameters were used during training:
59
 
60
  | Training Loss | Epoch | Step | Validation Loss |
61
  |:-------------:|:-----:|:----:|:---------------:|
62
- | 1.4296 | 1.0 | 5 | 1.4870 |
63
- | 1.3958 | 2.0 | 10 | 1.4528 |
64
- | 1.3728 | 3.0 | 15 | 1.4498 |
65
 
66
 
67
  ### Framework versions
 
1
  ---
2
  base_model: dmis-lab/selfbiorag_7b
3
  tags:
 
 
 
 
4
  - trl
5
  - sft
6
+ - alignment-handbook
7
  - generated_from_trainer
8
  datasets:
9
+ - generator
10
  model-index:
11
  - name: selfbiorag-7b-1e-6-wo-medication_qa-iter-sft-step1_lr
12
  results: []
 
17
 
18
  # selfbiorag-7b-1e-6-wo-medication_qa-iter-sft-step1_lr
19
 
20
+ This model is a fine-tuned version of [dmis-lab/selfbiorag_7b](https://huggingface.co/dmis-lab/selfbiorag_7b) on the generator dataset.
21
  It achieves the following results on the evaluation set:
22
+ - Loss: 1.4499
23
 
24
  ## Model description
25
 
 
56
 
57
  | Training Loss | Epoch | Step | Validation Loss |
58
  |:-------------:|:-----:|:----:|:---------------:|
59
+ | 1.4295 | 1.0 | 5 | 1.4872 |
60
+ | 1.3958 | 2.0 | 10 | 1.4525 |
61
+ | 1.3727 | 3.0 | 15 | 1.4499 |
62
 
63
 
64
  ### Framework versions
all_results.json CHANGED
@@ -5,8 +5,8 @@
5
  "eval_samples": 666,
6
  "eval_samples_per_second": 10.921,
7
  "eval_steps_per_second": 0.728,
8
- "train_loss": 1.4013684431711833,
9
- "train_runtime": 256.7817,
10
  "train_samples": 4285,
11
  "train_samples_per_second": 3.668,
12
  "train_steps_per_second": 0.058
 
5
  "eval_samples": 666,
6
  "eval_samples_per_second": 10.921,
7
  "eval_steps_per_second": 0.728,
8
+ "train_loss": 1.401317008336385,
9
+ "train_runtime": 256.842,
10
  "train_samples": 4285,
11
  "train_samples_per_second": 3.668,
12
  "train_steps_per_second": 0.058
config.json CHANGED
@@ -23,6 +23,6 @@
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.39.0.dev0",
26
- "use_cache": true,
27
  "vocab_size": 32016
28
  }
 
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.39.0.dev0",
26
+ "use_cache": false,
27
  "vocab_size": 32016
28
  }
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64747326af38ef976fe2a9f79962310c8f5d284bd29ecdd6910972d17098fb87
3
  size 4939116424
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91c6bd0ecec78726699501214eccc730928def5ed304bb3716e2af2e13e6a7df
3
  size 4939116424
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f70e97dc1024a8c64ed319f33ed5cca288458da77b5f3b11fa960e0503873e29
3
  size 4947390880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f60a1b51f98add6b1024d09db57756a0438e273fefb55cead2b2bb63364f281
3
  size 4947390880
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e5ce4f584f045bc1271a3e311d75cb071aa23ea3f5aa2ae6a0610f216d828b2
3
  size 3590619888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81b61b9cd7734acacd39cc7c1451df2119e5d8d532ea93fad8ff187d18121fa9
3
  size 3590619888
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 3.0,
3
- "train_loss": 1.4013684431711833,
4
- "train_runtime": 256.7817,
5
  "train_samples": 4285,
6
  "train_samples_per_second": 3.668,
7
  "train_steps_per_second": 0.058
 
1
  {
2
  "epoch": 3.0,
3
+ "train_loss": 1.401317008336385,
4
+ "train_runtime": 256.842,
5
  "train_samples": 4285,
6
  "train_samples_per_second": 3.668,
7
  "train_steps_per_second": 0.058
trainer_state.json CHANGED
@@ -10,62 +10,62 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.2,
13
- "grad_norm": 7.938698333852073,
14
  "learning_rate": 5e-07,
15
  "loss": 1.4592,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 1.0,
20
- "grad_norm": 7.651680054024693,
21
  "learning_rate": 8.742553740855505e-07,
22
- "loss": 1.4296,
23
  "step": 5
24
  },
25
  {
26
  "epoch": 1.0,
27
- "eval_loss": 1.4870359897613525,
28
- "eval_runtime": 3.9957,
29
- "eval_samples_per_second": 11.262,
30
- "eval_steps_per_second": 0.751,
31
  "step": 5
32
  },
33
  {
34
  "epoch": 2.0,
35
- "grad_norm": 6.421895096428511,
36
  "learning_rate": 3.2269755647873214e-07,
37
  "loss": 1.3958,
38
  "step": 10
39
  },
40
  {
41
  "epoch": 2.0,
42
- "eval_loss": 1.4527603387832642,
43
- "eval_runtime": 4.1269,
44
- "eval_samples_per_second": 10.904,
45
- "eval_steps_per_second": 0.727,
46
  "step": 10
47
  },
48
  {
49
  "epoch": 3.0,
50
- "grad_norm": 6.165632694186387,
51
  "learning_rate": 0.0,
52
- "loss": 1.3728,
53
  "step": 15
54
  },
55
  {
56
  "epoch": 3.0,
57
- "eval_loss": 1.4498004913330078,
58
- "eval_runtime": 4.1113,
59
- "eval_samples_per_second": 10.945,
60
- "eval_steps_per_second": 0.73,
61
  "step": 15
62
  },
63
  {
64
  "epoch": 3.0,
65
  "step": 15,
66
  "total_flos": 3088349921280.0,
67
- "train_loss": 1.4013684431711833,
68
- "train_runtime": 256.7817,
69
  "train_samples_per_second": 3.668,
70
  "train_steps_per_second": 0.058
71
  }
 
10
  "log_history": [
11
  {
12
  "epoch": 0.2,
13
+ "grad_norm": 7.939234477653451,
14
  "learning_rate": 5e-07,
15
  "loss": 1.4592,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 1.0,
20
+ "grad_norm": 7.674129849441835,
21
  "learning_rate": 8.742553740855505e-07,
22
+ "loss": 1.4295,
23
  "step": 5
24
  },
25
  {
26
  "epoch": 1.0,
27
+ "eval_loss": 1.4871999025344849,
28
+ "eval_runtime": 4.0086,
29
+ "eval_samples_per_second": 11.226,
30
+ "eval_steps_per_second": 0.748,
31
  "step": 5
32
  },
33
  {
34
  "epoch": 2.0,
35
+ "grad_norm": 6.446393481808942,
36
  "learning_rate": 3.2269755647873214e-07,
37
  "loss": 1.3958,
38
  "step": 10
39
  },
40
  {
41
  "epoch": 2.0,
42
+ "eval_loss": 1.4525436162948608,
43
+ "eval_runtime": 4.1386,
44
+ "eval_samples_per_second": 10.873,
45
+ "eval_steps_per_second": 0.725,
46
  "step": 10
47
  },
48
  {
49
  "epoch": 3.0,
50
+ "grad_norm": 6.1815285521818035,
51
  "learning_rate": 0.0,
52
+ "loss": 1.3727,
53
  "step": 15
54
  },
55
  {
56
  "epoch": 3.0,
57
+ "eval_loss": 1.4498653411865234,
58
+ "eval_runtime": 4.1282,
59
+ "eval_samples_per_second": 10.901,
60
+ "eval_steps_per_second": 0.727,
61
  "step": 15
62
  },
63
  {
64
  "epoch": 3.0,
65
  "step": 15,
66
  "total_flos": 3088349921280.0,
67
+ "train_loss": 1.401317008336385,
68
+ "train_runtime": 256.842,
69
  "train_samples_per_second": 3.668,
70
  "train_steps_per_second": 0.058
71
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dac4842160e387abe206b6581f5723d808f0d6dcb0d00d95ff7bcbe60bfa7d4c
3
  size 6328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5e6e1b0e12146544d2ddefb72a4555b01fa23a1a28364efbfe462a257c293b7
3
  size 6328