Model save

Files changed (7) hide show

README.md CHANGED Viewed

@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.0664
 ## Model description
@@ -51,7 +51,7 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 1.0705        | 0.67  | 34   | 1.0662          |
 ### Framework versions

 This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 1.0663
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 1.0705        | 0.67  | 34   | 1.0663          |
 ### Framework versions

adapter_config.json CHANGED Viewed

@@ -16,10 +16,10 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
-    "o_proj",
     "k_proj",
-    "v_proj"
   ],
   "task_type": "CAUSAL_LM"
 }

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "k_proj",
+    "v_proj",
+    "q_proj",
+    "o_proj"
   ],
   "task_type": "CAUSAL_LM"
 }

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e19f497c1a2314d323c7c294be89240e3bc32be6b039941943df639a83419bc0
 size 109086672

 version https://git-lfs.github.com/spec/v1
+oid sha256:bd98740d75b764bd1cc3fcb15fb21ba7ffbf4fe912ea54260aa2eb01248a70b2
 size 109086672

all_results.json CHANGED Viewed

@@ -1,13 +1,8 @@
 {
     "epoch": 0.67,
-    "eval_loss": 1.0663659572601318,
-    "eval_runtime": 360.1757,
-    "eval_samples": 23110,
-    "eval_samples_per_second": 64.163,
-    "eval_steps_per_second": 1.005,
-    "train_loss": 1.091969286694246,
-    "train_runtime": 10565.8845,
     "train_samples": 207865,
-    "train_samples_per_second": 19.673,
     "train_steps_per_second": 0.005
 }

 {
     "epoch": 0.67,
+    "train_loss": 1.0919693988912247,
+    "train_runtime": 10567.5625,
     "train_samples": 207865,
+    "train_samples_per_second": 19.67,
     "train_steps_per_second": 0.005
 }

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 0.67,
-    "train_loss": 1.091969286694246,
-    "train_runtime": 10565.8845,
     "train_samples": 207865,
-    "train_samples_per_second": 19.673,
     "train_steps_per_second": 0.005
 }

 {
     "epoch": 0.67,
+    "train_loss": 1.0919693988912247,
+    "train_runtime": 10567.5625,
     "train_samples": 207865,
+    "train_samples_per_second": 19.67,
     "train_steps_per_second": 0.005
 }

trainer_state.json CHANGED Viewed

@@ -52,19 +52,19 @@
     },
     {
       "epoch": 0.67,
-      "eval_loss": 1.066247820854187,
-      "eval_runtime": 359.3813,
-      "eval_samples_per_second": 64.305,
-      "eval_steps_per_second": 1.007,
       "step": 34
     },
     {
       "epoch": 0.67,
       "step": 34,
       "total_flos": 5.175876094263296e+16,
-      "train_loss": 1.091969286694246,
-      "train_runtime": 10565.8845,
-      "train_samples_per_second": 19.673,
       "train_steps_per_second": 0.005
     }
   ],

     },
     {
       "epoch": 0.67,
+      "eval_loss": 1.066256046295166,
+      "eval_runtime": 359.6899,
+      "eval_samples_per_second": 64.25,
+      "eval_steps_per_second": 1.006,
       "step": 34
     },
     {
       "epoch": 0.67,
       "step": 34,
       "total_flos": 5.175876094263296e+16,
+      "train_loss": 1.0919693988912247,
+      "train_runtime": 10567.5625,
+      "train_samples_per_second": 19.67,
       "train_steps_per_second": 0.005
     }
   ],

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1c2c56271c5d9179a88d13f67a03da9a745a966c640935167f20ae45263a8e7b
 size 5624

 version https://git-lfs.github.com/spec/v1
+oid sha256:9977e48f8d6567c3265a35aa99f23ba670f89bbf8dea7abf2cdbb0ce4deb9178
 size 5624