End of training

Files changed (6)

README.md CHANGED Viewed

@@ -34,8 +34,8 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 0.0002
-- train_batch_size: 4
-- eval_batch_size: 8
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
@@ -49,6 +49,6 @@ The following hyperparameters were used during training:
 - PEFT 0.8.2
 - Transformers 4.37.2
-- Pytorch 2.2.1+cu121
-- Datasets 2.19.0
 - Tokenizers 0.15.2

 The following hyperparameters were used during training:
 - learning_rate: 0.0002
+- train_batch_size: 16
+- eval_batch_size: 32
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - PEFT 0.8.2
 - Transformers 4.37.2
+- Pytorch 2.3.0+cu121
+- Datasets 2.19.1
 - Tokenizers 0.15.2

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "microsoft/Phi-3-mini-4k-instruct",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -19,8 +19,8 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "o_proj",
-    "gate_up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": null,
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "gate_up_proj",
+    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea5f88cbe06f500dc62b8cda9b34f58c2423fc5a3e50f70674396787ce919c73
-size 52446056

 version https://git-lfs.github.com/spec/v1
+oid sha256:cef7d3db8482fa1656c71ce896de4d706f3876e6907dcbe7f0a285d9f6209d2b
+size 26233776

runs/May09_13-11-44_cbnu-DGX-Station/events.out.tfevents.1715227914.cbnu-DGX-Station.2152000.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b75f9e03d905d443b0540d9b8bf6cc5a81aed7fc6f535935dbce7ba31527f63a
+size 7024

runs/May09_14-02-26_cbnu-DGX-Station/events.out.tfevents.1715230953.cbnu-DGX-Station.2158130.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:303a0483f10d388049a5702598b02dba3b1d3181913bde2208189f7cdb2adc87
+size 7024

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cf12d913283fa21c6dd5168c08a67c7288a6bf15b30d547f23eee84cb474a5e3
 size 4728

 version https://git-lfs.github.com/spec/v1
+oid sha256:d7098eb921aee8fcd4a260237cdf3708ecc0178eeccf10da63a41b374abeb24d
 size 4728