Model save

Files changed (5) hide show

README.md CHANGED Viewed

@@ -5,7 +5,7 @@ tags:
 - trl
 - sft
 - generated_from_trainer
-base_model: tiiuae/falcon-7b
 model-index:
 - name: falcon7binstruct
   results: []
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
 # falcon7binstruct
-This model is a fine-tuned version of [tiiuae/falcon-7b](https://huggingface.co/tiiuae/falcon-7b) on the None dataset.
 ## Model description
@@ -47,10 +47,6 @@ The following hyperparameters were used during training:
 - training_steps: 10
 - mixed_precision_training: Native AMP
-### Training results
 ### Framework versions
 - PEFT 0.7.2.dev0

 - trl
 - sft
 - generated_from_trainer
+base_model: vilsonrodrigues/falcon-7b-instruct-sharded
 model-index:
 - name: falcon7binstruct
   results: []
 # falcon7binstruct
+This model is a fine-tuned version of [vilsonrodrigues/falcon-7b-instruct-sharded](https://huggingface.co/vilsonrodrigues/falcon-7b-instruct-sharded) on the None dataset.
 ## Model description
 - training_steps: 10
 - mixed_precision_training: Native AMP
 ### Framework versions
 - PEFT 0.7.2.dev0

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "tiiuae/falcon-7b",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -19,10 +19,10 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "query_key_value",
     "dense",
     "dense_4h_to_h",
-    "dense_h_to_4h"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "vilsonrodrigues/falcon-7b-instruct-sharded",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "dense_h_to_4h",
     "dense",
     "dense_4h_to_h",
+    "query_key_value"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7272882dad9a0408037e428b832f99edbe61b87240233d82be34ef923c336f02
 size 130583912

 version https://git-lfs.github.com/spec/v1
+oid sha256:5967403586bbf8b5c66aabb2475c8cec61035cf4e1cb75cc2c4cb9c32ad60fcb
 size 130583912

tokenizer.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 256,
     "strategy": "LongestFirst",
     "stride": 0
   },

   "version": "1.0",
   "truncation": {
     "direction": "Right",
+    "max_length": 1024,
     "strategy": "LongestFirst",
     "stride": 0
   },

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e7a6a86cd20f63a320b3c042615d338c8a09ffce381cc39ad2a3d47778a8f6da
 size 4792

 version https://git-lfs.github.com/spec/v1
+oid sha256:d061ff7501cef667fce3218cf66f5de86959968a038ae3ec253026a3e5ee8545
 size 4792