jwongTensora
/

00000000-0000-0000-0000-000000000000

Generated from Trainer

Model card Files Files and versions Community

jwongTensora committed 1 day ago

Commit

02a3888

·

verified ·

1 Parent(s): c088179

End of training

Files changed (2) hide show

README.md +2 -2
adapter_model.bin +1 -1

README.md CHANGED Viewed

@@ -39,7 +39,7 @@ early_stopping_patience: null
 eval_max_new_tokens: 128
 eval_table_size: null
 evals_per_epoch: 4
-flash_attention: false
 fp16: null
 fsdp: null
 fsdp_config: null
@@ -82,7 +82,7 @@ train_on_inputs: false
 trust_remote_code: true
 val_set_size: 0.05
 wandb_entity: null
-wandb_mode: online
 wandb_name: 00000000-0000-0000-0000-000000000000
 wandb_project: Gradients-On-Demand
 wandb_run: your_name

 eval_max_new_tokens: 128
 eval_table_size: null
 evals_per_epoch: 4
+flash_attention: true
 fp16: null
 fsdp: null
 fsdp_config: null
 trust_remote_code: true
 val_set_size: 0.05
 wandb_entity: null
+wandb_mode: disabled
 wandb_name: 00000000-0000-0000-0000-000000000000
 wandb_project: Gradients-On-Demand
 wandb_run: your_name

adapter_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:43ced410eba3c47f620189ae448fca0d1c45f73c6619c207823c285ec243f99c
 size 21378

 version https://git-lfs.github.com/spec/v1
+oid sha256:5bad72ac69a8ea0e3f6d1dd6e9d0627b722cd79446e99703c751c2aaad24d35c
 size 21378