aryaadhi committed on
Commit
00071a9
1 Parent(s): b0915bd

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -11,7 +11,7 @@
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
  "lora_alpha": 16,
14
- "lora_dropout": 0.05,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
@@ -20,9 +20,9 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "v_proj",
24
  "q_proj",
25
- "k_proj"
 
26
  ],
27
  "task_type": "CAUSAL_LM",
28
  "use_dora": false,
 
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
  "lora_alpha": 16,
14
+ "lora_dropout": 0.1,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "q_proj",
24
+ "k_proj",
25
+ "v_proj"
26
  ],
27
  "task_type": "CAUSAL_LM",
28
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5be520c1c19e55201b404a24747172aa211568df1468101f7420a5f27b72674
3
  size 18893616
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:920f90492b983056b7f47519a2ef1375608b021b87b6d8617ae85514d80d0278
3
  size 18893616
runs/Jul20_14-40-55_cmle-training-13669393038079472133/events.out.tfevents.1721486456.cmle-training-13669393038079472133 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a919bf8e67dbfc7eb66f97d81d052dfdc6c9f0a5b5a835c46b71ba6a8e95a739
3
+ size 7783
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f00ac591a99e9872ef76e8517d2c8b3021f58138bc213ca8c8e6d97752637b56
3
  size 4731
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97e742e0588f19998138fea0049b74f0fb38873746807daa6bbbd8d1580750b6
3
  size 4731