wikimia_unlearned

Browse files

Files changed (5) hide show

adapter_config.json +52 -52
adapter_model.safetensors +1 -1
config.yaml +1 -1
logs/events.out.tfevents.1714972871.c32766770a73 +3 -0
training_args.bin +1 -1

adapter_config.json CHANGED Viewed

@@ -20,70 +20,70 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "model.layers.8.self_attn.q_proj",
-    "model.layers.5.self_attn.v_proj",
-    "model.layers.15.self_attn.q_proj",
-    "model.layers.17.self_attn.q_proj",
-    "model.layers.16.self_attn.q_proj",
-    "model.layers.22.self_attn.q_proj",
-    "model.layers.12.self_attn.v_proj",
-    "model.layers.31.self_attn.v_proj",
-    "model.layers.24.self_attn.v_proj",
-    "model.layers.0.self_attn.q_proj",
     "model.layers.3.self_attn.v_proj",
-    "model.layers.13.self_attn.q_proj",
-    "model.layers.24.self_attn.q_proj",
-    "model.layers.16.self_attn.v_proj",
-    "model.layers.25.self_attn.q_proj",
-    "model.layers.20.self_attn.q_proj",
-    "model.layers.13.self_attn.v_proj",
-    "model.layers.18.self_attn.q_proj",
-    "model.layers.5.self_attn.q_proj",
-    "model.layers.26.self_attn.q_proj",
-    "model.layers.29.self_attn.v_proj",
-    "model.layers.17.self_attn.v_proj",
-    "model.layers.8.self_attn.v_proj",
-    "model.layers.30.self_attn.q_proj",
     "model.layers.28.self_attn.q_proj",
-    "model.layers.10.self_attn.v_proj",
-    "model.layers.0.self_attn.v_proj",
-    "model.layers.3.self_attn.q_proj",
-    "model.layers.4.self_attn.v_proj",
-    "model.layers.9.self_attn.v_proj",
     "model.layers.19.self_attn.v_proj",
     "model.layers.2.self_attn.v_proj",
-    "model.layers.28.self_attn.v_proj",
-    "model.layers.2.self_attn.q_proj",
     "model.layers.1.self_attn.q_proj",
-    "model.layers.21.self_attn.v_proj",
-    "model.layers.22.self_attn.v_proj",
     "model.layers.11.self_attn.q_proj",
-    "model.layers.15.self_attn.v_proj",
     "model.layers.23.self_attn.q_proj",
-    "model.layers.1.self_attn.v_proj",
-    "model.layers.25.self_attn.v_proj",
-    "model.layers.14.self_attn.v_proj",
-    "model.layers.30.self_attn.v_proj",
-    "model.layers.23.self_attn.v_proj",
-    "model.layers.20.self_attn.v_proj",
-    "model.layers.9.self_attn.q_proj",
-    "model.layers.18.self_attn.v_proj",
     "model.layers.19.self_attn.q_proj",
-    "model.layers.6.self_attn.v_proj",
-    "model.layers.27.self_attn.v_proj",
-    "model.layers.10.self_attn.q_proj",
-    "model.layers.29.self_attn.q_proj",
     "model.layers.7.self_attn.q_proj",
-    "model.layers.6.self_attn.q_proj",
-    "model.layers.26.self_attn.v_proj",
-    "model.layers.27.self_attn.q_proj",
-    "model.layers.4.self_attn.q_proj",
-    "model.layers.7.self_attn.v_proj",
     "model.layers.14.self_attn.q_proj",
-    "model.layers.31.self_attn.q_proj",
-    "model.layers.21.self_attn.q_proj",
     "model.layers.12.self_attn.q_proj",
-    "model.layers.11.self_attn.v_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "model.layers.3.self_attn.q_proj",
     "model.layers.8.self_attn.q_proj",
+    "model.layers.14.self_attn.v_proj",
+    "model.layers.4.self_attn.v_proj",
+    "model.layers.10.self_attn.q_proj",
+    "model.layers.15.self_attn.v_proj",
     "model.layers.3.self_attn.v_proj",
     "model.layers.28.self_attn.q_proj",
+    "model.layers.24.self_attn.v_proj",
+    "model.layers.12.self_attn.v_proj",
+    "model.layers.13.self_attn.v_proj",
+    "model.layers.1.self_attn.v_proj",
+    "model.layers.2.self_attn.q_proj",
+    "model.layers.27.self_attn.q_proj",
     "model.layers.19.self_attn.v_proj",
+    "model.layers.7.self_attn.v_proj",
+    "model.layers.21.self_attn.v_proj",
+    "model.layers.29.self_attn.q_proj",
+    "model.layers.25.self_attn.v_proj",
+    "model.layers.8.self_attn.v_proj",
     "model.layers.2.self_attn.v_proj",
+    "model.layers.6.self_attn.v_proj",
+    "model.layers.16.self_attn.v_proj",
+    "model.layers.17.self_attn.v_proj",
+    "model.layers.4.self_attn.q_proj",
+    "model.layers.20.self_attn.q_proj",
+    "model.layers.18.self_attn.v_proj",
+    "model.layers.11.self_attn.v_proj",
+    "model.layers.20.self_attn.v_proj",
+    "model.layers.31.self_attn.q_proj",
+    "model.layers.27.self_attn.v_proj",
+    "model.layers.0.self_attn.v_proj",
+    "model.layers.6.self_attn.q_proj",
+    "model.layers.22.self_attn.q_proj",
+    "model.layers.25.self_attn.q_proj",
+    "model.layers.24.self_attn.q_proj",
     "model.layers.1.self_attn.q_proj",
+    "model.layers.18.self_attn.q_proj",
+    "model.layers.23.self_attn.v_proj",
+    "model.layers.30.self_attn.q_proj",
     "model.layers.11.self_attn.q_proj",
+    "model.layers.31.self_attn.v_proj",
+    "model.layers.15.self_attn.q_proj",
+    "model.layers.0.self_attn.q_proj",
+    "model.layers.9.self_attn.v_proj",
+    "model.layers.10.self_attn.v_proj",
+    "model.layers.13.self_attn.q_proj",
     "model.layers.23.self_attn.q_proj",
+    "model.layers.5.self_attn.v_proj",
     "model.layers.19.self_attn.q_proj",
+    "model.layers.9.self_attn.q_proj",
     "model.layers.7.self_attn.q_proj",
+    "model.layers.5.self_attn.q_proj",
+    "model.layers.29.self_attn.v_proj",
     "model.layers.14.self_attn.q_proj",
     "model.layers.12.self_attn.q_proj",
+    "model.layers.30.self_attn.v_proj",
+    "model.layers.26.self_attn.q_proj",
+    "model.layers.21.self_attn.q_proj",
+    "model.layers.28.self_attn.v_proj",
+    "model.layers.17.self_attn.q_proj",
+    "model.layers.22.self_attn.v_proj",
+    "model.layers.26.self_attn.v_proj",
+    "model.layers.16.self_attn.q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e73eee9e3bf37d3e84f6ccad7a2ce8a2f65c456e910cfc1315a7a736bdf4bc31
 size 8405600

 version https://git-lfs.github.com/spec/v1
+oid sha256:bb6525ec9c2e18efe8ac86b939009dbf5869f6e5bdd0afcc2829bbc2ab054be0
 size 8405600

config.yaml CHANGED Viewed

@@ -6,7 +6,7 @@ LoRA:
   dropout: 0.05
 lr: 2.0e-05
 split: WikiMIA_QA_256
-data_path: swj0419/WikiMIA
 gradient_accumulation_steps: 4
 num_epochs: 50
 forget_loss: grad_ascent

   dropout: 0.05
 lr: 2.0e-05
 split: WikiMIA_QA_256
+data_path: lluvecwonv/WikiMIA_QA
 gradient_accumulation_steps: 4
 num_epochs: 50
 forget_loss: grad_ascent

logs/events.out.tfevents.1714972871.c32766770a73 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:638b84a9af6971a26176ae60885a97372faa1a118b6781d7e46ba96607ac1b3d
+size 9391

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:764fad990484805e9775a52604e5b1989f7a3603645913351e4ff6d9abbf2493
 size 6648

 version https://git-lfs.github.com/spec/v1
+oid sha256:53e0c50ffd1b0464e411cc017833c7f5fd6ef2b9080f7db441c84d5c4e03ca6f
 size 6648