Suprit
/

Zhongjing-LLaMA-lora

Model card Files Files and versions Community

Suprit committed on Sep 15, 2023

Commit

eb3bdc6

•

1 Parent(s): ef00c6f

Upload 148 files

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

ppo_8_2/README.md +9 -0
ppo_8_2/adapter_config.json +21 -0
ppo_8_2/adapter_model.bin +3 -0
ppo_8_2/checkpoint-1000/README.md +9 -0
ppo_8_2/checkpoint-1000/adapter_config.json +21 -0
ppo_8_2/checkpoint-1000/adapter_model.bin +3 -0
ppo_8_2/checkpoint-1000/finetuning_args.json +13 -0
ppo_8_2/checkpoint-1000/reward/adapter_config.json +21 -0
ppo_8_2/checkpoint-1000/reward/adapter_model.bin +3 -0
ppo_8_2/checkpoint-1000/training_args.bin +3 -0
ppo_8_2/checkpoint-1000/value_head.bin +3 -0
ppo_8_2/checkpoint-1500/README.md +9 -0
ppo_8_2/checkpoint-1500/adapter_config.json +21 -0
ppo_8_2/checkpoint-1500/adapter_model.bin +3 -0
ppo_8_2/checkpoint-1500/finetuning_args.json +13 -0
ppo_8_2/checkpoint-1500/reward/adapter_config.json +21 -0
ppo_8_2/checkpoint-1500/reward/adapter_model.bin +3 -0
ppo_8_2/checkpoint-1500/training_args.bin +3 -0
ppo_8_2/checkpoint-1500/value_head.bin +3 -0
ppo_8_2/checkpoint-2000/README.md +9 -0
ppo_8_2/checkpoint-2000/adapter_config.json +21 -0
ppo_8_2/checkpoint-2000/adapter_model.bin +3 -0
ppo_8_2/checkpoint-2000/finetuning_args.json +13 -0
ppo_8_2/checkpoint-2000/reward/adapter_config.json +21 -0
ppo_8_2/checkpoint-2000/reward/adapter_model.bin +3 -0
ppo_8_2/checkpoint-2000/training_args.bin +3 -0
ppo_8_2/checkpoint-2000/value_head.bin +3 -0
ppo_8_2/checkpoint-2500/README.md +9 -0
ppo_8_2/checkpoint-2500/adapter_config.json +21 -0
ppo_8_2/checkpoint-2500/adapter_model.bin +3 -0
ppo_8_2/checkpoint-2500/finetuning_args.json +13 -0
ppo_8_2/checkpoint-2500/reward/adapter_config.json +21 -0
ppo_8_2/checkpoint-2500/reward/adapter_model.bin +3 -0
ppo_8_2/checkpoint-2500/training_args.bin +3 -0
ppo_8_2/checkpoint-2500/value_head.bin +3 -0
ppo_8_2/checkpoint-3000/README.md +9 -0
ppo_8_2/checkpoint-3000/adapter_config.json +21 -0
ppo_8_2/checkpoint-3000/adapter_model.bin +3 -0
ppo_8_2/checkpoint-3000/finetuning_args.json +13 -0
ppo_8_2/checkpoint-3000/reward/adapter_config.json +21 -0
ppo_8_2/checkpoint-3000/reward/adapter_model.bin +3 -0
ppo_8_2/checkpoint-3000/training_args.bin +3 -0
ppo_8_2/checkpoint-3000/value_head.bin +3 -0
ppo_8_2/checkpoint-3500/README.md +9 -0
ppo_8_2/checkpoint-3500/adapter_config.json +21 -0
ppo_8_2/checkpoint-3500/adapter_model.bin +3 -0
ppo_8_2/checkpoint-3500/finetuning_args.json +13 -0
ppo_8_2/checkpoint-3500/reward/adapter_config.json +21 -0
ppo_8_2/checkpoint-3500/reward/adapter_model.bin +3 -0
ppo_8_2/checkpoint-3500/training_args.bin +3 -0

ppo_8_2/README.md ADDED Viewed

	@@ -0,0 +1,9 @@

+---
+library_name: peft
+---
+## Training procedure
+### Framework versions
+- PEFT 0.4.0

ppo_8_2/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1c928225a000087e828682fd7dbb78c2e0967c4809838b2625c8172f6d7e5ea9
+size 26269517

ppo_8_2/checkpoint-1000/README.md ADDED Viewed

	@@ -0,0 +1,9 @@

+---
+library_name: peft
+---
+## Training procedure
+### Framework versions
+- PEFT 0.4.0

ppo_8_2/checkpoint-1000/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-1000/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f3b38d60a11127e242f9a807b77448d47842e0f18af9424ae49afe5390c54a56
+size 26269517

ppo_8_2/checkpoint-1000/finetuning_args.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "finetuning_type": "lora",
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "lora_rank": 8,
+  "lora_target": [
+    "q_proj",
+    "v_proj"
+  ],
+  "name_module_trainable": "mlp",
+  "num_hidden_layers": 32,
+  "num_layer_trainable": 3
+}

ppo_8_2/checkpoint-1000/reward/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-1000/reward/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406
+size 443

ppo_8_2/checkpoint-1000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d62ae8853df9b7076a445889032c6f5e0e6027dd349ea6633ce27d8f17c6c3f2
+size 3359

ppo_8_2/checkpoint-1000/value_head.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee6bbe9deb8bed10ff62722d2119134fd8ec11e8e788cf2f711483bd7dc20395
+size 21491

ppo_8_2/checkpoint-1500/README.md ADDED Viewed

	@@ -0,0 +1,9 @@

+---
+library_name: peft
+---
+## Training procedure
+### Framework versions
+- PEFT 0.4.0

ppo_8_2/checkpoint-1500/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-1500/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b098c659862af7bed6745f049aab340876fc9b217030cdc029e3ce977b3ce4d6
+size 26269517

ppo_8_2/checkpoint-1500/finetuning_args.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "finetuning_type": "lora",
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "lora_rank": 8,
+  "lora_target": [
+    "q_proj",
+    "v_proj"
+  ],
+  "name_module_trainable": "mlp",
+  "num_hidden_layers": 32,
+  "num_layer_trainable": 3
+}

ppo_8_2/checkpoint-1500/reward/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-1500/reward/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406
+size 443

ppo_8_2/checkpoint-1500/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d62ae8853df9b7076a445889032c6f5e0e6027dd349ea6633ce27d8f17c6c3f2
+size 3359

ppo_8_2/checkpoint-1500/value_head.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d90d06cd75a2a587a6c8982bf0f843e42ecdd4626396bb9414094056407b0169
+size 21491

ppo_8_2/checkpoint-2000/README.md ADDED Viewed

	@@ -0,0 +1,9 @@

+---
+library_name: peft
+---
+## Training procedure
+### Framework versions
+- PEFT 0.4.0

ppo_8_2/checkpoint-2000/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-2000/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:baf7b9f520e3c9685f93827f6fc58dfb518aa8e08b106d294e8b7636cc904b1a
+size 26269517

ppo_8_2/checkpoint-2000/finetuning_args.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "finetuning_type": "lora",
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "lora_rank": 8,
+  "lora_target": [
+    "q_proj",
+    "v_proj"
+  ],
+  "name_module_trainable": "mlp",
+  "num_hidden_layers": 32,
+  "num_layer_trainable": 3
+}

ppo_8_2/checkpoint-2000/reward/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-2000/reward/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406
+size 443

ppo_8_2/checkpoint-2000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d62ae8853df9b7076a445889032c6f5e0e6027dd349ea6633ce27d8f17c6c3f2
+size 3359

ppo_8_2/checkpoint-2000/value_head.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:407f2258d250161d932305f5295f61b79a4e1abdf8cb52d7ac71febe14ed222d
+size 21491

ppo_8_2/checkpoint-2500/README.md ADDED Viewed

	@@ -0,0 +1,9 @@

+---
+library_name: peft
+---
+## Training procedure
+### Framework versions
+- PEFT 0.4.0

ppo_8_2/checkpoint-2500/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-2500/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:48c4a5692a05c7670f077797e6b91105f40fb45c93f02fdec53c1c8e5722b3e2
+size 26269517

ppo_8_2/checkpoint-2500/finetuning_args.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "finetuning_type": "lora",
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "lora_rank": 8,
+  "lora_target": [
+    "q_proj",
+    "v_proj"
+  ],
+  "name_module_trainable": "mlp",
+  "num_hidden_layers": 32,
+  "num_layer_trainable": 3
+}

ppo_8_2/checkpoint-2500/reward/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-2500/reward/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406
+size 443

ppo_8_2/checkpoint-2500/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d62ae8853df9b7076a445889032c6f5e0e6027dd349ea6633ce27d8f17c6c3f2
+size 3359

ppo_8_2/checkpoint-2500/value_head.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:449a3bc0c64e508f458b2d25423d2b1b1cc4aefd2b77836d0d24438044d47764
+size 21491

ppo_8_2/checkpoint-3000/README.md ADDED Viewed

	@@ -0,0 +1,9 @@

+---
+library_name: peft
+---
+## Training procedure
+### Framework versions
+- PEFT 0.4.0

ppo_8_2/checkpoint-3000/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-3000/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b1cddedf88eb5949bf2f92a31823f7dae138a9b27e552274e7487121e55e1f8b
+size 26269517

ppo_8_2/checkpoint-3000/finetuning_args.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "finetuning_type": "lora",
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "lora_rank": 8,
+  "lora_target": [
+    "q_proj",
+    "v_proj"
+  ],
+  "name_module_trainable": "mlp",
+  "num_hidden_layers": 32,
+  "num_layer_trainable": 3
+}

ppo_8_2/checkpoint-3000/reward/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-3000/reward/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406
+size 443

ppo_8_2/checkpoint-3000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d62ae8853df9b7076a445889032c6f5e0e6027dd349ea6633ce27d8f17c6c3f2
+size 3359

ppo_8_2/checkpoint-3000/value_head.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff7d97a52142494b42184b5e5873fa764f12e053ace8543cca9d5ca06375419d
+size 21491

ppo_8_2/checkpoint-3500/README.md ADDED Viewed

	@@ -0,0 +1,9 @@

+---
+library_name: peft
+---
+## Training procedure
+### Framework versions
+- PEFT 0.4.0

ppo_8_2/checkpoint-3500/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-3500/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e7386a10fda60048403b823666286102ca2a4970b45c718d62879e0ab3b302b5
+size 26269517

ppo_8_2/checkpoint-3500/finetuning_args.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "finetuning_type": "lora",
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "lora_rank": 8,
+  "lora_target": [
+    "q_proj",
+    "v_proj"
+  ],
+  "name_module_trainable": "mlp",
+  "num_hidden_layers": 32,
+  "num_layer_trainable": 3
+}

ppo_8_2/checkpoint-3500/reward/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/hy-tmp/Ziya-LLaMA-13B-v1",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 32.0,
+  "lora_dropout": 0.1,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 8,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

ppo_8_2/checkpoint-3500/reward/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406
+size 443

ppo_8_2/checkpoint-3500/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d62ae8853df9b7076a445889032c6f5e0e6027dd349ea6633ce27d8f17c6c3f2
+size 3359