tykiww committed on
Commit
7ebc9c5
·
verified ·
1 Parent(s): 38d7f73

Update config/config.json

Browse files
Files changed (1) hide show
  1. config/config.json +14 -10
config/config.json CHANGED
@@ -1,32 +1,36 @@
1
  {
2
  "model": {
 
 
 
 
3
  "peft": {
4
  "r": 64,
5
  "alpha": 16,
6
  "dropout": 0,
7
  "bias": "none",
8
- "seed": 3407,
9
  "rslora": false,
10
  "loftq_config": null
11
  },
12
  "sft": {
13
  "output_dir": "outputs",
14
- "num_train_epochs": 3,
15
- "per_device_train_batch_size": 4,
16
- "gradient_accumulation_steps": 8,
17
- "learning_rate": 5e-5,
18
- "warmup_steps": 10,
19
- "fp16": true,
20
- "bf16": false,
21
  "logging_steps": 1,
22
  "optim": "adamw_8bit",
23
  "weight_decay": 0.01,
24
  "lr_scheduler_type": "linear",
25
- "seed": 42,
26
- "max_seq_length": 128,
27
  "dataset_num_proc": 2,
28
  "packing": false
29
  },
30
  "choices": ["gpt2", "bert-base-uncased", "llama3-8b"]
31
  }
32
  }
 
 
 
 
1
  {
2
  "model": {
3
+ "general": {
4
+ "max_seq_length": 128,
5
+ "seed": 42
6
+ },
7
  "peft": {
8
  "r": 64,
9
  "alpha": 16,
10
  "dropout": 0,
11
  "bias": "none",
 
12
  "rslora": false,
13
  "loftq_config": null
14
  },
15
  "sft": {
16
  "output_dir": "outputs",
17
+ "num_train_epochs": null,
18
+ "dataset_text_field": "text",
19
+ "max_steps": 60,
20
+ "per_device_train_batch_size": 2,
21
+ "gradient_accumulation_steps": 4,
22
+ "learning_rate": 2e-4,
23
+ "warmup_steps": 5,
24
  "logging_steps": 1,
25
  "optim": "adamw_8bit",
26
  "weight_decay": 0.01,
27
  "lr_scheduler_type": "linear",
 
 
28
  "dataset_num_proc": 2,
29
  "packing": false
30
  },
31
  "choices": ["gpt2", "bert-base-uncased", "llama3-8b"]
32
  }
33
  }
34
+
35
+
36
+