MiniLLM-1.1B-WithWudao-SFT / pretrain_args.json
Tongjilibo's picture
Upload 7 files
6ae83e2 verified
raw
history blame contribute delete
No virus
407 Bytes
{
  "include_wudao_corpus": true,
  "lr": 1.5e-4,
  "batch_size": 16,
  "grad_accumulation_steps": 1,
  "pad_token_id": 0,
  "max_length": 896,
  "epochs": 1,
  "weight_decay": 0.1,
  "interval": 2000,
  "torch_dtype": null,
  "data_path": "../data/*.bin",
  "config_path": "../config/MiniLLM-1.1B-WithWudao/bert4torch_config.json",
  "save_dir": "../ckpt/MiniLLM-1.1B-WithWudao"
}