{
  "output_dir": "../drive/MyDrive/NICE/model/0422_train_encoder",
  "model_name_or_path": "../drive/MyDrive/NICE/model/cap_best/OFA-huge-caption",
  "train_caption_file": "./data/train_caption.jsonl",
  "train_image_file": "../drive/MyDrive/NICE/train_image.tsv",
  "test_caption_file": null,
  "test_image_file": null,
  "freeze_encoder": false,
  "freeze_word_embed": false,
  "num_train_epochs": 30,
  "max_steps": -1,
  "per_device_train_batch_size": 12,
  "per_device_eval_batch_size": 256,
  "learning_rate": 5e-05,
  "max_seq_length": 150,
  "logging_steps": 5000,
  "save_steps": 5000,
  "save_total_limit": 2,
  "lr_scheduler_type": "cosine",
  "warmup_steps": 2000,
  "warmup_ratio": 0,
  "gradient_accumulation_steps": 1,
  "optim": "adamw_torch",
  "seed": 69,
  "fp16": false,
  "no_cuda": false,
  "dataloader_num_workers": 8,
  "save_strategy": "steps",
  "weight_decay": 0,
  "max_grad_norm": 1.0,
  "remove_unused_columns": false
}