flan-t5-base-squad-qag / trainer_config.json
asahi417's picture
model update
27d59de
raw
history blame contribute delete
362 Bytes
{"dataset_path": "lmqg/qag_squad", "dataset_name": "default", "input_types": ["paragraph"], "output_types": ["questions_answers"], "prefix_types": ["qag"], "model": "google/flan-t5-base", "max_length": 512, "max_length_output": 256, "epoch": 14, "batch": 8, "lr": 0.0001, "fp16": false, "random_seed": 1, "gradient_accumulation_steps": 8, "label_smoothing": 0.0}