mbart-large-cc25-jaquad-qg / trainer_config.json
asahi417's picture
model update
ea1cf38
raw
history blame
364 Bytes
{"dataset_path": "lmqg/qg_jaquad", "dataset_name": "default", "input_types": ["paragraph_answer"], "output_types": ["question"], "prefix_types": null, "model": "facebook/mbart-large-cc25", "max_length": 512, "max_length_output": 32, "epoch": 12, "batch": 64, "lr": 0.0001, "fp16": false, "random_seed": 1, "gradient_accumulation_steps": 1, "label_smoothing": 0.15}