t5-tiny-nl6-finnish / tiny_nl6_pretrain.gin
aapot
Add 20k train step and HF flax model
0998a82
raw
history blame contribute delete
578 Bytes
# Register necessary SeqIO Tasks/Mixtures.
from __gin__ import dynamic_registration
from t5x import utils
import tasks
import __main__ as train_script
include 'tiny_nl6.gin'
include 't5x/configs/runs/pretrain.gin'
# ------------------- Training specification overrides --------------------------
# Gin block syntax: bindings must be indented beneath the `configurable:` header
# to be applied to that configurable.

# Run evaluation every 10,000 training steps.
train_script.train:
  eval_period = 10000

# Save a checkpoint every 10,000 steps; `keep = 10` limits how many are retained.
utils.SaveCheckpointConfig:
  period = 10000
  keep = 10
# --- Task and data macros ---
# Name of the SeqIO task/mixture to train on (presumably registered by the
# `tasks` module imported by this config -- confirm against tasks.py).
MIXTURE_OR_TASK_NAME = "pretrain_finnish"
# Sequence-length budget per feature: 512 for inputs and 512 for targets.
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
USE_CACHED_TASKS = False

# --- Training-run macros ---
BATCH_SIZE = 512
TRAIN_STEPS = 500000
DROPOUT_RATE = 0.0