bogdancazan
committed on
Commit
•
1b7276f
1
Parent(s):
2810bdc
Create README.md
Browse files
README.md
ADDED
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
training_args = TrainingArguments(
|
2 |
+
output_dir='t5-small-newsela-biendata-with-domain-adaptation',
|
3 |
+
num_train_epochs=20,
|
4 |
+
warmup_steps=250,
|
5 |
+
per_device_train_batch_size=BATCH_SIZE,
|
6 |
+
weight_decay=0.01,
|
7 |
+
learning_rate=2e-4,
|
8 |
+
fp16=True,
|
9 |
+
optim="adafactor",
|
10 |
+
)
|
11 |
+
|
12 |
+
|
13 |
+
Step Training Loss
|
14 |
+
500 35.466600
|
15 |
+
1000 25.795400
|
16 |
+
1500 10.923200
|
17 |
+
2000 4.515500
|
18 |
+
TrainOutput(global_step=2320, training_loss=16.92537920721646, metrics={'train_runtime': 628.0033, 'train_samples_per_second': 472.418, 'train_steps_per_second': 3.694, 'total_flos': 0.0, 'train_loss': 16.92537920721646, 'epoch': 20.0})
|