Update README.md
Browse files
README.md
CHANGED
@@ -50,6 +50,7 @@ The following hyperparameters were used during training:
|
|
50 |
<li>num_epochs:20</li>
|
51 |
<li>num_beams:6</li>
|
52 |
<li>learning_rate:5e-5</li>
|
|
|
53 |
<li>activation_function:gelu</li>
|
54 |
<li>add_bias_logits:True</li>
|
55 |
<li>normalize_embedding:True</li>
|
|
|
50 |
<li>num_epochs:20</li>
|
51 |
<li>num_beams:6</li>
|
52 |
<li>learning_rate:5e-5</li>
|
53 |
+
<li>optimizer:AdamW with betas=(0.9,0.999) and epsilon=1e-08</li>
|
54 |
<li>activation_function:gelu</li>
|
55 |
<li>add_bias_logits:True</li>
|
56 |
<li>normalize_embedding:True</li>
|