Update README.md
#52
by
aman4vr
- opened
README.md
CHANGED
@@ -153,7 +153,7 @@ llama-30b-sft-6:
|
|
153 |
deepspeed_config: configs/zero3_config_sft.json
|
154 |
weight_decay: 0.0
|
155 |
residual_dropout: 0.0
|
156 |
-
max_length:
|
157 |
use_flash_attention: true
|
158 |
warmup_steps: 20
|
159 |
gradient_checkpointing: true
|
|
|
153 |
deepspeed_config: configs/zero3_config_sft.json
|
154 |
weight_decay: 0.0
|
155 |
residual_dropout: 0.0
|
156 |
+
max_length: 4096
|
157 |
use_flash_attention: true
|
158 |
warmup_steps: 20
|
159 |
gradient_checkpointing: true
|