aapot
commited on
Commit
•
53bb57b
1
Parent(s):
31c84b0
Add 180k train step and HF flax model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_180000/checkpoint +3 -0
- checkpoint_180000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray +3 -0
- checkpoint_180000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 +3 -0
- checkpoint_180000/state.param_states.encoder.encoder_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.encoder.encoder_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_180000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_180000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
checkpoint_180000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ecd8016072cd1aa0f08eeb8f455fcb80d17a0ec905477a1595586b2abd6b867
|
3 |
+
size 640339
|
checkpoint_180000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18770517cc92921856ce4aa54a2fe5c883270ab4bf7f16af51630b318536e748
|
3 |
+
size 956
|
checkpoint_180000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:698fa6164891309c27ce6f8b83fd6accc7ddac2d35ea8b5a04fac47611dcc5bf
|
3 |
+
size 983
|
checkpoint_180000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df9ea7b731a9d7b3c149692c1093d689be655ef21e35f617a5d487be27759305
|
3 |
+
size 974
|
checkpoint_180000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93ccec5a2c978b4fa8716182a92d50abda92b60791a80f0000cf4f2f2a4391e9
|
3 |
+
size 985
|
checkpoint_180000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4df880d12e7c787d17ce06cd7e611c50d3f6337ffd445f2b69f4688dd3e833d
|
3 |
+
size 988
|
checkpoint_180000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e964e629f4da6af8c4ae4327e37471792039c3a00e96efcc88606efe2a52ee22
|
3 |
+
size 963
|
checkpoint_180000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95c4c66536cee0850ad4b2feb5d17e922244979763dac6a698038266790a4bb6
|
3 |
+
size 1007
|
checkpoint_180000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3adc956b23027460c1a3d28ce80410c023eeacb0b26fda8d00ae00b72fe20f46
|
3 |
+
size 973
|
checkpoint_180000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a25990dbe74a05a5f4fb7baf9bf41b190aa2e5e8130e0ad4e69e7cc0ebe7439b
|
3 |
+
size 985
|
checkpoint_180000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0a47b7f7ffbca11f0aa6041288de18aae22accf94de341b8a72b05516080d33
|
3 |
+
size 975
|
checkpoint_180000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:467a8ca0d6370bc8ac2fb4c814948cdfa18917c9db076309a7dfa7844bd95004
|
3 |
+
size 979
|
checkpoint_180000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c5af9cb6acf484a1b953a6ceda07f1bb76af3270f87c47174bf49d861f9c152
|
3 |
+
size 971
|
checkpoint_180000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9447bfbd1da932c8061ca1d2823f4509a257aa71de539161db3020320d594ac7
|
3 |
+
size 983
|
checkpoint_180000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed22cadfbf1b70e655ff5aad702b0fa5271e9cded8d1e7e54f50d25dfbff91c5
|
3 |
+
size 969
|
checkpoint_180000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67b23a4e4c20453dd432e6f237c2310ed6af632c299486092069f03ae6755877
|
3 |
+
size 958
|
checkpoint_180000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20988c0fc5a8f5550899fe1fd4280b4074796e7c45d4b6140084771f9296b43a
|
3 |
+
size 965
|
checkpoint_180000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf49febc47f30dcdca8721bf81095d935f485b8818e829bb8038df9f2773e3fe
|
3 |
+
size 955
|
checkpoint_180000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90200103a28709ef86c3652acdc75d0321fcd8b6bc3df4a393bf4877a9fa945d
|
3 |
+
size 966
|
checkpoint_180000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7654b1d5e90ebe8bb683d5c8944d7a62c6a1e533eb572833410234df4b9936f
|
3 |
+
size 980
|
checkpoint_180000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29b0b4f4727db7bbeacbac66511f4e0ea2d73d7e962302934561781052f7e5c3
|
3 |
+
size 170
|
checkpoint_180000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7ab0997aab2185373488ebcaabed06d1a79e74cb6840bd5b282a736404d8449
|
3 |
+
size 535
|
checkpoint_180000/state.param_states.encoder.encoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.encoder.encoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8536e78c5d4ca6d3fff28b355dc52e25cba01708014e069f6093ef8d0530ea85
|
3 |
+
size 984
|
checkpoint_180000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31ad646d8e056f599503187685a3eb4824fc9993b11c50cbafc3849f7f902d4e
|
3 |
+
size 953
|
checkpoint_180000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:864fcdee95209a250c23642f01774e55733787796c968853c66dda00ee0df01f
|
3 |
+
size 954
|
checkpoint_180000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_180000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d3b5f8cafe37edffa4ee408a7409d5b15a50468f2a03106e268bb67393d1071
|
3 |
+
size 971
|
checkpoint_180000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|