aapot commited on
Commit
5ac1b5f
1 Parent(s): 53bb57b

Add 200k train step and HF flax model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoint_200000/checkpoint +3 -0
  2. checkpoint_200000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
  3. checkpoint_200000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
  4. checkpoint_200000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  5. checkpoint_200000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  6. checkpoint_200000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  7. checkpoint_200000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  8. checkpoint_200000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  9. checkpoint_200000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
  10. checkpoint_200000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  11. checkpoint_200000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  12. checkpoint_200000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  13. checkpoint_200000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
  14. checkpoint_200000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  15. checkpoint_200000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
  16. checkpoint_200000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  17. checkpoint_200000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  18. checkpoint_200000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  19. checkpoint_200000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
  20. checkpoint_200000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  21. checkpoint_200000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
  22. checkpoint_200000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  23. checkpoint_200000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  24. checkpoint_200000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  25. checkpoint_200000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
  26. checkpoint_200000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  27. checkpoint_200000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
  28. checkpoint_200000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  29. checkpoint_200000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  30. checkpoint_200000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  31. checkpoint_200000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
  32. checkpoint_200000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  33. checkpoint_200000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
  34. checkpoint_200000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  35. checkpoint_200000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  36. checkpoint_200000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  37. checkpoint_200000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
  38. checkpoint_200000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  39. checkpoint_200000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
  40. checkpoint_200000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray +3 -0
  41. checkpoint_200000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 +3 -0
  42. checkpoint_200000/state.param_states.encoder.encoder_norm.scale.v/.zarray +3 -0
  43. checkpoint_200000/state.param_states.encoder.encoder_norm.scale.v/0 +3 -0
  44. checkpoint_200000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray +3 -0
  45. checkpoint_200000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 +3 -0
  46. checkpoint_200000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  47. checkpoint_200000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  48. checkpoint_200000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray +3 -0
  49. checkpoint_200000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0 +3 -0
  50. checkpoint_200000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
checkpoint_200000/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:422cf46e2e41ed2f7832e23df18c6dc725165118d35c71f8dd04cf90f4ab7af4
3
+ size 640339
checkpoint_200000/state.param_states.decoder.decoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.decoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c7474734cf2fd588c2bb1b48789ae3e92bffd6d411d8c2241834f350dc38e3f
3
+ size 946
checkpoint_200000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b6dcfdefb1daa7cf99baa29adede43d4eb218881074bddf12643d3bf4dd482c
3
+ size 980
checkpoint_200000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0146125b97e87a4bcd31fa2c168e993037d8af1fe3098ac391230d904ff5afb
3
+ size 976
checkpoint_200000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c97dc8c44f930cdbb5bfced148e10e833e7958f0807cfe124a142fe2c37f89e9
3
+ size 994
checkpoint_200000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e906976320427062d02fb8ed094736fae98bfde339d753abff9c34a661aeea1
3
+ size 988
checkpoint_200000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b1a9dc776010189a046e05acca1ea8e5c235cea81233fd11a9ad9b69c268f14
3
+ size 959
checkpoint_200000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50194e943311bc3dda7b8fcf12cce19c11c9216bc3fb24f8e66e0e4f1e0e30b8
3
+ size 994
checkpoint_200000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08af43b04a914a0837408c362170601f93599aa2e940f357ec05371fa01e6268
3
+ size 970
checkpoint_200000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0e160745fb57aaf4d61edcb60519bef4b1cb22907c4fc7b011f9dd0e04f31f2
3
+ size 979
checkpoint_200000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b69e6cb1ad006691840681f7042838c120b066ec354917ed1b8c919c7211d1a4
3
+ size 978
checkpoint_200000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9a1fef1ef80c2fc3554ecd6a2a6058a8ebee8b83d467a1d70973c4ec8aa6094
3
+ size 978
checkpoint_200000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8be19addb9b5036ed5846dfcdb199cb3080bb1298adb0de3b86a85a0e12dbc8d
3
+ size 977
checkpoint_200000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6624b9203aed3ea0f997f4a8654ba0a4ff7f2cdbb5f71ba59c9ba67ab4c082be
3
+ size 979
checkpoint_200000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:316816edf4421009811e461c63d2e73f4a7176d8013d8ce7630f1f9ac6f6ed11
3
+ size 967
checkpoint_200000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fd37737aa5a85a4c2f980c56f724e224dd34995c518d035958eb660ed8f558a
3
+ size 958
checkpoint_200000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ada2db6c3a3275bbe30c2497fb5283ec7654fdfcd1bd9f6cd04ecf24785cbe07
3
+ size 962
checkpoint_200000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:404f3cd6721a25bff458f9caa76180c68775352faeca06fe46482a8b77c43766
3
+ size 962
checkpoint_200000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8351eaa476861238d688254fdf3d5f193d20aa497086b0e70ab760c3c03bd48f
3
+ size 964
checkpoint_200000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dc89059dd65f07e553fd7759625a0e42afed3710d4b1b4cda418418ca2758dd
3
+ size 983
checkpoint_200000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29b0b4f4727db7bbeacbac66511f4e0ea2d73d7e962302934561781052f7e5c3
3
+ size 170
checkpoint_200000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c71d585b29595a85a0ef2e8d45baa2d27e1fb97a1d77e7c31619b47c1990d93
3
+ size 535
checkpoint_200000/state.param_states.encoder.encoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.encoder.encoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed7298a85d4df4357176fba678bd130280e3cb85eaef9f3995b9be10ddcf8bba
3
+ size 978
checkpoint_200000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5c91673f6afa3be29ad391a7ec2b5447e7f9812a0b943ec70482682e2547914
3
+ size 951
checkpoint_200000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27d860ac763ae263486f6b2a6087e62a2d985daa150485f01597430a996efd17
3
+ size 952
checkpoint_200000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_200000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f0e442b539a0c8b6aa17a9e9f6d0b6aad141290b4f50c7f9cc1510d0b853c52
3
+ size 982
checkpoint_200000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168