aapot commited on
Commit
d6e8c72
1 Parent(s): 5ac1b5f

Add 250k train step and HF flax model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoint_250000/checkpoint +3 -0
  2. checkpoint_250000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
  3. checkpoint_250000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
  4. checkpoint_250000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  5. checkpoint_250000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  6. checkpoint_250000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  7. checkpoint_250000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  8. checkpoint_250000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  9. checkpoint_250000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
  10. checkpoint_250000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  11. checkpoint_250000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  12. checkpoint_250000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  13. checkpoint_250000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
  14. checkpoint_250000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  15. checkpoint_250000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
  16. checkpoint_250000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  17. checkpoint_250000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  18. checkpoint_250000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  19. checkpoint_250000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
  20. checkpoint_250000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  21. checkpoint_250000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
  22. checkpoint_250000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  23. checkpoint_250000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  24. checkpoint_250000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  25. checkpoint_250000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
  26. checkpoint_250000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  27. checkpoint_250000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
  28. checkpoint_250000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  29. checkpoint_250000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  30. checkpoint_250000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  31. checkpoint_250000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
  32. checkpoint_250000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  33. checkpoint_250000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
  34. checkpoint_250000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  35. checkpoint_250000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  36. checkpoint_250000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  37. checkpoint_250000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
  38. checkpoint_250000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  39. checkpoint_250000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
  40. checkpoint_250000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray +3 -0
  41. checkpoint_250000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 +3 -0
  42. checkpoint_250000/state.param_states.encoder.encoder_norm.scale.v/.zarray +3 -0
  43. checkpoint_250000/state.param_states.encoder.encoder_norm.scale.v/0 +3 -0
  44. checkpoint_250000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray +3 -0
  45. checkpoint_250000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 +3 -0
  46. checkpoint_250000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  47. checkpoint_250000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  48. checkpoint_250000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray +3 -0
  49. checkpoint_250000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0 +3 -0
  50. checkpoint_250000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
checkpoint_250000/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aac68fb7c056763958c32423211dde97758e3ae5411a219936ebecd465c8d9f4
3
+ size 640339
checkpoint_250000/state.param_states.decoder.decoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.decoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e1f8fd9271cf6e914d8d9755f26cc9f5dd2b55a3dddb6bdc4885bf05b9e4b38
3
+ size 955
checkpoint_250000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2077c9cb1a292c6afc66ee748c70fd6a1dd582b9234e3177c9a567ed624f0f7a
3
+ size 964
checkpoint_250000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb692543406f21c030407d2a5c964ea5988cbe59788e78e126c1312e3739a45b
3
+ size 962
checkpoint_250000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ead86bdf32daf0a196a24a3629bd3c8df1e7611ee7810c63410821da5616940
3
+ size 987
checkpoint_250000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cec2f91854d8956475516b3c10add4308b916da3124379c19233794653244d22
3
+ size 986
checkpoint_250000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1166d6d35c5d3744e7ea635ec1a9c5534cadd552d7da7dfc59aabd7f168de26d
3
+ size 951
checkpoint_250000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8119ce8ed84132ffad5797ff1f657fc11c9691e00f4e774fa4ab5c4aa23dfce
3
+ size 1005
checkpoint_250000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:754c44439af7a74874ca932d2195bedbf23f31f7c215d4f4211d4f87fa704ec8
3
+ size 979
checkpoint_250000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57738d4a6c6129fbb1448e3c361a0f706b16c7ca45b7c231cfbe67f0e8df05f7
3
+ size 963
checkpoint_250000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6605ce15e7183d10e9864e0e4fa83d2f95a18bc7dfe3f0cd5508672055b11ab2
3
+ size 983
checkpoint_250000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7ea50cb438053f9aa0e14b2ea488c6df70cb2dce4ce1727f4af9f2f089912f8
3
+ size 982
checkpoint_250000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f56acab553ebea2e007ae8844023153e1e80e2eb4300545a943137ddf7945c4
3
+ size 979
checkpoint_250000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff03482c9a530cd687497d177d3fa2cca60c14a3e247d52e9ded3eda07f67992
3
+ size 985
checkpoint_250000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8e9fc779864f93ac6dcef8fa5b4e122c8942931cea9b19d0b3690e053155f57
3
+ size 967
checkpoint_250000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1c7a466fd5ceb37575966fcf5c66c51a3f436510305b8cc2a866e23462b1d4a
3
+ size 967
checkpoint_250000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5e33e60060e53f5e0f5d016eee37a2af12c5d43e92e05146d5448a1bc49c0ea
3
+ size 965
checkpoint_250000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6263298048a9964fb3a56bdbbeb41998c6a8a3e200b02b1d4e25cb20604bb43
3
+ size 964
checkpoint_250000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cdc8a3d3bb9dad73a6c11071db224ef62c5ef61869f885f0df48f27d841f44e
3
+ size 963
checkpoint_250000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36cd2abd5510e0510e12629751c68343bf9ab0b7f5967a617c69ba75e7fa29b5
3
+ size 972
checkpoint_250000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29b0b4f4727db7bbeacbac66511f4e0ea2d73d7e962302934561781052f7e5c3
3
+ size 170
checkpoint_250000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6beeaf426c7941930ed973981b9676ac52b47047ee83ea14345117a252560561
3
+ size 535
checkpoint_250000/state.param_states.encoder.encoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.encoder.encoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:462f29fd5617f00a8974a474c9b9b20142188c19d5814e1c208bf993726fad55
3
+ size 981
checkpoint_250000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a604445670fce12c0435f8664051aa5162eb26cf98122cdc9d5635a04578b6c1
3
+ size 961
checkpoint_250000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43087f88ad5d3679b61b23b894cc1b9f5fdd8f148d47e1125632719de5d316f5
3
+ size 957
checkpoint_250000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_250000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cd36be5d8aabc1fed77ff84ad2224be833ba2a234669043d9e6805a16d7bbda
3
+ size 977
checkpoint_250000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168