aapot commited on
Commit
b9000ce
1 Parent(s): e385993

Add 400k train step and HF flax model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoint_400000/checkpoint +3 -0
  2. checkpoint_400000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
  3. checkpoint_400000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
  4. checkpoint_400000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  5. checkpoint_400000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  6. checkpoint_400000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  7. checkpoint_400000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  8. checkpoint_400000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  9. checkpoint_400000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
  10. checkpoint_400000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  11. checkpoint_400000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  12. checkpoint_400000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  13. checkpoint_400000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
  14. checkpoint_400000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  15. checkpoint_400000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
  16. checkpoint_400000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  17. checkpoint_400000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  18. checkpoint_400000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  19. checkpoint_400000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
  20. checkpoint_400000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  21. checkpoint_400000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
  22. checkpoint_400000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  23. checkpoint_400000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  24. checkpoint_400000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  25. checkpoint_400000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
  26. checkpoint_400000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  27. checkpoint_400000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
  28. checkpoint_400000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  29. checkpoint_400000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  30. checkpoint_400000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  31. checkpoint_400000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
  32. checkpoint_400000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  33. checkpoint_400000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
  34. checkpoint_400000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  35. checkpoint_400000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  36. checkpoint_400000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  37. checkpoint_400000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
  38. checkpoint_400000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  39. checkpoint_400000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
  40. checkpoint_400000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  41. checkpoint_400000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  42. checkpoint_400000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  43. checkpoint_400000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/0 +3 -0
  44. checkpoint_400000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  45. checkpoint_400000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/0 +3 -0
  46. checkpoint_400000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  47. checkpoint_400000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  48. checkpoint_400000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  49. checkpoint_400000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/0 +3 -0
  50. checkpoint_400000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_400000/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b44bbcb1af196553bece74a31d5d8fe614a2c25d3513fe29c424173a58deba36
3
+ size 1037969
checkpoint_400000/state.param_states.decoder.decoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.decoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9975b4b4d508150cbb57346c8b6aa7b4b0b9bd672eda7ec4571c6d09fedbfcf
3
+ size 1387
checkpoint_400000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d449427008e826b8be568180bcd4d2bfcdafbfdd1c8eec01c86961f7897c3826
3
+ size 1420
checkpoint_400000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c4199855111d18ecf3548dd6b4c403305d96c676db7b60e4292e5f5fd8d1f0b
3
+ size 1374
checkpoint_400000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a921a899d26c8273c1140a465ab196628a8cf96a0514c3836808c1b678ecb21
3
+ size 1427
checkpoint_400000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b995c45b0f556ed7dba66b389ed6aa273db655b7a4ed4a20ec99e40a68f1541
3
+ size 1437
checkpoint_400000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84a87854bb35ff1f4c7306e7c71af00557b3059021f7bdac137cfcbf4fad0916
3
+ size 1410
checkpoint_400000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f2ca29a77d6a95a621c1f6be982ef82dbd25aa67012b1e8840a94331a8cad5a
3
+ size 1439
checkpoint_400000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17820312b4dac3017ae33e0fd7caec45dcf0e46a50dc065cccd7b4c7915eb5a4
3
+ size 1441
checkpoint_400000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cff9b8c784ad3386e8c655dd43aa1288dcd7187bd4c55178c6542ca7e24c71e1
3
+ size 1425
checkpoint_400000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb57646bb3f597d0c4d4bd310f5ebaae44e00e6992cfa2bad1ab2c6b420c5d3b
3
+ size 1432
checkpoint_400000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0fa30298afe54116f3d915776461dbde28a03c021a0879024e0096c95e05130
3
+ size 1424
checkpoint_400000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e4e43e52c40aef2f6fc77f964467bd8d1aa8c0990f234281a0d23783d9c0be1
3
+ size 1390
checkpoint_400000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f93d49ff08c617023d03439151653cec1b8e2ff7c37b6567a3ea8d29536d5d07
3
+ size 1420
checkpoint_400000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b677d985f030b824ad2eb1d9336327b71c87bb11f7db49cc676f80035311bffa
3
+ size 1401
checkpoint_400000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:894881346c84d230e983b05872f01c3e8df85c23ef68c6a2a6199f2043b52bcd
3
+ size 1384
checkpoint_400000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79c03a1ad6b2e4e61c22aec09aab0c3f4a4485d43036b953ddc6738c6cf30e09
3
+ size 1402
checkpoint_400000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6621a5e8be9a8a61340bbe5d3d4fd2fc7baa30021e7c2df56d000184906334ba
3
+ size 1393
checkpoint_400000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:127cb389fc5cac2d939abd104b8b0740dce045cd28caf5683ff1a278a95835cc
3
+ size 1376
checkpoint_400000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b7a8fc557d00cfdbe02edc515e47c025e1679c3a4a898113cd8edfbc7e00dd9
3
+ size 1393
checkpoint_400000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f8a531e16c04e8cbe39c142de88d31cad0d7c8f065cd94f234dd002a2959e5f
3
+ size 1404
checkpoint_400000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e87689731ef98348d57acea9f635ee80ea633f5e36d4722ee82fa0674a998c92
3
+ size 1379
checkpoint_400000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92de7c2f747b9a27f10c83a3fd5e220c7a103d328926d3c8ea68b9a27256f0de
3
+ size 1387
checkpoint_400000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f07c851e5ce030e639f8f5e8523a72ed593f785c47cf6a84ed00c94771e6bf5
3
+ size 1440
checkpoint_400000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168
checkpoint_400000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66aa50a432ae36efbc9521789d9f000720b88b9b07fe98c25a05833d327f39bb
3
+ size 1419
checkpoint_400000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
3
+ size 168