aapot
commited on
Commit
•
459f258
1
Parent(s):
ed3412d
Add 500k train step
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_500000/checkpoint +3 -0
- checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_500000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_500000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_500000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e9848752b8f1feee31620100b2a087cb1a01bc1de2e6b1599cdbc39372959fb
|
3 |
+
size 1037969
|
checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1cc21e5b9a43351079a2eb797b820f30270913db3f4fc0b13c929677413077b1
|
3 |
+
size 1413
|
checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:995dd9180d2eb437344d3056c0f245676b0ec2e49061d374069c254b80f81883
|
3 |
+
size 1435
|
checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4be8e8cc00ceb8cac7d2d446b08f07a0c6bded361d08f3ca90eca5df5d56303
|
3 |
+
size 1372
|
checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c680f46e87e4171e1b2d3b72d9c23c654c5836f55a9ea66cb30908b903866054
|
3 |
+
size 1437
|
checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68450710352254809d2c7298c01aa7725d3fa9164a439a431df7d4dd584ebb1d
|
3 |
+
size 1429
|
checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a61965bc3e982d970a2f621016a2ebe5c7966c99e8917dd667024f5305842077
|
3 |
+
size 1388
|
checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5baa5ae9f05d4e102dbe37a094019099a28db52d4922ad7bb836a3adf760aaa
|
3 |
+
size 1437
|
checkpoint_500000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b51abbc66ade27ea072ebbf4188b99977cea30e5ddade32cb1a6938c2c2f417
|
3 |
+
size 1428
|
checkpoint_500000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbc8566f2220ff1a5a606b7b7e89dad79722327e7d68cb0833e870a143bb2196
|
3 |
+
size 1415
|
checkpoint_500000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fed1f2c8f0fc478954233d9350eb3dca60096285ea2fb5d14247c2b6102872fd
|
3 |
+
size 1423
|
checkpoint_500000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c00cf0504609886b6ef98a457cd971da039041d173d66c15e9adf423fcdb26a6
|
3 |
+
size 1396
|
checkpoint_500000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ae8dfc719914852f84fcdba34ccb74068e092a098a9c5bd7cb2b0234330891b
|
3 |
+
size 1397
|
checkpoint_500000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d4e1056cb0ca0642beb4f55a1729218c99d381599599d0026f88279cb679147
|
3 |
+
size 1400
|
checkpoint_500000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9a52bc395916d2e1d491b66efa36827fe032ab8884a433e131db0679a072df6
|
3 |
+
size 1415
|
checkpoint_500000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a46e41c782ab9ba3d3eb1c60d5d30b587631828f5c293384e56ff878775ba88e
|
3 |
+
size 1402
|
checkpoint_500000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34727f38b5c84942de5424023a40479c75273d766204a542c60477d00b86a675
|
3 |
+
size 1416
|
checkpoint_500000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcd20f3327205247c5ea21988a961e85497e0fa37a8f7c7bd9d672eb047efb3d
|
3 |
+
size 1431
|
checkpoint_500000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a1f7eb95fc9780b751d26918dd0dce103e6cd4674f4d76a011bd0130a5a09cd
|
3 |
+
size 1382
|
checkpoint_500000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d932660a6184efb36321e05db330a5f6ef6aacf5780200c9440a3670b8541d1c
|
3 |
+
size 1433
|
checkpoint_500000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75035cb604b3ba2a87853a5547df6f30fb294720246a3a99460f8ac51d26c522
|
3 |
+
size 1392
|
checkpoint_500000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abec15dd99642a3fd0c50f3a01e9d2d2b422c190b011dad649174c1918cbe729
|
3 |
+
size 1376
|
checkpoint_500000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c916d8dd1f1cc62359f617c0bad96465f983661182ad94966efb63c51207137
|
3 |
+
size 1396
|
checkpoint_500000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad40088499ca8b5d57e1a44806e9797ccf875469ad1d3ad3f75824178da95a91
|
3 |
+
size 1410
|
checkpoint_500000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_500000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c06bf20aaf512443d87706a6c68ca34d01288490ea8fe7801e9b8b12694e688a
|
3 |
+
size 1419
|
checkpoint_500000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|