aapot
commited on
Commit
•
0998a82
1
Parent(s):
5d71dc2
Add 20k train step and HF flax model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- .gitignore +1 -0
- checkpoint_10000/checkpoint +3 -0
- checkpoint_10000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray +3 -0
- checkpoint_10000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 +3 -0
- checkpoint_10000/state.param_states.encoder.encoder_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.encoder.encoder_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_10000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_10000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray +3 -0
.gitattributes
CHANGED
@@ -26,3 +26,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
26 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
27 |
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
28 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
26 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
27 |
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
28 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
29 |
+
checkpoint*/** filter=lfs diff=lfs merge=lfs -text
|
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
__pycache__/
|
checkpoint_10000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5489e622f07d4ae66eb5da3f6d2e993806acce6e5eda70437de8fe60119a66c3
|
3 |
+
size 640339
|
checkpoint_10000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56d48dbb2ad1182f68360ec9994824034b69e8c52a037f8581d2ecbce6533fa4
|
3 |
+
size 984
|
checkpoint_10000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:caba6a623e094f02bf5fde1c73ade8cb01dbf7820fc24552c785371351d643dd
|
3 |
+
size 994
|
checkpoint_10000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24b236716123c3ce24c9c322388fa75a3284bfa4e18ce51811c41d049724ebc8
|
3 |
+
size 953
|
checkpoint_10000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfcd88f8c69d4a4f05b6082faa3572787c6a42a7e875d4bcfc5109c558b5ce5d
|
3 |
+
size 972
|
checkpoint_10000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:625874cbccd7fd13a63537debde2eaec26ced3ffdccfb29a821a67701374c194
|
3 |
+
size 993
|
checkpoint_10000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54c914d4b5981462e880e6759116c33efbf88bdedf6d9b98f03c8410ec5f4480
|
3 |
+
size 960
|
checkpoint_10000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a59dc255993fd6d97caa2ed0076fc96c55cd0292c29d067f6e895ffb1764dfbc
|
3 |
+
size 1004
|
checkpoint_10000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:727711d92dcf3d0d9bb4354614867ad43f1c29c7870361cce95cfbd286c0d6c3
|
3 |
+
size 974
|
checkpoint_10000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27141c7a95fb7561f43f336e11b0f3048ce44ce43d107415c77a0d6f806d51d4
|
3 |
+
size 978
|
checkpoint_10000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a84738832cc779d9edf025bcd83db953c2f62fa1324f33801feeb3b3ed75204e
|
3 |
+
size 1000
|
checkpoint_10000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52c90e728ae55d927ae3df8caf485da5e8b48d07d26ea0f9a29ec56e94225bfa
|
3 |
+
size 983
|
checkpoint_10000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd7da91e6b447d01edb3bab91bb17f79a211d75063d5554be48e74b31116452d
|
3 |
+
size 979
|
checkpoint_10000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b227dda62f36a8143cf43daf1114339bfe43401c01f94af196dfd5f7cdefa409
|
3 |
+
size 990
|
checkpoint_10000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f97424080eea16132a3ba837bba4c0a277c3ac5580fa0160c5d8694d66c7e1a
|
3 |
+
size 971
|
checkpoint_10000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8382931a106f0d8bf031578ed446d5647f1f591e698746af6f6cffde8123793
|
3 |
+
size 979
|
checkpoint_10000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4a70f184e1531a56f8b86a8c783af089edda74e5a657f9b8376688c99f6ef65
|
3 |
+
size 988
|
checkpoint_10000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41cf282d0f381498839c55251f6aa81c5b76dc75a105eb42d2014d94a8f1ac7c
|
3 |
+
size 983
|
checkpoint_10000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2638fadb0cc78e8f46a03da631a1cf458b177652ac0f9769e526750a20137ec0
|
3 |
+
size 985
|
checkpoint_10000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:259e978006b4b4b9e03b3e8246146c3719ae26481c3ea84e9df6070b46b2b853
|
3 |
+
size 990
|
checkpoint_10000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29b0b4f4727db7bbeacbac66511f4e0ea2d73d7e962302934561781052f7e5c3
|
3 |
+
size 170
|
checkpoint_10000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e02eb135cc9b64a58994c116eb73c90e8edee68eede4b67fae1f5dc3eca4450c
|
3 |
+
size 535
|
checkpoint_10000/state.param_states.encoder.encoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.encoder.encoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16ff665d2795bb938d1fa241b38e710f98bd9a3d14a83b82ddb9d0301cad6b6b
|
3 |
+
size 964
|
checkpoint_10000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0a384f59db99316e2a373fe67bc82dd45bf8eeb7b11b1781b34bc20e9cd6bdb
|
3 |
+
size 951
|
checkpoint_10000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_10000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0edb8b86f5da06dacd0dfb486f779992aac0730a7d8ad73d6a2adad4691b31e0
|
3 |
+
size 952
|
checkpoint_10000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|