aapot
commited on
Commit
•
06dc3e1
1
Parent(s):
65983d1
Add 850K train step and HF flax model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_850000/checkpoint +3 -0
- checkpoint_850000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 +3 -0
- checkpoint_850000/state.param_states.encoder.encoder_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.encoder.encoder_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
checkpoint_850000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f0ce29e3d1453a9560f2a753b86b16de9581b1785fd415635d0c6e3d27041ed
|
3 |
+
size 2792047
|
checkpoint_850000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a450853aaa2f97d05c6c7894ac8ee2f8af3279958c7b08a96834dc0bed994da5
|
3 |
+
size 5671
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1936f62962d5fd89cf784578e5105a20686b736c032c26474f26a2707a1ede1
|
3 |
+
size 5605
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9750deb0fdd75d5b480543b34b9e4cdc2cbd101c3811e17778ecd8beae561e71
|
3 |
+
size 5502
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85ee78e455c3fb6287e8f81a5daddd82071fe604a45a08a09c5691c0d56f3b2d
|
3 |
+
size 5698
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e273a5c6905c05f6d526192812b1412edfe03b2ec504ddc64427cf5ffb3fecfc
|
3 |
+
size 5525
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a16f42add4c7b9bd25964aab0fd6f00edc4852cbc78e65202c8fc8bac91213a0
|
3 |
+
size 5369
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19c5ead7d0bad6e8c8474082b28340b8f0a309cd690c07aae8aac66cf9ed40fc
|
3 |
+
size 5442
|
checkpoint_850000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52e3ffca647ec32d3f12e9083e4b0eaea58e6db1de56ba4324552fed51ed58b0
|
3 |
+
size 5447
|
checkpoint_850000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68d047f65c9aac59e62f6b04cac97b8c0545a0015a2bebb2bb4f74f718c4d106
|
3 |
+
size 5408
|
checkpoint_850000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a8b847c768c3516c1edea881383593f241647cd92ad6ea34ae2099d4ef7a632
|
3 |
+
size 5329
|
checkpoint_850000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b7718f6092ef2e6180cea084cb760d6c824d04c6525f66b6fba3c28ff01c7b1
|
3 |
+
size 5426
|
checkpoint_850000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46924384e491b365d98add5f7f6f5b6c1c7d3815ddcbe9858422860b492da77a
|
3 |
+
size 5431
|
checkpoint_850000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ead91c86910bdf3dcbc6f03373cf34c51c149a965c633bc771cb3a05460c18a6
|
3 |
+
size 5352
|
checkpoint_850000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3af565877f93e1d694f4d7fa1cf6e93469716b64b37b09a01b018e00066400d0
|
3 |
+
size 5385
|
checkpoint_850000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79fee684e9e651c94897775abbfd1ebe05eb06d2d84830c249d429f72bd3cfdb
|
3 |
+
size 5267
|
checkpoint_850000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b98f2d6a043b0eb69cfce9a4fe0e4da50c967054c9c34b901d008c566a25ef5c
|
3 |
+
size 5368
|
checkpoint_850000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:959c02f078e9ee882142e8c7c7a7b17d418acc45b603cbda013a0bad6e3bc43a
|
3 |
+
size 5469
|
checkpoint_850000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6fa091b96318f455abd1ce5a9b4291dfc79716032373d96cf813fe3c99676ad
|
3 |
+
size 5288
|
checkpoint_850000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c316b0539fbc20a6c8de641e9c9e9365a656b1d45a408760adf17ede88e0b68b
|
3 |
+
size 5294
|
checkpoint_850000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7028b3f2007ef72746d64487314ca6723cab7f9713ecb30bd30b73a22418e831
|
3 |
+
size 172
|
checkpoint_850000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:286f2d54c3492fb2c2bce5e3445531fb02a769d3fabf1a13877952f91cdce2f6
|
3 |
+
size 1427
|
checkpoint_850000/state.param_states.encoder.encoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.encoder.encoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa666465c9b25a22f51c246314f66152e095a3a6c7daaa2fb06d40dce3553122
|
3 |
+
size 5376
|
checkpoint_850000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52d3bb7d320510d70c19c6a59d7d6808047053eca7959ab34cddb86ceabf1cbd
|
3 |
+
size 5696
|
checkpoint_850000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eeb23c5b86d4085711e99c227af9facb3ee0f43ad724ba6b1a34cedf894d7f98
|
3 |
+
size 5541
|
checkpoint_850000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c5ad033cc745211def52d7637cf9d54d2c9082cc87053288aed44294b8f2160
|
3 |
+
size 5581
|
checkpoint_850000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|