aapot
commited on
Commit
•
65983d1
1
Parent(s):
7c9d89f
Add 820K train step and HF flax model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_820000/checkpoint +3 -0
- checkpoint_820000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray +3 -0
- checkpoint_820000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 +3 -0
- checkpoint_820000/state.param_states.encoder.encoder_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.encoder.encoder_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_820000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_820000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
checkpoint_820000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3b37ff2fd870e6e30a553ae2255cda5a470d66d72ccc13b595ac261b0751d64
|
3 |
+
size 2792047
|
checkpoint_820000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09bbba355c34baaddac1bc8632014e0b8b58d1889981289b7cc23127034245f4
|
3 |
+
size 5673
|
checkpoint_820000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc245f7c2be245fc796730e7ac59c83d5ee8fedaac73095cb94678b61a2c628a
|
3 |
+
size 5613
|
checkpoint_820000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6aa4b65c00d0519cadcb821478c1289ec8a75f15a0311962a5879c050368d9c8
|
3 |
+
size 5502
|
checkpoint_820000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9ef25d9637607d1b5a2853e1a445a0107dfba4a90641bf4c657c01b8fd36856
|
3 |
+
size 5697
|
checkpoint_820000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f13fb52167776a1568671f14ef11a3587e460ae08bc4b9da15691cdd710fb93e
|
3 |
+
size 5518
|
checkpoint_820000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fa72e1af81f48d0d9e309e034f9eb07b5a8ce23772b36a4044fb8017fa79d2f
|
3 |
+
size 5370
|
checkpoint_820000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e94692afc46bf71e75d7f993c285ff2ef690096e148a49cf61e2f9bb82c769cb
|
3 |
+
size 5443
|
checkpoint_820000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a08e7d036398f7ce052fd0558e9d7dd2578bebf7dceea1b3a0031b4150ad64c0
|
3 |
+
size 5433
|
checkpoint_820000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:032771ab393d1c84fe6f61c2ecf417502ddaba7576df4b29298896fd8942dd9f
|
3 |
+
size 5410
|
checkpoint_820000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1f3ca009dce3ea1611426f64baec8f3056aba61862bd8480ac108df27477455
|
3 |
+
size 5342
|
checkpoint_820000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9b4479cd727082c0272929c336e6cd1d467f373debc9177476c41966be7d57d
|
3 |
+
size 5420
|
checkpoint_820000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae52debf1bd864839ea600a3e1f9dda2e1a96fa02154b2b49d1a93b5df275892
|
3 |
+
size 5408
|
checkpoint_820000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be89b1f54592f82e83f2ebdc6d21dd2df17991022194bc1a29829896cb34d3a8
|
3 |
+
size 5340
|
checkpoint_820000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:186e158de8905705a498dc48e2cf043a771dbc0bf461c39e991d3847eb7dd530
|
3 |
+
size 5367
|
checkpoint_820000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:032a9cf24f59394177911dcadf5eb0257776f581513762645fc5f274dddae2a8
|
3 |
+
size 5273
|
checkpoint_820000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f748e1a69aa8d570626c28c8cf5884abb8130ae46250c9f325bac93d9bb0c9d
|
3 |
+
size 5422
|
checkpoint_820000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f9f9782d4856b45564d33e6703093175501cc83227b1dfcbabbbbcb2873b3a2
|
3 |
+
size 5469
|
checkpoint_820000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76d87623f00ca71138e4a86cd5caa943ec1103a91da92609962f4d000709e0a6
|
3 |
+
size 5275
|
checkpoint_820000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6418a0c450d3b37644159db743e867f7e19312e7aa6a59d1411f05ed38b5d482
|
3 |
+
size 5305
|
checkpoint_820000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7028b3f2007ef72746d64487314ca6723cab7f9713ecb30bd30b73a22418e831
|
3 |
+
size 172
|
checkpoint_820000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4463c4fd019d1f8e710341ca8e25fcbc4ca65fc5543d9cad8be4aa992bfe098a
|
3 |
+
size 1427
|
checkpoint_820000/state.param_states.encoder.encoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.encoder.encoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3376d0b76ca91ca2a117daef7e7626afb9ea054bcd0137f6c59754b209fa507
|
3 |
+
size 5398
|
checkpoint_820000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dc5cc7ad265b9aebea5afb69393aff614077009f99f648729a31e2126c092d2
|
3 |
+
size 5696
|
checkpoint_820000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8e9ee9c4c0857ad8fa0667f35acf04e466cb19e4758f0ebcb5081994cbdde96
|
3 |
+
size 5545
|
checkpoint_820000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|
checkpoint_820000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3d6d69ad755e2c060675bea8735da70c63ab9674eb9ae716739b9aa7e647432
|
3 |
+
size 5571
|
checkpoint_820000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15454ca58ace9d64cc661f694fa3a5c43479ab9e9298e3f5d36932e899b8ecc
|
3 |
+
size 170
|