aapot
commited on
Commit
·
ec03465
1
Parent(s):
4e41742
Add 350k train step and HF flax model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_350000/checkpoint +3 -0
- checkpoint_350000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 +3 -0
- checkpoint_350000/state.param_states.encoder.encoder_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.encoder.encoder_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
checkpoint_350000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4cb2800c5c4f200581c7f7076307b8199ba2552b850434005bde2327211be0f
|
3 |
+
size 640339
|
checkpoint_350000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d47526e7e9486a4fe8b6cdfd03c7f9193f473ba0530582636d2a74f9345d80e
|
3 |
+
size 957
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e13b6e4230a517a4c2cae060350bcb01d5ad0eba6e9017feaf035f9d6637e6b
|
3 |
+
size 972
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9aebc9f7a641513861bdac6ee4ce75b321b756464069c12edb23cb86fe69439
|
3 |
+
size 975
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2627eab5341996661e7f2e33f893176a1e3f2cd16a7fa67866b7ea686888113
|
3 |
+
size 1001
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:294eaaaf846137fbb9060878d5a1886911fd7a9f043fddf01a7c394690451c4a
|
3 |
+
size 987
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:884ecae0f0eea73ab3d767a7b3dfba847d3e17cd6a2a815cbc0d7c036613bb3a
|
3 |
+
size 952
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a0317f41bb49d3f186e911f698d1741e96d5d025e5691bbb5b2881d9f766598
|
3 |
+
size 1002
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57d7c0aa8ec9fde785786c16e0fce0a922e8c8295c0cd9a9bea19394bb808416
|
3 |
+
size 980
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec70e467ea08b56796860b8221ebdd5a8f652ad2bf5ae49b2fee2cdf3fe237a9
|
3 |
+
size 961
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb03a5b798076888a422201d77206767e2c11ab2f36127e9464044e23137368
|
3 |
+
size 986
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cca18ec2a3fa525703da92ce1db416f045f039aee294da2e02191b12b1c43e26
|
3 |
+
size 971
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae4346c8221b156b40cccffaa68907cdb5c58c813ef971a9c5fbe325a3a5875c
|
3 |
+
size 979
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7824efdc3ef1dcdf753cb6c2a9924e92b430428a9e9d16f2b31b5a61abc10b26
|
3 |
+
size 988
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30a1839d234b4018337211f90c303c99f818d3e6b3cb4d2e6441c7eb6b2b6114
|
3 |
+
size 980
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b79a8ca42844d2d3a851468a05aaf3bb73e250dd135a9ff284e5099b45653f5e
|
3 |
+
size 979
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ea2e1bfdc9e6e3566844c34ce011abef2d5433581cbffdbb2f42b5de7daf81f
|
3 |
+
size 973
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:918c1ea46da62c71cacd6d59257a36cc8cfd5eaca211af6f986bfd954b95750d
|
3 |
+
size 979
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd0f2c021b6ad9c57a7a308895bd5860c3a41349372659723228c96c32b594cf
|
3 |
+
size 973
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:151b4e4e2b62577995f16391a6abbc2ea2f5583dc0f65da7e8f50c98bc0a152c
|
3 |
+
size 962
|
checkpoint_350000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29b0b4f4727db7bbeacbac66511f4e0ea2d73d7e962302934561781052f7e5c3
|
3 |
+
size 170
|
checkpoint_350000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ffef5170858ad37a2dd390f83dd18ef9e5edb7ef6d0a023de4b340bddfed3b4
|
3 |
+
size 535
|
checkpoint_350000/state.param_states.encoder.encoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.encoder.encoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:015a47fd8b68c163b247d358334fb2a45d9366ae2b38ae89b225ea134fbfb1e1
|
3 |
+
size 984
|
checkpoint_350000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d8f056d19bb4360ea8e9d0c5f6f1b6697493203a6e5ffcde5c9e3cabc9f2e44
|
3 |
+
size 974
|
checkpoint_350000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a405392327b0be6358e87db46f29361c37ad7fa77c68b9b3469c912661dcce0f
|
3 |
+
size 974
|
checkpoint_350000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:252ae51790d790172959df3aad71e71a43798013443d2e821cfb40cd3636e625
|
3 |
+
size 990
|
checkpoint_350000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
|
3 |
+
size 168
|