Add mt5 causal analysis with decoder ids
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz +3 -0
- causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz +3 -0
- causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz +3 -0
- causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_mlp.pdf +0 -0
- causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_mlp.pdf +0 -0
- causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz +3 -0
- causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz +3 -0
- causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz +3 -0
- causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_mlp.pdf +0 -0
- causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_mlp.pdf +0 -0
- causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz +3 -0
- causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz +3 -0
- causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz +3 -0
- causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_mlp.pdf +0 -0
- causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_mlp.pdf +0 -0
- causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz +3 -0
- causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz +3 -0
- causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz +3 -0
- causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_mlp.pdf +0 -0
- causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_mlp.pdf +0 -0
- causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz +3 -0
- causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz +3 -0
- causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz +3 -0
- causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_mlp.pdf +0 -0
- causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_mlp.pdf +0 -0
- causal_analysis/google__mt5-xl/ja_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf +0 -0
- causal_analysis/google__mt5-xl/ja_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf +0 -0
- causal_analysis/google__mt5-xl/ja_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz +3 -0
- causal_analysis/google__mt5-xl/ja_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz +3 -0
- causal_analysis/google__mt5-xl/ja_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz +3 -0
causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf
ADDED
Binary file (24.1 kB). View file
|
|
causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf
ADDED
Binary file (23.3 kB). View file
|
|
causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c42a1a5bbcb255af59638cb6b06f7fc0dc7522601c04fb15286a53119b513bd
|
3 |
+
size 11136
|
causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1f4be827c7569ae0f500c2a18abe7e9ab4923a09c516ed88f674895544d084b
|
3 |
+
size 11002
|
causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7749886ae3dd57b6a80d885b36e21f4a1dd1cda028aec258d91b3094942d38ba
|
3 |
+
size 10998
|
causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_mlp.pdf
ADDED
Binary file (26 kB). View file
|
|
causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_None.pdf
ADDED
Binary file (24.6 kB). View file
|
|
causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_attn.pdf
ADDED
Binary file (25.2 kB). View file
|
|
causal_analysis/google__mt5-xl/ar_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_mlp.pdf
ADDED
Binary file (26.6 kB). View file
|
|
causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf
ADDED
Binary file (24.5 kB). View file
|
|
causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf
ADDED
Binary file (24.2 kB). View file
|
|
causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e72d30152fb02670217c24d331b2e3555d74bc3a01ffe3a7cddb72de682c228d
|
3 |
+
size 11136
|
causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58727d958ff94c16c222489ec31c972a4992d76b008881fc6fc41b04c74b20ba
|
3 |
+
size 11002
|
causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c03169f26dba7f0c6a1380ccd2c3979f3429d45d665d98a037467e83411864bf
|
3 |
+
size 10998
|
causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_mlp.pdf
ADDED
Binary file (25.8 kB). View file
|
|
causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_None.pdf
ADDED
Binary file (25.1 kB). View file
|
|
causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_attn.pdf
ADDED
Binary file (26.2 kB). View file
|
|
causal_analysis/google__mt5-xl/en_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_mlp.pdf
ADDED
Binary file (26.5 kB). View file
|
|
causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf
ADDED
Binary file (24.2 kB). View file
|
|
causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf
ADDED
Binary file (23.4 kB). View file
|
|
causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90616d1d8b5b2c4c99c7c2e0fc6ae6e7f12b6cda5a2a574662812bc44e453e82
|
3 |
+
size 11136
|
causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f3fbf29080fdc1c16a0d400889b82186240d55fce55d6df5e4cbfd5d83ec93b
|
3 |
+
size 11002
|
causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ba1fc50d26a5cb4961bdc3a308a126d1b40d3c0ae67c27891d1182638ac3cf3
|
3 |
+
size 10998
|
causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_mlp.pdf
ADDED
Binary file (25.7 kB). View file
|
|
causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_None.pdf
ADDED
Binary file (25 kB). View file
|
|
causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_attn.pdf
ADDED
Binary file (25.2 kB). View file
|
|
causal_analysis/google__mt5-xl/es_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_mlp.pdf
ADDED
Binary file (26.5 kB). View file
|
|
causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf
ADDED
Binary file (24.3 kB). View file
|
|
causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf
ADDED
Binary file (23.9 kB). View file
|
|
causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3243245310ecde0a09e1cd06b6d9c28451229fb21458ee6b05e8171a8d0e4bac
|
3 |
+
size 11136
|
causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a7c6b872bf115282be28f1e07953695480dad9ef54889ca95e5304d8d54c965
|
3 |
+
size 11002
|
causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:215f5143bed35c52edd66c6e6e3d916546874ec1204fc3a4f16bcc6600a12369
|
3 |
+
size 10998
|
causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_mlp.pdf
ADDED
Binary file (26.3 kB). View file
|
|
causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_None.pdf
ADDED
Binary file (24.8 kB). View file
|
|
causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_attn.pdf
ADDED
Binary file (25.4 kB). View file
|
|
causal_analysis/google__mt5-xl/fa_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_mlp.pdf
ADDED
Binary file (26.6 kB). View file
|
|
causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf
ADDED
Binary file (24.2 kB). View file
|
|
causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf
ADDED
Binary file (24.1 kB). View file
|
|
causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3771edd4f2405375a366ef29cc3721c6cc5a745362550c3a0cb2b37e36e79bd6
|
3 |
+
size 11136
|
causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7e3af987540eeec34253a770a690f2b267c433a72dbd232aed25af66b005480
|
3 |
+
size 11002
|
causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:187fe2eb395df9ab4ea79ca2e1b9c987b5ad189af36982c832b4ae20e04cea5b
|
3 |
+
size 10998
|
causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_mlp.pdf
ADDED
Binary file (26.3 kB). View file
|
|
causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_None.pdf
ADDED
Binary file (24.6 kB). View file
|
|
causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_attn.pdf
ADDED
Binary file (25.8 kB). View file
|
|
causal_analysis/google__mt5-xl/he_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/ticks_avg_mlp.pdf
ADDED
Binary file (27.1 kB). View file
|
|
causal_analysis/google__mt5-xl/ja_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_None.pdf
ADDED
Binary file (23.7 kB). View file
|
|
causal_analysis/google__mt5-xl/ja_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_attn.pdf
ADDED
Binary file (24.6 kB). View file
|
|
causal_analysis/google__mt5-xl/ja_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_None.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2509585878c1a247773bb14f22be2843a82b42f7458fd0340c9a73872d388635
|
3 |
+
size 11136
|
causal_analysis/google__mt5-xl/ja_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_attn.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1bd697f8debca1434820686b33c4f47f7b63aeef15ef79da9a9c652f650178f
|
3 |
+
size 11002
|
causal_analysis/google__mt5-xl/ja_xlingual_mpararel_mlm_subset_window=6/plots_resample_trivial/avg_data_mlp.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:018894ffe1a71a12758808ac7ab877dddff3405f0163729176a146f72214cf7b
|
3 |
+
size 10998
|