Adrià Garriga-Alonso
committed on
Commit
·
7503349
1
Parent(s):
4254568
All models and their resets
Browse files
- docstring_reset_heads_neurons.pt +3 -0
- docstring_reset_heads_neurons_test_metrics.json +1 -0
- greaterthan_reset_heads_neurons.pt +3 -0
- greaterthan_reset_heads_neurons_test_metrics.json +1 -0
- induction_reset_heads_neurons.pt +3 -0
- induction_reset_heads_neurons_test_metrics.json +1 -0
- ioi_reset_heads_neurons.pt +3 -0
- ioi_reset_heads_neurons_test_metrics.json +1 -0
- tracr_proportion_reset_heads_head_outputs_neurons.pt +3 -0
- tracr_proportion_reset_heads_head_outputs_neurons_test_metrics.json +1 -0
- tracr_proportion_reset_heads_neurons.pt +3 -0
- tracr_proportion_reset_heads_neurons_test_metrics.json +1 -0
- tracr_reverse_reset_heads_head_outputs_neurons.pt +3 -0
- tracr_reverse_reset_heads_head_outputs_neurons_test_metrics.json +1 -0
- tracr_reverse_reset_heads_neurons.pt +3 -0
- tracr_reverse_reset_heads_neurons_test_metrics.json +1 -0
docstring_reset_heads_neurons.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a771d91c94c7d8d875ace5c438d46b1bc2c23388bfa8387eb91f910b7e43643
|
3 |
+
size 220989397
|
docstring_reset_heads_neurons_test_metrics.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"trained_orig": {"kl_div": 0.0, "docstring_metric": -0.8751506805419922, "docstring_stefan": -0.6599999666213989, "nll": 1.5616439580917358, "match_nll": 0.0}, "trained_patched": {"kl_div": 3.2466509342193604, "docstring_metric": 5.734002113342285, "docstring_stefan": -0.0, "nll": 7.317677021026611, "match_nll": 5.756032466888428}, "reset_orig": {"kl_div": 9.219705581665039, "docstring_metric": 3.7328319549560547, "docstring_stefan": -0.03999999910593033, "nll": 12.243091583251953, "match_nll": 10.681447982788086}, "reset_patched": {"kl_div": 9.179398536682129, "docstring_metric": 3.727224826812744, "docstring_stefan": -0.03999999910593033, "nll": 12.215778350830078, "match_nll": 10.654132843017578}}
|
greaterthan_reset_heads_neurons.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9b28252a917f141e9280dcca7fbe82f58e670e1b0e2a6f0d77e37575f595bfb
|
3 |
+
size 664833785
|
greaterthan_reset_heads_neurons_test_metrics.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"trained_orig": {"greaterthan": -0.899685800075531, "kl_div": -3.2660567583775446e-09}, "trained_patched": {"greaterthan": 0.546195387840271, "kl_div": 2.0358293056488037}, "reset_orig": {"greaterthan": 3.6216224543750286e-06, "kl_div": 16.261964797973633}, "reset_patched": {"greaterthan": 3.66029235010501e-06, "kl_div": 16.13994026184082}}
|
induction_reset_heads_neurons.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bc0d492cd984c58ee4e7077e0013bb628c5b002f76b0476e305e6eaf366ced9
|
3 |
+
size 115738059
|
induction_reset_heads_neurons_test_metrics.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"trained_orig": {"kl_div": 0.0, "nll": 1.0137733221054077, "match_nll": 0.0}, "trained_patched": {"kl_div": 15.689358711242676, "nll": 16.729799270629883, "match_nll": 15.716024398803711}, "reset_orig": {"kl_div": 15.230734825134277, "nll": 16.419483184814453, "match_nll": 15.405710220336914}, "reset_patched": {"kl_div": 16.83327865600586, "nll": 17.941612243652344, "match_nll": 16.927837371826172}}
|
ioi_reset_heads_neurons.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82e43314f88b108fc1b366714eb6ed01943551854832438bc7f2fce376774298
|
3 |
+
size 664832393
|
ioi_reset_heads_neurons_test_metrics.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"trained_orig": {"kl_div": 4.962598776359073e-09, "logit_diff": -4.112348556518555, "frac_correct": -1.0, "nll": 0.5148709416389465, "match_nll": -1.9147991636714323e-08}, "trained_patched": {"kl_div": 4.759255409240723, "logit_diff": -0.015997886657714844, "frac_correct": -0.550000011920929, "nll": 7.773514270782471, "match_nll": 7.258643627166748}, "reset_orig": {"kl_div": 10.326383590698242, "logit_diff": -0.2732362747192383, "frac_correct": -0.5099999904632568, "nll": 13.974164962768555, "match_nll": 13.459294319152832}, "reset_patched": {"kl_div": 10.413257598876953, "logit_diff": -0.31786441802978516, "frac_correct": -0.5299999713897705, "nll": 14.055498123168945, "match_nll": 13.540627479553223}}
|
tracr_proportion_reset_heads_head_outputs_neurons.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2db397281e84edf8847dbd6a72e00b59dddc654448129c050100e46cb3a8ef9
|
3 |
+
size 15577
|
tracr_proportion_reset_heads_head_outputs_neurons_test_metrics.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"trained_orig": {"l2": 0.0, "kl_div": 0.0}, "trained_patched": {"l2": 0.14370369911193848, "kl_div": 0.011712733656167984}, "reset_orig": {"l2": 0.10203703492879868, "kl_div": 0.008652940392494202}, "reset_patched": {"l2": 0.10203703492879868, "kl_div": 0.008652940392494202}}
|
tracr_proportion_reset_heads_neurons.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14ee28f32cfab53319256c3da2d2b93283391a4a41a7fed8f2891a140bad61d3
|
3 |
+
size 14623
|
tracr_proportion_reset_heads_neurons_test_metrics.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"trained_orig": {"l2": 0.10203703492879868, "kl_div": 0.008652940392494202}, "trained_patched": {"l2": 0.10203703492879868, "kl_div": 0.008652940392494202}, "reset_orig": {"l2": 0.10203703492879868, "kl_div": 0.008652940392494202}, "reset_patched": {"l2": 0.10203703492879868, "kl_div": 0.008652940392494202}}
|
tracr_reverse_reset_heads_head_outputs_neurons.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96e4a781e7c6c7157a961ae94335092b52164cdf416c75e5eeabe45b98edb87f
|
3 |
+
size 96291
|
tracr_reverse_reset_heads_head_outputs_neurons_test_metrics.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"trained_orig": {"kl_div": 0.0}, "trained_patched": {"kl_div": 0.21243534982204437}, "reset_orig": {"kl_div": 0.09246326982975006}, "reset_patched": {"kl_div": 0.09246326982975006}}
|
tracr_reverse_reset_heads_neurons.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bd2638f0a4dbfca62cd5fae6aee77b2b534fadbfc02f04bcdcaee1f2a48d7bf
|
3 |
+
size 94653
|
tracr_reverse_reset_heads_neurons_test_metrics.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"trained_orig": {"kl_div": 0.09246326982975006}, "trained_patched": {"kl_div": 0.09246326982975006}, "reset_orig": {"kl_div": 0.09246326982975006}, "reset_patched": {"kl_div": 0.09246326982975006}}
|