diff --git a/emb-norm-6k/000-module.3.input_layernorm/events.out.tfevents.1638234920.r6i3n2.1319219.5 b/emb-norm-14.6k/000-module.3.input_layernorm/events.out.tfevents.1638234920.r6i3n2.1319219.5 similarity index 100% rename from emb-norm-6k/000-module.3.input_layernorm/events.out.tfevents.1638234920.r6i3n2.1319219.5 rename to emb-norm-14.6k/000-module.3.input_layernorm/events.out.tfevents.1638234920.r6i3n2.1319219.5 diff --git a/emb-norm-6k/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.13 b/emb-norm-14.6k/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.13 similarity index 100% rename from emb-norm-6k/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.13 rename to emb-norm-14.6k/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.13 diff --git a/emb-norm-6k/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.12 b/emb-norm-14.6k/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.12 similarity index 100% rename from emb-norm-6k/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.12 rename to emb-norm-14.6k/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.12 diff --git a/emb-norm-6k/000-module.3.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.14 b/emb-norm-14.6k/000-module.3.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.14 similarity index 100% rename from emb-norm-6k/000-module.3.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.14 rename to emb-norm-14.6k/000-module.3.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.14 diff --git a/emb-norm-6k/000-module.3.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.11 b/emb-norm-14.6k/000-module.3.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.11 similarity index 100% rename from emb-norm-6k/000-module.3.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.11 rename to emb-norm-14.6k/000-module.3.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.11 diff --git a/emb-norm-6k/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.8 b/emb-norm-14.6k/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.8 similarity index 100% rename from emb-norm-6k/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.8 rename to emb-norm-14.6k/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.8 diff --git a/emb-norm-6k/000-module.3.self_attention.dense/events.out.tfevents.1638234920.r6i3n2.1319219.9 b/emb-norm-14.6k/000-module.3.self_attention.dense/events.out.tfevents.1638234920.r6i3n2.1319219.9 similarity index 100% rename from emb-norm-6k/000-module.3.self_attention.dense/events.out.tfevents.1638234920.r6i3n2.1319219.9 rename to emb-norm-14.6k/000-module.3.self_attention.dense/events.out.tfevents.1638234920.r6i3n2.1319219.9 diff --git a/emb-norm-6k/000-module.3.self_attention.query_key_value/events.out.tfevents.1638234920.r6i3n2.1319219.6 b/emb-norm-14.6k/000-module.3.self_attention.query_key_value/events.out.tfevents.1638234920.r6i3n2.1319219.6 similarity index 100% rename from emb-norm-6k/000-module.3.self_attention.query_key_value/events.out.tfevents.1638234920.r6i3n2.1319219.6 rename to emb-norm-14.6k/000-module.3.self_attention.query_key_value/events.out.tfevents.1638234920.r6i3n2.1319219.6 diff --git a/emb-norm-6k/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638234920.r6i3n2.1319219.7 b/emb-norm-14.6k/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638234920.r6i3n2.1319219.7 similarity index 100% rename from emb-norm-6k/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638234920.r6i3n2.1319219.7 rename to emb-norm-14.6k/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638234920.r6i3n2.1319219.7 diff --git a/emb-norm-6k/000-module.3.self_attention/events.out.tfevents.1638234920.r6i3n2.1319219.10 b/emb-norm-14.6k/000-module.3.self_attention/events.out.tfevents.1638234920.r6i3n2.1319219.10 similarity index 100% rename from emb-norm-6k/000-module.3.self_attention/events.out.tfevents.1638234920.r6i3n2.1319219.10 rename to emb-norm-14.6k/000-module.3.self_attention/events.out.tfevents.1638234920.r6i3n2.1319219.10 diff --git a/emb-norm-6k/000-module.3/events.out.tfevents.1638234921.r6i3n2.1319219.15 b/emb-norm-14.6k/000-module.3/events.out.tfevents.1638234921.r6i3n2.1319219.15 similarity index 100% rename from emb-norm-6k/000-module.3/events.out.tfevents.1638234921.r6i3n2.1319219.15 rename to emb-norm-14.6k/000-module.3/events.out.tfevents.1638234921.r6i3n2.1319219.15 diff --git a/emb-norm-6k/000-module.4.input_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.16 b/emb-norm-14.6k/000-module.4.input_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.16 similarity index 100% rename from emb-norm-6k/000-module.4.input_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.16 rename to emb-norm-14.6k/000-module.4.input_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.16 diff --git a/emb-norm-6k/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.24 b/emb-norm-14.6k/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.24 similarity index 100% rename from emb-norm-6k/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.24 rename to emb-norm-14.6k/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.24 diff --git a/emb-norm-6k/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.23 b/emb-norm-14.6k/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.23 similarity index 100% rename from emb-norm-6k/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.23 rename to emb-norm-14.6k/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.23 diff --git a/emb-norm-6k/000-module.4.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.25 b/emb-norm-14.6k/000-module.4.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.25 similarity index 100% rename from emb-norm-6k/000-module.4.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.25 rename to emb-norm-14.6k/000-module.4.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.25 diff --git a/emb-norm-6k/000-module.4.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.22 b/emb-norm-14.6k/000-module.4.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.22 similarity index 100% rename from emb-norm-6k/000-module.4.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.22 rename to emb-norm-14.6k/000-module.4.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.22 diff --git a/emb-norm-6k/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638234921.r6i3n2.1319219.19 b/emb-norm-14.6k/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638234921.r6i3n2.1319219.19 similarity index 100% rename from emb-norm-6k/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638234921.r6i3n2.1319219.19 rename to emb-norm-14.6k/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638234921.r6i3n2.1319219.19 diff --git a/emb-norm-6k/000-module.4.self_attention.dense/events.out.tfevents.1638234921.r6i3n2.1319219.20 b/emb-norm-14.6k/000-module.4.self_attention.dense/events.out.tfevents.1638234921.r6i3n2.1319219.20 similarity index 100% rename from emb-norm-6k/000-module.4.self_attention.dense/events.out.tfevents.1638234921.r6i3n2.1319219.20 rename to emb-norm-14.6k/000-module.4.self_attention.dense/events.out.tfevents.1638234921.r6i3n2.1319219.20 diff --git a/emb-norm-6k/000-module.4.self_attention.query_key_value/events.out.tfevents.1638234921.r6i3n2.1319219.17 b/emb-norm-14.6k/000-module.4.self_attention.query_key_value/events.out.tfevents.1638234921.r6i3n2.1319219.17 similarity index 100% rename from emb-norm-6k/000-module.4.self_attention.query_key_value/events.out.tfevents.1638234921.r6i3n2.1319219.17 rename to emb-norm-14.6k/000-module.4.self_attention.query_key_value/events.out.tfevents.1638234921.r6i3n2.1319219.17 diff --git a/emb-norm-6k/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638234921.r6i3n2.1319219.18 b/emb-norm-14.6k/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638234921.r6i3n2.1319219.18 similarity index 100% rename from emb-norm-6k/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638234921.r6i3n2.1319219.18 rename to emb-norm-14.6k/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638234921.r6i3n2.1319219.18 diff --git a/emb-norm-6k/000-module.4.self_attention/events.out.tfevents.1638234921.r6i3n2.1319219.21 b/emb-norm-14.6k/000-module.4.self_attention/events.out.tfevents.1638234921.r6i3n2.1319219.21 similarity index 100% rename from emb-norm-6k/000-module.4.self_attention/events.out.tfevents.1638234921.r6i3n2.1319219.21 rename to emb-norm-14.6k/000-module.4.self_attention/events.out.tfevents.1638234921.r6i3n2.1319219.21 diff --git a/emb-norm-6k/000-module.4/events.out.tfevents.1638234921.r6i3n2.1319219.26 b/emb-norm-14.6k/000-module.4/events.out.tfevents.1638234921.r6i3n2.1319219.26 similarity index 100% rename from emb-norm-6k/000-module.4/events.out.tfevents.1638234921.r6i3n2.1319219.26 rename to emb-norm-14.6k/000-module.4/events.out.tfevents.1638234921.r6i3n2.1319219.26 diff --git a/emb-norm-6k/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.3 b/emb-norm-14.6k/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.3 similarity index 100% rename from emb-norm-6k/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.3 rename to emb-norm-14.6k/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.3 diff --git a/emb-norm-6k/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.2 b/emb-norm-14.6k/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.2 similarity index 100% rename from emb-norm-6k/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.2 rename to emb-norm-14.6k/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.2 diff --git a/emb-norm-6k/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1638234920.r6i3n2.1319219.0 b/emb-norm-14.6k/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1638234920.r6i3n2.1319219.0 similarity index 100% rename from emb-norm-6k/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1638234920.r6i3n2.1319219.0 rename to emb-norm-14.6k/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1638234920.r6i3n2.1319219.0 diff --git a/emb-norm-6k/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.1 b/emb-norm-14.6k/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.1 similarity index 100% rename from emb-norm-6k/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.1 rename to emb-norm-14.6k/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.1 diff --git a/emb-norm-6k/000-module.tied_modules.embed/events.out.tfevents.1638234920.r6i3n2.1319219.4 b/emb-norm-14.6k/000-module.tied_modules.embed/events.out.tfevents.1638234920.r6i3n2.1319219.4 similarity index 100% rename from emb-norm-6k/000-module.tied_modules.embed/events.out.tfevents.1638234920.r6i3n2.1319219.4 rename to emb-norm-14.6k/000-module.tied_modules.embed/events.out.tfevents.1638234920.r6i3n2.1319219.4 diff --git a/emb-norm-6k/000-module/events.out.tfevents.1638234921.r6i3n2.1319219.27 b/emb-norm-14.6k/000-module/events.out.tfevents.1638234921.r6i3n2.1319219.27 similarity index 100% rename from emb-norm-6k/000-module/events.out.tfevents.1638234921.r6i3n2.1319219.27 rename to emb-norm-14.6k/000-module/events.out.tfevents.1638234921.r6i3n2.1319219.27 diff --git a/emb-norm-6k/056-module.17.input_layernorm/events.out.tfevents.1638234932.r6i5n3.61809.0 b/emb-norm-14.6k/056-module.17.input_layernorm/events.out.tfevents.1638234932.r6i5n3.61809.0 similarity index 100% rename from emb-norm-6k/056-module.17.input_layernorm/events.out.tfevents.1638234932.r6i5n3.61809.0 rename to emb-norm-14.6k/056-module.17.input_layernorm/events.out.tfevents.1638234932.r6i5n3.61809.0 diff --git a/emb-norm-6k/056-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.8 b/emb-norm-14.6k/056-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.8 similarity index 100% rename from emb-norm-6k/056-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.8 rename to emb-norm-14.6k/056-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.8 diff --git a/emb-norm-6k/056-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.7 b/emb-norm-14.6k/056-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.7 similarity index 100% rename from emb-norm-6k/056-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.7 rename to emb-norm-14.6k/056-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.7 diff --git a/emb-norm-6k/056-module.17.mlp/events.out.tfevents.1638234933.r6i5n3.61809.9 b/emb-norm-14.6k/056-module.17.mlp/events.out.tfevents.1638234933.r6i5n3.61809.9 similarity index 100% rename from emb-norm-6k/056-module.17.mlp/events.out.tfevents.1638234933.r6i5n3.61809.9 rename to emb-norm-14.6k/056-module.17.mlp/events.out.tfevents.1638234933.r6i5n3.61809.9 diff --git a/emb-norm-6k/056-module.17.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.6 b/emb-norm-14.6k/056-module.17.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.6 similarity index 100% rename from emb-norm-6k/056-module.17.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.6 rename to emb-norm-14.6k/056-module.17.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.6 diff --git a/emb-norm-6k/056-module.17.self_attention.attention_dropout/events.out.tfevents.1638234932.r6i5n3.61809.3 b/emb-norm-14.6k/056-module.17.self_attention.attention_dropout/events.out.tfevents.1638234932.r6i5n3.61809.3 similarity index 100% rename from emb-norm-6k/056-module.17.self_attention.attention_dropout/events.out.tfevents.1638234932.r6i5n3.61809.3 rename to emb-norm-14.6k/056-module.17.self_attention.attention_dropout/events.out.tfevents.1638234932.r6i5n3.61809.3 diff --git a/emb-norm-6k/056-module.17.self_attention.dense/events.out.tfevents.1638234932.r6i5n3.61809.4 b/emb-norm-14.6k/056-module.17.self_attention.dense/events.out.tfevents.1638234932.r6i5n3.61809.4 similarity index 100% rename from emb-norm-6k/056-module.17.self_attention.dense/events.out.tfevents.1638234932.r6i5n3.61809.4 rename to emb-norm-14.6k/056-module.17.self_attention.dense/events.out.tfevents.1638234932.r6i5n3.61809.4 diff --git a/emb-norm-6k/056-module.17.self_attention.query_key_value/events.out.tfevents.1638234932.r6i5n3.61809.1 b/emb-norm-14.6k/056-module.17.self_attention.query_key_value/events.out.tfevents.1638234932.r6i5n3.61809.1 similarity index 100% rename from emb-norm-6k/056-module.17.self_attention.query_key_value/events.out.tfevents.1638234932.r6i5n3.61809.1 rename to emb-norm-14.6k/056-module.17.self_attention.query_key_value/events.out.tfevents.1638234932.r6i5n3.61809.1 diff --git a/emb-norm-6k/056-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638234932.r6i5n3.61809.2 b/emb-norm-14.6k/056-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638234932.r6i5n3.61809.2 similarity index 100% rename from emb-norm-6k/056-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638234932.r6i5n3.61809.2 rename to emb-norm-14.6k/056-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638234932.r6i5n3.61809.2 diff --git a/emb-norm-6k/056-module.17.self_attention/events.out.tfevents.1638234932.r6i5n3.61809.5 b/emb-norm-14.6k/056-module.17.self_attention/events.out.tfevents.1638234932.r6i5n3.61809.5 similarity index 100% rename from emb-norm-6k/056-module.17.self_attention/events.out.tfevents.1638234932.r6i5n3.61809.5 rename to emb-norm-14.6k/056-module.17.self_attention/events.out.tfevents.1638234932.r6i5n3.61809.5 diff --git a/emb-norm-6k/056-module.17/events.out.tfevents.1638234933.r6i5n3.61809.10 b/emb-norm-14.6k/056-module.17/events.out.tfevents.1638234933.r6i5n3.61809.10 similarity index 100% rename from emb-norm-6k/056-module.17/events.out.tfevents.1638234933.r6i5n3.61809.10 rename to emb-norm-14.6k/056-module.17/events.out.tfevents.1638234933.r6i5n3.61809.10 diff --git a/emb-norm-6k/056-module.18.input_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.11 b/emb-norm-14.6k/056-module.18.input_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.11 similarity index 100% rename from emb-norm-6k/056-module.18.input_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.11 rename to emb-norm-14.6k/056-module.18.input_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.11 diff --git a/emb-norm-6k/056-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.19 b/emb-norm-14.6k/056-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.19 similarity index 100% rename from emb-norm-6k/056-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.19 rename to emb-norm-14.6k/056-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.19 diff --git a/emb-norm-6k/056-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.18 b/emb-norm-14.6k/056-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.18 similarity index 100% rename from emb-norm-6k/056-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.18 rename to emb-norm-14.6k/056-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.18 diff --git a/emb-norm-6k/056-module.18.mlp/events.out.tfevents.1638234933.r6i5n3.61809.20 b/emb-norm-14.6k/056-module.18.mlp/events.out.tfevents.1638234933.r6i5n3.61809.20 similarity index 100% rename from emb-norm-6k/056-module.18.mlp/events.out.tfevents.1638234933.r6i5n3.61809.20 rename to emb-norm-14.6k/056-module.18.mlp/events.out.tfevents.1638234933.r6i5n3.61809.20 diff --git a/emb-norm-6k/056-module.18.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.17 b/emb-norm-14.6k/056-module.18.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.17 similarity index 100% rename from emb-norm-6k/056-module.18.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.17 rename to emb-norm-14.6k/056-module.18.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.17 diff --git a/emb-norm-6k/056-module.18.self_attention.attention_dropout/events.out.tfevents.1638234933.r6i5n3.61809.14 b/emb-norm-14.6k/056-module.18.self_attention.attention_dropout/events.out.tfevents.1638234933.r6i5n3.61809.14 similarity index 100% rename from emb-norm-6k/056-module.18.self_attention.attention_dropout/events.out.tfevents.1638234933.r6i5n3.61809.14 rename to emb-norm-14.6k/056-module.18.self_attention.attention_dropout/events.out.tfevents.1638234933.r6i5n3.61809.14 diff --git a/emb-norm-6k/056-module.18.self_attention.dense/events.out.tfevents.1638234933.r6i5n3.61809.15 b/emb-norm-14.6k/056-module.18.self_attention.dense/events.out.tfevents.1638234933.r6i5n3.61809.15 similarity index 100% rename from emb-norm-6k/056-module.18.self_attention.dense/events.out.tfevents.1638234933.r6i5n3.61809.15 rename to emb-norm-14.6k/056-module.18.self_attention.dense/events.out.tfevents.1638234933.r6i5n3.61809.15 diff --git a/emb-norm-6k/056-module.18.self_attention.query_key_value/events.out.tfevents.1638234933.r6i5n3.61809.12 b/emb-norm-14.6k/056-module.18.self_attention.query_key_value/events.out.tfevents.1638234933.r6i5n3.61809.12 similarity index 100% rename from emb-norm-6k/056-module.18.self_attention.query_key_value/events.out.tfevents.1638234933.r6i5n3.61809.12 rename to emb-norm-14.6k/056-module.18.self_attention.query_key_value/events.out.tfevents.1638234933.r6i5n3.61809.12 diff --git a/emb-norm-6k/056-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638234933.r6i5n3.61809.13 b/emb-norm-14.6k/056-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638234933.r6i5n3.61809.13 similarity index 100% rename from emb-norm-6k/056-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638234933.r6i5n3.61809.13 rename to emb-norm-14.6k/056-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638234933.r6i5n3.61809.13 diff --git a/emb-norm-6k/056-module.18.self_attention/events.out.tfevents.1638234933.r6i5n3.61809.16 b/emb-norm-14.6k/056-module.18.self_attention/events.out.tfevents.1638234933.r6i5n3.61809.16 similarity index 100% rename from emb-norm-6k/056-module.18.self_attention/events.out.tfevents.1638234933.r6i5n3.61809.16 rename to emb-norm-14.6k/056-module.18.self_attention/events.out.tfevents.1638234933.r6i5n3.61809.16 diff --git a/emb-norm-6k/056-module.18/events.out.tfevents.1638234933.r6i5n3.61809.21 b/emb-norm-14.6k/056-module.18/events.out.tfevents.1638234933.r6i5n3.61809.21 similarity index 100% rename from emb-norm-6k/056-module.18/events.out.tfevents.1638234933.r6i5n3.61809.21 rename to emb-norm-14.6k/056-module.18/events.out.tfevents.1638234933.r6i5n3.61809.21 diff --git a/emb-norm-6k/056-module/events.out.tfevents.1638234933.r6i5n3.61809.22 b/emb-norm-14.6k/056-module/events.out.tfevents.1638234933.r6i5n3.61809.22 similarity index 100% rename from emb-norm-6k/056-module/events.out.tfevents.1638234933.r6i5n3.61809.22 rename to emb-norm-14.6k/056-module/events.out.tfevents.1638234933.r6i5n3.61809.22 diff --git a/emb-norm-6k/120-module.33.input_layernorm/events.out.tfevents.1638234945.r6i7n1.62062.0 b/emb-norm-14.6k/120-module.33.input_layernorm/events.out.tfevents.1638234945.r6i7n1.62062.0 similarity index 100% rename from emb-norm-6k/120-module.33.input_layernorm/events.out.tfevents.1638234945.r6i7n1.62062.0 rename to emb-norm-14.6k/120-module.33.input_layernorm/events.out.tfevents.1638234945.r6i7n1.62062.0 diff --git a/emb-norm-6k/120-module.33.mlp.dense_4h_to_h/events.out.tfevents.1638234946.r6i7n1.62062.8 b/emb-norm-14.6k/120-module.33.mlp.dense_4h_to_h/events.out.tfevents.1638234946.r6i7n1.62062.8 similarity index 100% rename from emb-norm-6k/120-module.33.mlp.dense_4h_to_h/events.out.tfevents.1638234946.r6i7n1.62062.8 rename to emb-norm-14.6k/120-module.33.mlp.dense_4h_to_h/events.out.tfevents.1638234946.r6i7n1.62062.8 diff --git a/emb-norm-6k/120-module.33.mlp.dense_h_to_4h/events.out.tfevents.1638234946.r6i7n1.62062.7 b/emb-norm-14.6k/120-module.33.mlp.dense_h_to_4h/events.out.tfevents.1638234946.r6i7n1.62062.7 similarity index 100% rename from emb-norm-6k/120-module.33.mlp.dense_h_to_4h/events.out.tfevents.1638234946.r6i7n1.62062.7 rename to emb-norm-14.6k/120-module.33.mlp.dense_h_to_4h/events.out.tfevents.1638234946.r6i7n1.62062.7 diff --git a/emb-norm-6k/120-module.33.mlp/events.out.tfevents.1638234946.r6i7n1.62062.9 b/emb-norm-14.6k/120-module.33.mlp/events.out.tfevents.1638234946.r6i7n1.62062.9 similarity index 100% rename from emb-norm-6k/120-module.33.mlp/events.out.tfevents.1638234946.r6i7n1.62062.9 rename to emb-norm-14.6k/120-module.33.mlp/events.out.tfevents.1638234946.r6i7n1.62062.9 diff --git a/emb-norm-6k/120-module.33.post_attention_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.6 b/emb-norm-14.6k/120-module.33.post_attention_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.6 similarity index 100% rename from emb-norm-6k/120-module.33.post_attention_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.6 rename to emb-norm-14.6k/120-module.33.post_attention_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.6 diff --git a/emb-norm-6k/120-module.33.self_attention.attention_dropout/events.out.tfevents.1638234946.r6i7n1.62062.3 b/emb-norm-14.6k/120-module.33.self_attention.attention_dropout/events.out.tfevents.1638234946.r6i7n1.62062.3 similarity index 100% rename from emb-norm-6k/120-module.33.self_attention.attention_dropout/events.out.tfevents.1638234946.r6i7n1.62062.3 rename to emb-norm-14.6k/120-module.33.self_attention.attention_dropout/events.out.tfevents.1638234946.r6i7n1.62062.3 diff --git a/emb-norm-6k/120-module.33.self_attention.dense/events.out.tfevents.1638234946.r6i7n1.62062.4 b/emb-norm-14.6k/120-module.33.self_attention.dense/events.out.tfevents.1638234946.r6i7n1.62062.4 similarity index 100% rename from emb-norm-6k/120-module.33.self_attention.dense/events.out.tfevents.1638234946.r6i7n1.62062.4 rename to emb-norm-14.6k/120-module.33.self_attention.dense/events.out.tfevents.1638234946.r6i7n1.62062.4 diff --git a/emb-norm-6k/120-module.33.self_attention.query_key_value/events.out.tfevents.1638234946.r6i7n1.62062.1 b/emb-norm-14.6k/120-module.33.self_attention.query_key_value/events.out.tfevents.1638234946.r6i7n1.62062.1 similarity index 100% rename from emb-norm-6k/120-module.33.self_attention.query_key_value/events.out.tfevents.1638234946.r6i7n1.62062.1 rename to emb-norm-14.6k/120-module.33.self_attention.query_key_value/events.out.tfevents.1638234946.r6i7n1.62062.1 diff --git a/emb-norm-6k/120-module.33.self_attention.scale_mask_softmax/events.out.tfevents.1638234946.r6i7n1.62062.2 b/emb-norm-14.6k/120-module.33.self_attention.scale_mask_softmax/events.out.tfevents.1638234946.r6i7n1.62062.2 similarity index 100% rename from emb-norm-6k/120-module.33.self_attention.scale_mask_softmax/events.out.tfevents.1638234946.r6i7n1.62062.2 rename to emb-norm-14.6k/120-module.33.self_attention.scale_mask_softmax/events.out.tfevents.1638234946.r6i7n1.62062.2 diff --git a/emb-norm-6k/120-module.33.self_attention/events.out.tfevents.1638234946.r6i7n1.62062.5 b/emb-norm-14.6k/120-module.33.self_attention/events.out.tfevents.1638234946.r6i7n1.62062.5 similarity index 100% rename from emb-norm-6k/120-module.33.self_attention/events.out.tfevents.1638234946.r6i7n1.62062.5 rename to emb-norm-14.6k/120-module.33.self_attention/events.out.tfevents.1638234946.r6i7n1.62062.5 diff --git a/emb-norm-6k/120-module.33/events.out.tfevents.1638234946.r6i7n1.62062.10 b/emb-norm-14.6k/120-module.33/events.out.tfevents.1638234946.r6i7n1.62062.10 similarity index 100% rename from emb-norm-6k/120-module.33/events.out.tfevents.1638234946.r6i7n1.62062.10 rename to emb-norm-14.6k/120-module.33/events.out.tfevents.1638234946.r6i7n1.62062.10 diff --git a/emb-norm-6k/120-module.34.input_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.11 b/emb-norm-14.6k/120-module.34.input_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.11 similarity index 100% rename from emb-norm-6k/120-module.34.input_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.11 rename to emb-norm-14.6k/120-module.34.input_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.11 diff --git a/emb-norm-6k/120-module.34.mlp.dense_4h_to_h/events.out.tfevents.1638234946.r6i7n1.62062.19 b/emb-norm-14.6k/120-module.34.mlp.dense_4h_to_h/events.out.tfevents.1638234946.r6i7n1.62062.19 similarity index 100% rename from emb-norm-6k/120-module.34.mlp.dense_4h_to_h/events.out.tfevents.1638234946.r6i7n1.62062.19 rename to emb-norm-14.6k/120-module.34.mlp.dense_4h_to_h/events.out.tfevents.1638234946.r6i7n1.62062.19 diff --git a/emb-norm-6k/120-module.34.mlp.dense_h_to_4h/events.out.tfevents.1638234946.r6i7n1.62062.18 b/emb-norm-14.6k/120-module.34.mlp.dense_h_to_4h/events.out.tfevents.1638234946.r6i7n1.62062.18 similarity index 100% rename from emb-norm-6k/120-module.34.mlp.dense_h_to_4h/events.out.tfevents.1638234946.r6i7n1.62062.18 rename to emb-norm-14.6k/120-module.34.mlp.dense_h_to_4h/events.out.tfevents.1638234946.r6i7n1.62062.18 diff --git a/emb-norm-6k/120-module.34.mlp/events.out.tfevents.1638234946.r6i7n1.62062.20 b/emb-norm-14.6k/120-module.34.mlp/events.out.tfevents.1638234946.r6i7n1.62062.20 similarity index 100% rename from emb-norm-6k/120-module.34.mlp/events.out.tfevents.1638234946.r6i7n1.62062.20 rename to emb-norm-14.6k/120-module.34.mlp/events.out.tfevents.1638234946.r6i7n1.62062.20 diff --git a/emb-norm-6k/120-module.34.post_attention_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.17 b/emb-norm-14.6k/120-module.34.post_attention_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.17 similarity index 100% rename from emb-norm-6k/120-module.34.post_attention_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.17 rename to emb-norm-14.6k/120-module.34.post_attention_layernorm/events.out.tfevents.1638234946.r6i7n1.62062.17 diff --git a/emb-norm-6k/120-module.34.self_attention.attention_dropout/events.out.tfevents.1638234946.r6i7n1.62062.14 b/emb-norm-14.6k/120-module.34.self_attention.attention_dropout/events.out.tfevents.1638234946.r6i7n1.62062.14 similarity index 100% rename from emb-norm-6k/120-module.34.self_attention.attention_dropout/events.out.tfevents.1638234946.r6i7n1.62062.14 rename to emb-norm-14.6k/120-module.34.self_attention.attention_dropout/events.out.tfevents.1638234946.r6i7n1.62062.14 diff --git a/emb-norm-6k/120-module.34.self_attention.dense/events.out.tfevents.1638234946.r6i7n1.62062.15 b/emb-norm-14.6k/120-module.34.self_attention.dense/events.out.tfevents.1638234946.r6i7n1.62062.15 similarity index 100% rename from emb-norm-6k/120-module.34.self_attention.dense/events.out.tfevents.1638234946.r6i7n1.62062.15 rename to emb-norm-14.6k/120-module.34.self_attention.dense/events.out.tfevents.1638234946.r6i7n1.62062.15 diff --git a/emb-norm-6k/120-module.34.self_attention.query_key_value/events.out.tfevents.1638234946.r6i7n1.62062.12 b/emb-norm-14.6k/120-module.34.self_attention.query_key_value/events.out.tfevents.1638234946.r6i7n1.62062.12 similarity index 100% rename from emb-norm-6k/120-module.34.self_attention.query_key_value/events.out.tfevents.1638234946.r6i7n1.62062.12 rename to emb-norm-14.6k/120-module.34.self_attention.query_key_value/events.out.tfevents.1638234946.r6i7n1.62062.12 diff --git a/emb-norm-6k/120-module.34.self_attention.scale_mask_softmax/events.out.tfevents.1638234946.r6i7n1.62062.13 b/emb-norm-14.6k/120-module.34.self_attention.scale_mask_softmax/events.out.tfevents.1638234946.r6i7n1.62062.13 similarity index 100% rename from emb-norm-6k/120-module.34.self_attention.scale_mask_softmax/events.out.tfevents.1638234946.r6i7n1.62062.13 rename to emb-norm-14.6k/120-module.34.self_attention.scale_mask_softmax/events.out.tfevents.1638234946.r6i7n1.62062.13 diff --git a/emb-norm-6k/120-module.34.self_attention/events.out.tfevents.1638234946.r6i7n1.62062.16 b/emb-norm-14.6k/120-module.34.self_attention/events.out.tfevents.1638234946.r6i7n1.62062.16 similarity index 100% rename from emb-norm-6k/120-module.34.self_attention/events.out.tfevents.1638234946.r6i7n1.62062.16 rename to emb-norm-14.6k/120-module.34.self_attention/events.out.tfevents.1638234946.r6i7n1.62062.16 diff --git a/emb-norm-6k/120-module.34/events.out.tfevents.1638234946.r6i7n1.62062.21 b/emb-norm-14.6k/120-module.34/events.out.tfevents.1638234946.r6i7n1.62062.21 similarity index 100% rename from emb-norm-6k/120-module.34/events.out.tfevents.1638234946.r6i7n1.62062.21 rename to emb-norm-14.6k/120-module.34/events.out.tfevents.1638234946.r6i7n1.62062.21 diff --git a/emb-norm-6k/120-module/events.out.tfevents.1638234946.r6i7n1.62062.22 b/emb-norm-14.6k/120-module/events.out.tfevents.1638234946.r6i7n1.62062.22 similarity index 100% rename from emb-norm-6k/120-module/events.out.tfevents.1638234946.r6i7n1.62062.22 rename to emb-norm-14.6k/120-module/events.out.tfevents.1638234946.r6i7n1.62062.22 diff --git a/emb-norm-6k/184-module.49.input_layernorm/events.out.tfevents.1638234959.r7i1n0.2708147.0 b/emb-norm-14.6k/184-module.49.input_layernorm/events.out.tfevents.1638234959.r7i1n0.2708147.0 similarity index 100% rename from emb-norm-6k/184-module.49.input_layernorm/events.out.tfevents.1638234959.r7i1n0.2708147.0 rename to emb-norm-14.6k/184-module.49.input_layernorm/events.out.tfevents.1638234959.r7i1n0.2708147.0 diff --git a/emb-norm-6k/184-module.49.mlp.dense_4h_to_h/events.out.tfevents.1638234960.r7i1n0.2708147.8 b/emb-norm-14.6k/184-module.49.mlp.dense_4h_to_h/events.out.tfevents.1638234960.r7i1n0.2708147.8 similarity index 100% rename from emb-norm-6k/184-module.49.mlp.dense_4h_to_h/events.out.tfevents.1638234960.r7i1n0.2708147.8 rename to emb-norm-14.6k/184-module.49.mlp.dense_4h_to_h/events.out.tfevents.1638234960.r7i1n0.2708147.8 diff --git a/emb-norm-6k/184-module.49.mlp.dense_h_to_4h/events.out.tfevents.1638234960.r7i1n0.2708147.7 b/emb-norm-14.6k/184-module.49.mlp.dense_h_to_4h/events.out.tfevents.1638234960.r7i1n0.2708147.7 similarity index 100% rename from emb-norm-6k/184-module.49.mlp.dense_h_to_4h/events.out.tfevents.1638234960.r7i1n0.2708147.7 rename to emb-norm-14.6k/184-module.49.mlp.dense_h_to_4h/events.out.tfevents.1638234960.r7i1n0.2708147.7 diff --git a/emb-norm-6k/184-module.49.mlp/events.out.tfevents.1638234960.r7i1n0.2708147.9 b/emb-norm-14.6k/184-module.49.mlp/events.out.tfevents.1638234960.r7i1n0.2708147.9 similarity index 100% rename from emb-norm-6k/184-module.49.mlp/events.out.tfevents.1638234960.r7i1n0.2708147.9 rename to emb-norm-14.6k/184-module.49.mlp/events.out.tfevents.1638234960.r7i1n0.2708147.9 diff --git a/emb-norm-6k/184-module.49.post_attention_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.6 b/emb-norm-14.6k/184-module.49.post_attention_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.6 similarity index 100% rename from emb-norm-6k/184-module.49.post_attention_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.6 rename to emb-norm-14.6k/184-module.49.post_attention_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.6 diff --git a/emb-norm-6k/184-module.49.self_attention.attention_dropout/events.out.tfevents.1638234959.r7i1n0.2708147.3 b/emb-norm-14.6k/184-module.49.self_attention.attention_dropout/events.out.tfevents.1638234959.r7i1n0.2708147.3 similarity index 100% rename from emb-norm-6k/184-module.49.self_attention.attention_dropout/events.out.tfevents.1638234959.r7i1n0.2708147.3 rename to emb-norm-14.6k/184-module.49.self_attention.attention_dropout/events.out.tfevents.1638234959.r7i1n0.2708147.3 diff --git a/emb-norm-6k/184-module.49.self_attention.dense/events.out.tfevents.1638234959.r7i1n0.2708147.4 b/emb-norm-14.6k/184-module.49.self_attention.dense/events.out.tfevents.1638234959.r7i1n0.2708147.4 similarity index 100% rename from emb-norm-6k/184-module.49.self_attention.dense/events.out.tfevents.1638234959.r7i1n0.2708147.4 rename to emb-norm-14.6k/184-module.49.self_attention.dense/events.out.tfevents.1638234959.r7i1n0.2708147.4 diff --git a/emb-norm-6k/184-module.49.self_attention.query_key_value/events.out.tfevents.1638234959.r7i1n0.2708147.1 b/emb-norm-14.6k/184-module.49.self_attention.query_key_value/events.out.tfevents.1638234959.r7i1n0.2708147.1 similarity index 100% rename from emb-norm-6k/184-module.49.self_attention.query_key_value/events.out.tfevents.1638234959.r7i1n0.2708147.1 rename to emb-norm-14.6k/184-module.49.self_attention.query_key_value/events.out.tfevents.1638234959.r7i1n0.2708147.1 diff --git a/emb-norm-6k/184-module.49.self_attention.scale_mask_softmax/events.out.tfevents.1638234959.r7i1n0.2708147.2 b/emb-norm-14.6k/184-module.49.self_attention.scale_mask_softmax/events.out.tfevents.1638234959.r7i1n0.2708147.2 similarity index 100% rename from emb-norm-6k/184-module.49.self_attention.scale_mask_softmax/events.out.tfevents.1638234959.r7i1n0.2708147.2 rename to emb-norm-14.6k/184-module.49.self_attention.scale_mask_softmax/events.out.tfevents.1638234959.r7i1n0.2708147.2 diff --git a/emb-norm-6k/184-module.49.self_attention/events.out.tfevents.1638234959.r7i1n0.2708147.5 b/emb-norm-14.6k/184-module.49.self_attention/events.out.tfevents.1638234959.r7i1n0.2708147.5 similarity index 100% rename from emb-norm-6k/184-module.49.self_attention/events.out.tfevents.1638234959.r7i1n0.2708147.5 rename to emb-norm-14.6k/184-module.49.self_attention/events.out.tfevents.1638234959.r7i1n0.2708147.5 diff --git a/emb-norm-6k/184-module.49/events.out.tfevents.1638234960.r7i1n0.2708147.10 b/emb-norm-14.6k/184-module.49/events.out.tfevents.1638234960.r7i1n0.2708147.10 similarity index 100% rename from emb-norm-6k/184-module.49/events.out.tfevents.1638234960.r7i1n0.2708147.10 rename to emb-norm-14.6k/184-module.49/events.out.tfevents.1638234960.r7i1n0.2708147.10 diff --git a/emb-norm-6k/184-module.50.input_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.11 b/emb-norm-14.6k/184-module.50.input_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.11 similarity index 100% rename from emb-norm-6k/184-module.50.input_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.11 rename to emb-norm-14.6k/184-module.50.input_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.11 diff --git a/emb-norm-6k/184-module.50.mlp.dense_4h_to_h/events.out.tfevents.1638234960.r7i1n0.2708147.19 b/emb-norm-14.6k/184-module.50.mlp.dense_4h_to_h/events.out.tfevents.1638234960.r7i1n0.2708147.19 similarity index 100% rename from emb-norm-6k/184-module.50.mlp.dense_4h_to_h/events.out.tfevents.1638234960.r7i1n0.2708147.19 rename to emb-norm-14.6k/184-module.50.mlp.dense_4h_to_h/events.out.tfevents.1638234960.r7i1n0.2708147.19 diff --git a/emb-norm-6k/184-module.50.mlp.dense_h_to_4h/events.out.tfevents.1638234960.r7i1n0.2708147.18 b/emb-norm-14.6k/184-module.50.mlp.dense_h_to_4h/events.out.tfevents.1638234960.r7i1n0.2708147.18 similarity index 100% rename from emb-norm-6k/184-module.50.mlp.dense_h_to_4h/events.out.tfevents.1638234960.r7i1n0.2708147.18 rename to emb-norm-14.6k/184-module.50.mlp.dense_h_to_4h/events.out.tfevents.1638234960.r7i1n0.2708147.18 diff --git a/emb-norm-6k/184-module.50.mlp/events.out.tfevents.1638234960.r7i1n0.2708147.20 b/emb-norm-14.6k/184-module.50.mlp/events.out.tfevents.1638234960.r7i1n0.2708147.20 similarity index 100% rename from emb-norm-6k/184-module.50.mlp/events.out.tfevents.1638234960.r7i1n0.2708147.20 rename to emb-norm-14.6k/184-module.50.mlp/events.out.tfevents.1638234960.r7i1n0.2708147.20 diff --git a/emb-norm-6k/184-module.50.post_attention_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.17 b/emb-norm-14.6k/184-module.50.post_attention_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.17 similarity index 100% rename from emb-norm-6k/184-module.50.post_attention_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.17 rename to emb-norm-14.6k/184-module.50.post_attention_layernorm/events.out.tfevents.1638234960.r7i1n0.2708147.17 diff --git a/emb-norm-6k/184-module.50.self_attention.attention_dropout/events.out.tfevents.1638234960.r7i1n0.2708147.14 b/emb-norm-14.6k/184-module.50.self_attention.attention_dropout/events.out.tfevents.1638234960.r7i1n0.2708147.14 similarity index 100% rename from emb-norm-6k/184-module.50.self_attention.attention_dropout/events.out.tfevents.1638234960.r7i1n0.2708147.14 rename to emb-norm-14.6k/184-module.50.self_attention.attention_dropout/events.out.tfevents.1638234960.r7i1n0.2708147.14 diff --git a/emb-norm-6k/184-module.50.self_attention.dense/events.out.tfevents.1638234960.r7i1n0.2708147.15 b/emb-norm-14.6k/184-module.50.self_attention.dense/events.out.tfevents.1638234960.r7i1n0.2708147.15 similarity index 100% rename from emb-norm-6k/184-module.50.self_attention.dense/events.out.tfevents.1638234960.r7i1n0.2708147.15 rename to emb-norm-14.6k/184-module.50.self_attention.dense/events.out.tfevents.1638234960.r7i1n0.2708147.15 diff --git a/emb-norm-6k/184-module.50.self_attention.query_key_value/events.out.tfevents.1638234960.r7i1n0.2708147.12 b/emb-norm-14.6k/184-module.50.self_attention.query_key_value/events.out.tfevents.1638234960.r7i1n0.2708147.12 similarity index 100% rename from emb-norm-6k/184-module.50.self_attention.query_key_value/events.out.tfevents.1638234960.r7i1n0.2708147.12 rename to emb-norm-14.6k/184-module.50.self_attention.query_key_value/events.out.tfevents.1638234960.r7i1n0.2708147.12 diff --git a/emb-norm-6k/184-module.50.self_attention.scale_mask_softmax/events.out.tfevents.1638234960.r7i1n0.2708147.13 b/emb-norm-14.6k/184-module.50.self_attention.scale_mask_softmax/events.out.tfevents.1638234960.r7i1n0.2708147.13 similarity index 100% rename from emb-norm-6k/184-module.50.self_attention.scale_mask_softmax/events.out.tfevents.1638234960.r7i1n0.2708147.13 rename to emb-norm-14.6k/184-module.50.self_attention.scale_mask_softmax/events.out.tfevents.1638234960.r7i1n0.2708147.13 diff --git a/emb-norm-6k/184-module.50.self_attention/events.out.tfevents.1638234960.r7i1n0.2708147.16 b/emb-norm-14.6k/184-module.50.self_attention/events.out.tfevents.1638234960.r7i1n0.2708147.16 similarity index 100% rename from emb-norm-6k/184-module.50.self_attention/events.out.tfevents.1638234960.r7i1n0.2708147.16 rename to emb-norm-14.6k/184-module.50.self_attention/events.out.tfevents.1638234960.r7i1n0.2708147.16 diff --git a/emb-norm-6k/184-module.50/events.out.tfevents.1638234960.r7i1n0.2708147.21 b/emb-norm-14.6k/184-module.50/events.out.tfevents.1638234960.r7i1n0.2708147.21 similarity index 100% rename from emb-norm-6k/184-module.50/events.out.tfevents.1638234960.r7i1n0.2708147.21 rename to emb-norm-14.6k/184-module.50/events.out.tfevents.1638234960.r7i1n0.2708147.21 diff --git a/emb-norm-6k/184-module/events.out.tfevents.1638234960.r7i1n0.2708147.22 b/emb-norm-14.6k/184-module/events.out.tfevents.1638234960.r7i1n0.2708147.22 similarity index 100% rename from emb-norm-6k/184-module/events.out.tfevents.1638234960.r7i1n0.2708147.22 rename to emb-norm-14.6k/184-module/events.out.tfevents.1638234960.r7i1n0.2708147.22 diff --git a/emb-norm-6k/248-module.65.input_layernorm/events.out.tfevents.1638234972.r7i2n7.3682384.0 b/emb-norm-14.6k/248-module.65.input_layernorm/events.out.tfevents.1638234972.r7i2n7.3682384.0 similarity index 100% rename from emb-norm-6k/248-module.65.input_layernorm/events.out.tfevents.1638234972.r7i2n7.3682384.0 rename to emb-norm-14.6k/248-module.65.input_layernorm/events.out.tfevents.1638234972.r7i2n7.3682384.0 diff --git a/emb-norm-6k/248-module.65.mlp.dense_4h_to_h/events.out.tfevents.1638234973.r7i2n7.3682384.8 b/emb-norm-14.6k/248-module.65.mlp.dense_4h_to_h/events.out.tfevents.1638234973.r7i2n7.3682384.8 similarity index 100% rename from emb-norm-6k/248-module.65.mlp.dense_4h_to_h/events.out.tfevents.1638234973.r7i2n7.3682384.8 rename to emb-norm-14.6k/248-module.65.mlp.dense_4h_to_h/events.out.tfevents.1638234973.r7i2n7.3682384.8 diff --git a/emb-norm-6k/248-module.65.mlp.dense_h_to_4h/events.out.tfevents.1638234973.r7i2n7.3682384.7 b/emb-norm-14.6k/248-module.65.mlp.dense_h_to_4h/events.out.tfevents.1638234973.r7i2n7.3682384.7 similarity index 100% rename from emb-norm-6k/248-module.65.mlp.dense_h_to_4h/events.out.tfevents.1638234973.r7i2n7.3682384.7 rename to emb-norm-14.6k/248-module.65.mlp.dense_h_to_4h/events.out.tfevents.1638234973.r7i2n7.3682384.7 diff --git a/emb-norm-6k/248-module.65.mlp/events.out.tfevents.1638234973.r7i2n7.3682384.9 b/emb-norm-14.6k/248-module.65.mlp/events.out.tfevents.1638234973.r7i2n7.3682384.9 similarity index 100% rename from emb-norm-6k/248-module.65.mlp/events.out.tfevents.1638234973.r7i2n7.3682384.9 rename to emb-norm-14.6k/248-module.65.mlp/events.out.tfevents.1638234973.r7i2n7.3682384.9 diff --git a/emb-norm-6k/248-module.65.post_attention_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.6 b/emb-norm-14.6k/248-module.65.post_attention_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.6 similarity index 100% rename from emb-norm-6k/248-module.65.post_attention_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.6 rename to emb-norm-14.6k/248-module.65.post_attention_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.6 diff --git a/emb-norm-6k/248-module.65.self_attention.attention_dropout/events.out.tfevents.1638234973.r7i2n7.3682384.3 b/emb-norm-14.6k/248-module.65.self_attention.attention_dropout/events.out.tfevents.1638234973.r7i2n7.3682384.3 similarity index 100% rename from emb-norm-6k/248-module.65.self_attention.attention_dropout/events.out.tfevents.1638234973.r7i2n7.3682384.3 rename to emb-norm-14.6k/248-module.65.self_attention.attention_dropout/events.out.tfevents.1638234973.r7i2n7.3682384.3 diff --git a/emb-norm-6k/248-module.65.self_attention.dense/events.out.tfevents.1638234973.r7i2n7.3682384.4 b/emb-norm-14.6k/248-module.65.self_attention.dense/events.out.tfevents.1638234973.r7i2n7.3682384.4 similarity index 100% rename from emb-norm-6k/248-module.65.self_attention.dense/events.out.tfevents.1638234973.r7i2n7.3682384.4 rename to emb-norm-14.6k/248-module.65.self_attention.dense/events.out.tfevents.1638234973.r7i2n7.3682384.4 diff --git a/emb-norm-6k/248-module.65.self_attention.query_key_value/events.out.tfevents.1638234973.r7i2n7.3682384.1 b/emb-norm-14.6k/248-module.65.self_attention.query_key_value/events.out.tfevents.1638234973.r7i2n7.3682384.1 similarity index 100% rename from emb-norm-6k/248-module.65.self_attention.query_key_value/events.out.tfevents.1638234973.r7i2n7.3682384.1 rename to emb-norm-14.6k/248-module.65.self_attention.query_key_value/events.out.tfevents.1638234973.r7i2n7.3682384.1 diff --git a/emb-norm-6k/248-module.65.self_attention.scale_mask_softmax/events.out.tfevents.1638234973.r7i2n7.3682384.2 b/emb-norm-14.6k/248-module.65.self_attention.scale_mask_softmax/events.out.tfevents.1638234973.r7i2n7.3682384.2 similarity index 100% rename from emb-norm-6k/248-module.65.self_attention.scale_mask_softmax/events.out.tfevents.1638234973.r7i2n7.3682384.2 rename to emb-norm-14.6k/248-module.65.self_attention.scale_mask_softmax/events.out.tfevents.1638234973.r7i2n7.3682384.2 diff --git a/emb-norm-6k/248-module.65.self_attention/events.out.tfevents.1638234973.r7i2n7.3682384.5 b/emb-norm-14.6k/248-module.65.self_attention/events.out.tfevents.1638234973.r7i2n7.3682384.5 similarity index 100% rename from emb-norm-6k/248-module.65.self_attention/events.out.tfevents.1638234973.r7i2n7.3682384.5 rename to emb-norm-14.6k/248-module.65.self_attention/events.out.tfevents.1638234973.r7i2n7.3682384.5 diff --git a/emb-norm-6k/248-module.65/events.out.tfevents.1638234973.r7i2n7.3682384.10 b/emb-norm-14.6k/248-module.65/events.out.tfevents.1638234973.r7i2n7.3682384.10 similarity index 100% rename from emb-norm-6k/248-module.65/events.out.tfevents.1638234973.r7i2n7.3682384.10 rename to emb-norm-14.6k/248-module.65/events.out.tfevents.1638234973.r7i2n7.3682384.10 diff --git a/emb-norm-6k/248-module.66.input_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.11 b/emb-norm-14.6k/248-module.66.input_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.11 similarity index 100% rename from emb-norm-6k/248-module.66.input_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.11 rename to emb-norm-14.6k/248-module.66.input_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.11 diff --git a/emb-norm-6k/248-module.66.mlp.dense_4h_to_h/events.out.tfevents.1638234973.r7i2n7.3682384.19 b/emb-norm-14.6k/248-module.66.mlp.dense_4h_to_h/events.out.tfevents.1638234973.r7i2n7.3682384.19 similarity index 100% rename from emb-norm-6k/248-module.66.mlp.dense_4h_to_h/events.out.tfevents.1638234973.r7i2n7.3682384.19 rename to emb-norm-14.6k/248-module.66.mlp.dense_4h_to_h/events.out.tfevents.1638234973.r7i2n7.3682384.19 diff --git a/emb-norm-6k/248-module.66.mlp.dense_h_to_4h/events.out.tfevents.1638234973.r7i2n7.3682384.18 b/emb-norm-14.6k/248-module.66.mlp.dense_h_to_4h/events.out.tfevents.1638234973.r7i2n7.3682384.18 similarity index 100% rename from emb-norm-6k/248-module.66.mlp.dense_h_to_4h/events.out.tfevents.1638234973.r7i2n7.3682384.18 rename to emb-norm-14.6k/248-module.66.mlp.dense_h_to_4h/events.out.tfevents.1638234973.r7i2n7.3682384.18 diff --git a/emb-norm-6k/248-module.66.mlp/events.out.tfevents.1638234973.r7i2n7.3682384.20 b/emb-norm-14.6k/248-module.66.mlp/events.out.tfevents.1638234973.r7i2n7.3682384.20 similarity index 100% rename from emb-norm-6k/248-module.66.mlp/events.out.tfevents.1638234973.r7i2n7.3682384.20 rename to emb-norm-14.6k/248-module.66.mlp/events.out.tfevents.1638234973.r7i2n7.3682384.20 diff --git a/emb-norm-6k/248-module.66.post_attention_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.17 b/emb-norm-14.6k/248-module.66.post_attention_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.17 similarity index 100% rename from emb-norm-6k/248-module.66.post_attention_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.17 rename to emb-norm-14.6k/248-module.66.post_attention_layernorm/events.out.tfevents.1638234973.r7i2n7.3682384.17 diff --git a/emb-norm-6k/248-module.66.self_attention.attention_dropout/events.out.tfevents.1638234973.r7i2n7.3682384.14 b/emb-norm-14.6k/248-module.66.self_attention.attention_dropout/events.out.tfevents.1638234973.r7i2n7.3682384.14 similarity index 100% rename from emb-norm-6k/248-module.66.self_attention.attention_dropout/events.out.tfevents.1638234973.r7i2n7.3682384.14 rename to emb-norm-14.6k/248-module.66.self_attention.attention_dropout/events.out.tfevents.1638234973.r7i2n7.3682384.14 diff --git a/emb-norm-6k/248-module.66.self_attention.dense/events.out.tfevents.1638234973.r7i2n7.3682384.15 b/emb-norm-14.6k/248-module.66.self_attention.dense/events.out.tfevents.1638234973.r7i2n7.3682384.15 similarity index 100% rename from emb-norm-6k/248-module.66.self_attention.dense/events.out.tfevents.1638234973.r7i2n7.3682384.15 rename to emb-norm-14.6k/248-module.66.self_attention.dense/events.out.tfevents.1638234973.r7i2n7.3682384.15 diff --git a/emb-norm-6k/248-module.66.self_attention.query_key_value/events.out.tfevents.1638234973.r7i2n7.3682384.12 b/emb-norm-14.6k/248-module.66.self_attention.query_key_value/events.out.tfevents.1638234973.r7i2n7.3682384.12 similarity index 100% rename from emb-norm-6k/248-module.66.self_attention.query_key_value/events.out.tfevents.1638234973.r7i2n7.3682384.12 rename to emb-norm-14.6k/248-module.66.self_attention.query_key_value/events.out.tfevents.1638234973.r7i2n7.3682384.12 diff --git a/emb-norm-6k/248-module.66.self_attention.scale_mask_softmax/events.out.tfevents.1638234973.r7i2n7.3682384.13 b/emb-norm-14.6k/248-module.66.self_attention.scale_mask_softmax/events.out.tfevents.1638234973.r7i2n7.3682384.13 similarity index 100% rename from emb-norm-6k/248-module.66.self_attention.scale_mask_softmax/events.out.tfevents.1638234973.r7i2n7.3682384.13 rename to emb-norm-14.6k/248-module.66.self_attention.scale_mask_softmax/events.out.tfevents.1638234973.r7i2n7.3682384.13 diff --git a/emb-norm-6k/248-module.66.self_attention/events.out.tfevents.1638234973.r7i2n7.3682384.16 b/emb-norm-14.6k/248-module.66.self_attention/events.out.tfevents.1638234973.r7i2n7.3682384.16 similarity index 100% rename from emb-norm-6k/248-module.66.self_attention/events.out.tfevents.1638234973.r7i2n7.3682384.16 rename to emb-norm-14.6k/248-module.66.self_attention/events.out.tfevents.1638234973.r7i2n7.3682384.16 diff --git a/emb-norm-6k/248-module.66/events.out.tfevents.1638234973.r7i2n7.3682384.21 b/emb-norm-14.6k/248-module.66/events.out.tfevents.1638234973.r7i2n7.3682384.21 similarity index 100% rename from emb-norm-6k/248-module.66/events.out.tfevents.1638234973.r7i2n7.3682384.21 rename to emb-norm-14.6k/248-module.66/events.out.tfevents.1638234973.r7i2n7.3682384.21 diff --git a/emb-norm-6k/248-module.68/events.out.tfevents.1638234973.r7i2n7.3682384.22 b/emb-norm-14.6k/248-module.68/events.out.tfevents.1638234973.r7i2n7.3682384.22 similarity index 100% rename from emb-norm-6k/248-module.68/events.out.tfevents.1638234973.r7i2n7.3682384.22 rename to emb-norm-14.6k/248-module.68/events.out.tfevents.1638234973.r7i2n7.3682384.22 diff --git a/emb-norm-6k/248-module/events.out.tfevents.1638234973.r7i2n7.3682384.23 b/emb-norm-14.6k/248-module/events.out.tfevents.1638234973.r7i2n7.3682384.23 similarity index 100% rename from emb-norm-6k/248-module/events.out.tfevents.1638234973.r7i2n7.3682384.23 rename to emb-norm-14.6k/248-module/events.out.tfevents.1638234973.r7i2n7.3682384.23 diff --git a/emb-norm-15k/000-module.3.input_layernorm/events.out.tfevents.1637404942.r6i5n3.394761.5 b/emb-norm-6.6k/000-module.3.input_layernorm/events.out.tfevents.1637404942.r6i5n3.394761.5 similarity index 100% rename from emb-norm-15k/000-module.3.input_layernorm/events.out.tfevents.1637404942.r6i5n3.394761.5 rename to emb-norm-6.6k/000-module.3.input_layernorm/events.out.tfevents.1637404942.r6i5n3.394761.5 diff --git a/emb-norm-15k/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1637404943.r6i5n3.394761.13 b/emb-norm-6.6k/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1637404943.r6i5n3.394761.13 similarity index 100% rename from emb-norm-15k/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1637404943.r6i5n3.394761.13 rename to emb-norm-6.6k/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1637404943.r6i5n3.394761.13 diff --git a/emb-norm-15k/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1637404943.r6i5n3.394761.12 b/emb-norm-6.6k/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1637404943.r6i5n3.394761.12 similarity index 100% rename from emb-norm-15k/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1637404943.r6i5n3.394761.12 rename to emb-norm-6.6k/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1637404943.r6i5n3.394761.12 diff --git a/emb-norm-15k/000-module.3.mlp/events.out.tfevents.1637404943.r6i5n3.394761.14 b/emb-norm-6.6k/000-module.3.mlp/events.out.tfevents.1637404943.r6i5n3.394761.14 similarity index 100% rename from emb-norm-15k/000-module.3.mlp/events.out.tfevents.1637404943.r6i5n3.394761.14 rename to emb-norm-6.6k/000-module.3.mlp/events.out.tfevents.1637404943.r6i5n3.394761.14 diff --git a/emb-norm-15k/000-module.3.post_attention_layernorm/events.out.tfevents.1637404943.r6i5n3.394761.11 b/emb-norm-6.6k/000-module.3.post_attention_layernorm/events.out.tfevents.1637404943.r6i5n3.394761.11 similarity index 100% rename from emb-norm-15k/000-module.3.post_attention_layernorm/events.out.tfevents.1637404943.r6i5n3.394761.11 rename to emb-norm-6.6k/000-module.3.post_attention_layernorm/events.out.tfevents.1637404943.r6i5n3.394761.11 diff --git a/emb-norm-15k/000-module.3.self_attention.attention_dropout/events.out.tfevents.1637404943.r6i5n3.394761.8 b/emb-norm-6.6k/000-module.3.self_attention.attention_dropout/events.out.tfevents.1637404943.r6i5n3.394761.8 similarity index 100% rename from emb-norm-15k/000-module.3.self_attention.attention_dropout/events.out.tfevents.1637404943.r6i5n3.394761.8 rename to emb-norm-6.6k/000-module.3.self_attention.attention_dropout/events.out.tfevents.1637404943.r6i5n3.394761.8 diff --git a/emb-norm-15k/000-module.3.self_attention.dense/events.out.tfevents.1637404943.r6i5n3.394761.9 b/emb-norm-6.6k/000-module.3.self_attention.dense/events.out.tfevents.1637404943.r6i5n3.394761.9 similarity index 100% rename from emb-norm-15k/000-module.3.self_attention.dense/events.out.tfevents.1637404943.r6i5n3.394761.9 rename to emb-norm-6.6k/000-module.3.self_attention.dense/events.out.tfevents.1637404943.r6i5n3.394761.9 diff --git a/emb-norm-15k/000-module.3.self_attention.query_key_value/events.out.tfevents.1637404943.r6i5n3.394761.6 b/emb-norm-6.6k/000-module.3.self_attention.query_key_value/events.out.tfevents.1637404943.r6i5n3.394761.6 similarity index 100% rename from emb-norm-15k/000-module.3.self_attention.query_key_value/events.out.tfevents.1637404943.r6i5n3.394761.6 rename to emb-norm-6.6k/000-module.3.self_attention.query_key_value/events.out.tfevents.1637404943.r6i5n3.394761.6 diff --git a/emb-norm-15k/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1637404943.r6i5n3.394761.7 b/emb-norm-6.6k/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1637404943.r6i5n3.394761.7 similarity index 100% rename from emb-norm-15k/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1637404943.r6i5n3.394761.7 rename to emb-norm-6.6k/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1637404943.r6i5n3.394761.7 diff --git a/emb-norm-15k/000-module.3.self_attention/events.out.tfevents.1637404943.r6i5n3.394761.10 b/emb-norm-6.6k/000-module.3.self_attention/events.out.tfevents.1637404943.r6i5n3.394761.10 similarity index 100% rename from emb-norm-15k/000-module.3.self_attention/events.out.tfevents.1637404943.r6i5n3.394761.10 rename to emb-norm-6.6k/000-module.3.self_attention/events.out.tfevents.1637404943.r6i5n3.394761.10 diff --git a/emb-norm-15k/000-module.3/events.out.tfevents.1637404944.r6i5n3.394761.15 b/emb-norm-6.6k/000-module.3/events.out.tfevents.1637404944.r6i5n3.394761.15 similarity index 100% rename from emb-norm-15k/000-module.3/events.out.tfevents.1637404944.r6i5n3.394761.15 rename to emb-norm-6.6k/000-module.3/events.out.tfevents.1637404944.r6i5n3.394761.15 diff --git a/emb-norm-15k/000-module.4.input_layernorm/events.out.tfevents.1637404944.r6i5n3.394761.16 b/emb-norm-6.6k/000-module.4.input_layernorm/events.out.tfevents.1637404944.r6i5n3.394761.16 similarity index 100% rename from emb-norm-15k/000-module.4.input_layernorm/events.out.tfevents.1637404944.r6i5n3.394761.16 rename to emb-norm-6.6k/000-module.4.input_layernorm/events.out.tfevents.1637404944.r6i5n3.394761.16 diff --git a/emb-norm-15k/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1637404944.r6i5n3.394761.24 b/emb-norm-6.6k/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1637404944.r6i5n3.394761.24 similarity index 100% rename from emb-norm-15k/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1637404944.r6i5n3.394761.24 rename to emb-norm-6.6k/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1637404944.r6i5n3.394761.24 diff --git a/emb-norm-15k/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1637404944.r6i5n3.394761.23 b/emb-norm-6.6k/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1637404944.r6i5n3.394761.23 similarity index 100% rename from emb-norm-15k/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1637404944.r6i5n3.394761.23 rename to emb-norm-6.6k/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1637404944.r6i5n3.394761.23 diff --git a/emb-norm-15k/000-module.4.mlp/events.out.tfevents.1637404944.r6i5n3.394761.25 b/emb-norm-6.6k/000-module.4.mlp/events.out.tfevents.1637404944.r6i5n3.394761.25 similarity index 100% rename from emb-norm-15k/000-module.4.mlp/events.out.tfevents.1637404944.r6i5n3.394761.25 rename to emb-norm-6.6k/000-module.4.mlp/events.out.tfevents.1637404944.r6i5n3.394761.25 diff --git a/emb-norm-15k/000-module.4.post_attention_layernorm/events.out.tfevents.1637404944.r6i5n3.394761.22 b/emb-norm-6.6k/000-module.4.post_attention_layernorm/events.out.tfevents.1637404944.r6i5n3.394761.22 similarity index 100% rename from emb-norm-15k/000-module.4.post_attention_layernorm/events.out.tfevents.1637404944.r6i5n3.394761.22 rename to emb-norm-6.6k/000-module.4.post_attention_layernorm/events.out.tfevents.1637404944.r6i5n3.394761.22 diff --git a/emb-norm-15k/000-module.4.self_attention.attention_dropout/events.out.tfevents.1637404944.r6i5n3.394761.19 b/emb-norm-6.6k/000-module.4.self_attention.attention_dropout/events.out.tfevents.1637404944.r6i5n3.394761.19 similarity index 100% rename from emb-norm-15k/000-module.4.self_attention.attention_dropout/events.out.tfevents.1637404944.r6i5n3.394761.19 rename to emb-norm-6.6k/000-module.4.self_attention.attention_dropout/events.out.tfevents.1637404944.r6i5n3.394761.19 diff --git a/emb-norm-15k/000-module.4.self_attention.dense/events.out.tfevents.1637404944.r6i5n3.394761.20 b/emb-norm-6.6k/000-module.4.self_attention.dense/events.out.tfevents.1637404944.r6i5n3.394761.20 similarity index 100% rename from emb-norm-15k/000-module.4.self_attention.dense/events.out.tfevents.1637404944.r6i5n3.394761.20 rename to emb-norm-6.6k/000-module.4.self_attention.dense/events.out.tfevents.1637404944.r6i5n3.394761.20 diff --git a/emb-norm-15k/000-module.4.self_attention.query_key_value/events.out.tfevents.1637404944.r6i5n3.394761.17 b/emb-norm-6.6k/000-module.4.self_attention.query_key_value/events.out.tfevents.1637404944.r6i5n3.394761.17 similarity index 100% rename from emb-norm-15k/000-module.4.self_attention.query_key_value/events.out.tfevents.1637404944.r6i5n3.394761.17 rename to emb-norm-6.6k/000-module.4.self_attention.query_key_value/events.out.tfevents.1637404944.r6i5n3.394761.17 diff --git a/emb-norm-15k/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1637404944.r6i5n3.394761.18 b/emb-norm-6.6k/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1637404944.r6i5n3.394761.18 similarity index 100% rename from emb-norm-15k/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1637404944.r6i5n3.394761.18 rename to emb-norm-6.6k/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1637404944.r6i5n3.394761.18 diff --git a/emb-norm-15k/000-module.4.self_attention/events.out.tfevents.1637404944.r6i5n3.394761.21 b/emb-norm-6.6k/000-module.4.self_attention/events.out.tfevents.1637404944.r6i5n3.394761.21 similarity index 100% rename from emb-norm-15k/000-module.4.self_attention/events.out.tfevents.1637404944.r6i5n3.394761.21 rename to emb-norm-6.6k/000-module.4.self_attention/events.out.tfevents.1637404944.r6i5n3.394761.21 diff --git a/emb-norm-15k/000-module.4/events.out.tfevents.1637404944.r6i5n3.394761.26 b/emb-norm-6.6k/000-module.4/events.out.tfevents.1637404944.r6i5n3.394761.26 similarity index 100% rename from emb-norm-15k/000-module.4/events.out.tfevents.1637404944.r6i5n3.394761.26 rename to emb-norm-6.6k/000-module.4/events.out.tfevents.1637404944.r6i5n3.394761.26 diff --git a/emb-norm-15k/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1637404942.r6i5n3.394761.3 b/emb-norm-6.6k/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1637404942.r6i5n3.394761.3 similarity index 100% rename from emb-norm-15k/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1637404942.r6i5n3.394761.3 rename to emb-norm-6.6k/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1637404942.r6i5n3.394761.3 diff --git a/emb-norm-15k/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1637404942.r6i5n3.394761.2 b/emb-norm-6.6k/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1637404942.r6i5n3.394761.2 similarity index 100% rename from emb-norm-15k/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1637404942.r6i5n3.394761.2 rename to emb-norm-6.6k/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1637404942.r6i5n3.394761.2 diff --git a/emb-norm-15k/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1637404942.r6i5n3.394761.0 b/emb-norm-6.6k/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1637404942.r6i5n3.394761.0 similarity index 100% rename from emb-norm-15k/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1637404942.r6i5n3.394761.0 rename to emb-norm-6.6k/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1637404942.r6i5n3.394761.0 diff --git a/emb-norm-15k/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1637404942.r6i5n3.394761.1 b/emb-norm-6.6k/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1637404942.r6i5n3.394761.1 similarity index 100% rename from emb-norm-15k/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1637404942.r6i5n3.394761.1 rename to emb-norm-6.6k/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1637404942.r6i5n3.394761.1 diff --git a/emb-norm-15k/000-module.tied_modules.embed/events.out.tfevents.1637404942.r6i5n3.394761.4 b/emb-norm-6.6k/000-module.tied_modules.embed/events.out.tfevents.1637404942.r6i5n3.394761.4 similarity index 100% rename from emb-norm-15k/000-module.tied_modules.embed/events.out.tfevents.1637404942.r6i5n3.394761.4 rename to emb-norm-6.6k/000-module.tied_modules.embed/events.out.tfevents.1637404942.r6i5n3.394761.4 diff --git a/emb-norm-15k/000-module/events.out.tfevents.1637404944.r6i5n3.394761.27 b/emb-norm-6.6k/000-module/events.out.tfevents.1637404944.r6i5n3.394761.27 similarity index 100% rename from emb-norm-15k/000-module/events.out.tfevents.1637404944.r6i5n3.394761.27 rename to emb-norm-6.6k/000-module/events.out.tfevents.1637404944.r6i5n3.394761.27 diff --git a/emb-norm-15k/028-module.17.input_layernorm/events.out.tfevents.1637404955.r7i5n1.454973.0 b/emb-norm-6.6k/028-module.17.input_layernorm/events.out.tfevents.1637404955.r7i5n1.454973.0 similarity index 100% rename from emb-norm-15k/028-module.17.input_layernorm/events.out.tfevents.1637404955.r7i5n1.454973.0 rename to emb-norm-6.6k/028-module.17.input_layernorm/events.out.tfevents.1637404955.r7i5n1.454973.0 diff --git a/emb-norm-15k/028-module.17.mlp.dense_4h_to_h/events.out.tfevents.1637404956.r7i5n1.454973.8 b/emb-norm-6.6k/028-module.17.mlp.dense_4h_to_h/events.out.tfevents.1637404956.r7i5n1.454973.8 similarity index 100% rename from emb-norm-15k/028-module.17.mlp.dense_4h_to_h/events.out.tfevents.1637404956.r7i5n1.454973.8 rename to emb-norm-6.6k/028-module.17.mlp.dense_4h_to_h/events.out.tfevents.1637404956.r7i5n1.454973.8 diff --git a/emb-norm-15k/028-module.17.mlp.dense_h_to_4h/events.out.tfevents.1637404956.r7i5n1.454973.7 b/emb-norm-6.6k/028-module.17.mlp.dense_h_to_4h/events.out.tfevents.1637404956.r7i5n1.454973.7 similarity index 100% rename from emb-norm-15k/028-module.17.mlp.dense_h_to_4h/events.out.tfevents.1637404956.r7i5n1.454973.7 rename to emb-norm-6.6k/028-module.17.mlp.dense_h_to_4h/events.out.tfevents.1637404956.r7i5n1.454973.7 diff --git a/emb-norm-15k/028-module.17.mlp/events.out.tfevents.1637404956.r7i5n1.454973.9 b/emb-norm-6.6k/028-module.17.mlp/events.out.tfevents.1637404956.r7i5n1.454973.9 similarity index 100% rename from emb-norm-15k/028-module.17.mlp/events.out.tfevents.1637404956.r7i5n1.454973.9 rename to emb-norm-6.6k/028-module.17.mlp/events.out.tfevents.1637404956.r7i5n1.454973.9 diff --git a/emb-norm-15k/028-module.17.post_attention_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.6 b/emb-norm-6.6k/028-module.17.post_attention_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.6 similarity index 100% rename from emb-norm-15k/028-module.17.post_attention_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.6 rename to emb-norm-6.6k/028-module.17.post_attention_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.6 diff --git a/emb-norm-15k/028-module.17.self_attention.attention_dropout/events.out.tfevents.1637404955.r7i5n1.454973.3 b/emb-norm-6.6k/028-module.17.self_attention.attention_dropout/events.out.tfevents.1637404955.r7i5n1.454973.3 similarity index 100% rename from emb-norm-15k/028-module.17.self_attention.attention_dropout/events.out.tfevents.1637404955.r7i5n1.454973.3 rename to emb-norm-6.6k/028-module.17.self_attention.attention_dropout/events.out.tfevents.1637404955.r7i5n1.454973.3 diff --git a/emb-norm-15k/028-module.17.self_attention.dense/events.out.tfevents.1637404955.r7i5n1.454973.4 b/emb-norm-6.6k/028-module.17.self_attention.dense/events.out.tfevents.1637404955.r7i5n1.454973.4 similarity index 100% rename from emb-norm-15k/028-module.17.self_attention.dense/events.out.tfevents.1637404955.r7i5n1.454973.4 rename to emb-norm-6.6k/028-module.17.self_attention.dense/events.out.tfevents.1637404955.r7i5n1.454973.4 diff --git a/emb-norm-15k/028-module.17.self_attention.query_key_value/events.out.tfevents.1637404955.r7i5n1.454973.1 b/emb-norm-6.6k/028-module.17.self_attention.query_key_value/events.out.tfevents.1637404955.r7i5n1.454973.1 similarity index 100% rename from emb-norm-15k/028-module.17.self_attention.query_key_value/events.out.tfevents.1637404955.r7i5n1.454973.1 rename to emb-norm-6.6k/028-module.17.self_attention.query_key_value/events.out.tfevents.1637404955.r7i5n1.454973.1 diff --git a/emb-norm-15k/028-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1637404955.r7i5n1.454973.2 b/emb-norm-6.6k/028-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1637404955.r7i5n1.454973.2 similarity index 100% rename from emb-norm-15k/028-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1637404955.r7i5n1.454973.2 rename to emb-norm-6.6k/028-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1637404955.r7i5n1.454973.2 diff --git a/emb-norm-15k/028-module.17.self_attention/events.out.tfevents.1637404955.r7i5n1.454973.5 b/emb-norm-6.6k/028-module.17.self_attention/events.out.tfevents.1637404955.r7i5n1.454973.5 similarity index 100% rename from emb-norm-15k/028-module.17.self_attention/events.out.tfevents.1637404955.r7i5n1.454973.5 rename to emb-norm-6.6k/028-module.17.self_attention/events.out.tfevents.1637404955.r7i5n1.454973.5 diff --git a/emb-norm-15k/028-module.17/events.out.tfevents.1637404956.r7i5n1.454973.10 b/emb-norm-6.6k/028-module.17/events.out.tfevents.1637404956.r7i5n1.454973.10 similarity index 100% rename from emb-norm-15k/028-module.17/events.out.tfevents.1637404956.r7i5n1.454973.10 rename to emb-norm-6.6k/028-module.17/events.out.tfevents.1637404956.r7i5n1.454973.10 diff --git a/emb-norm-15k/028-module.18.input_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.11 b/emb-norm-6.6k/028-module.18.input_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.11 similarity index 100% rename from emb-norm-15k/028-module.18.input_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.11 rename to emb-norm-6.6k/028-module.18.input_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.11 diff --git a/emb-norm-15k/028-module.18.mlp.dense_4h_to_h/events.out.tfevents.1637404956.r7i5n1.454973.19 b/emb-norm-6.6k/028-module.18.mlp.dense_4h_to_h/events.out.tfevents.1637404956.r7i5n1.454973.19 similarity index 100% rename from emb-norm-15k/028-module.18.mlp.dense_4h_to_h/events.out.tfevents.1637404956.r7i5n1.454973.19 rename to emb-norm-6.6k/028-module.18.mlp.dense_4h_to_h/events.out.tfevents.1637404956.r7i5n1.454973.19 diff --git a/emb-norm-15k/028-module.18.mlp.dense_h_to_4h/events.out.tfevents.1637404956.r7i5n1.454973.18 b/emb-norm-6.6k/028-module.18.mlp.dense_h_to_4h/events.out.tfevents.1637404956.r7i5n1.454973.18 similarity index 100% rename from emb-norm-15k/028-module.18.mlp.dense_h_to_4h/events.out.tfevents.1637404956.r7i5n1.454973.18 rename to emb-norm-6.6k/028-module.18.mlp.dense_h_to_4h/events.out.tfevents.1637404956.r7i5n1.454973.18 diff --git a/emb-norm-15k/028-module.18.mlp/events.out.tfevents.1637404956.r7i5n1.454973.20 b/emb-norm-6.6k/028-module.18.mlp/events.out.tfevents.1637404956.r7i5n1.454973.20 similarity index 100% rename from emb-norm-15k/028-module.18.mlp/events.out.tfevents.1637404956.r7i5n1.454973.20 rename to emb-norm-6.6k/028-module.18.mlp/events.out.tfevents.1637404956.r7i5n1.454973.20 diff --git a/emb-norm-15k/028-module.18.post_attention_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.17 b/emb-norm-6.6k/028-module.18.post_attention_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.17 similarity index 100% rename from emb-norm-15k/028-module.18.post_attention_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.17 rename to emb-norm-6.6k/028-module.18.post_attention_layernorm/events.out.tfevents.1637404956.r7i5n1.454973.17 diff --git a/emb-norm-15k/028-module.18.self_attention.attention_dropout/events.out.tfevents.1637404956.r7i5n1.454973.14 b/emb-norm-6.6k/028-module.18.self_attention.attention_dropout/events.out.tfevents.1637404956.r7i5n1.454973.14 similarity index 100% rename from emb-norm-15k/028-module.18.self_attention.attention_dropout/events.out.tfevents.1637404956.r7i5n1.454973.14 rename to emb-norm-6.6k/028-module.18.self_attention.attention_dropout/events.out.tfevents.1637404956.r7i5n1.454973.14 diff --git a/emb-norm-15k/028-module.18.self_attention.dense/events.out.tfevents.1637404956.r7i5n1.454973.15 b/emb-norm-6.6k/028-module.18.self_attention.dense/events.out.tfevents.1637404956.r7i5n1.454973.15 similarity index 100% rename from emb-norm-15k/028-module.18.self_attention.dense/events.out.tfevents.1637404956.r7i5n1.454973.15 rename to emb-norm-6.6k/028-module.18.self_attention.dense/events.out.tfevents.1637404956.r7i5n1.454973.15 diff --git a/emb-norm-15k/028-module.18.self_attention.query_key_value/events.out.tfevents.1637404956.r7i5n1.454973.12 b/emb-norm-6.6k/028-module.18.self_attention.query_key_value/events.out.tfevents.1637404956.r7i5n1.454973.12 similarity index 100% rename from emb-norm-15k/028-module.18.self_attention.query_key_value/events.out.tfevents.1637404956.r7i5n1.454973.12 rename to emb-norm-6.6k/028-module.18.self_attention.query_key_value/events.out.tfevents.1637404956.r7i5n1.454973.12 diff --git a/emb-norm-15k/028-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1637404956.r7i5n1.454973.13 b/emb-norm-6.6k/028-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1637404956.r7i5n1.454973.13 similarity index 100% rename from emb-norm-15k/028-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1637404956.r7i5n1.454973.13 rename to emb-norm-6.6k/028-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1637404956.r7i5n1.454973.13 diff --git a/emb-norm-15k/028-module.18.self_attention/events.out.tfevents.1637404956.r7i5n1.454973.16 b/emb-norm-6.6k/028-module.18.self_attention/events.out.tfevents.1637404956.r7i5n1.454973.16 similarity index 100% rename from emb-norm-15k/028-module.18.self_attention/events.out.tfevents.1637404956.r7i5n1.454973.16 rename to emb-norm-6.6k/028-module.18.self_attention/events.out.tfevents.1637404956.r7i5n1.454973.16 diff --git a/emb-norm-15k/028-module.18/events.out.tfevents.1637404956.r7i5n1.454973.21 b/emb-norm-6.6k/028-module.18/events.out.tfevents.1637404956.r7i5n1.454973.21 similarity index 100% rename from emb-norm-15k/028-module.18/events.out.tfevents.1637404956.r7i5n1.454973.21 rename to emb-norm-6.6k/028-module.18/events.out.tfevents.1637404956.r7i5n1.454973.21 diff --git a/emb-norm-15k/028-module/events.out.tfevents.1637404956.r7i5n1.454973.22 b/emb-norm-6.6k/028-module/events.out.tfevents.1637404956.r7i5n1.454973.22 similarity index 100% rename from emb-norm-15k/028-module/events.out.tfevents.1637404956.r7i5n1.454973.22 rename to emb-norm-6.6k/028-module/events.out.tfevents.1637404956.r7i5n1.454973.22 diff --git a/emb-norm-15k/060-module.33.input_layernorm/events.out.tfevents.1637404969.r8i1n6.1395687.0 b/emb-norm-6.6k/060-module.33.input_layernorm/events.out.tfevents.1637404969.r8i1n6.1395687.0 similarity index 100% rename from emb-norm-15k/060-module.33.input_layernorm/events.out.tfevents.1637404969.r8i1n6.1395687.0 rename to emb-norm-6.6k/060-module.33.input_layernorm/events.out.tfevents.1637404969.r8i1n6.1395687.0 diff --git a/emb-norm-15k/060-module.33.mlp.dense_4h_to_h/events.out.tfevents.1637404970.r8i1n6.1395687.8 b/emb-norm-6.6k/060-module.33.mlp.dense_4h_to_h/events.out.tfevents.1637404970.r8i1n6.1395687.8 similarity index 100% rename from emb-norm-15k/060-module.33.mlp.dense_4h_to_h/events.out.tfevents.1637404970.r8i1n6.1395687.8 rename to emb-norm-6.6k/060-module.33.mlp.dense_4h_to_h/events.out.tfevents.1637404970.r8i1n6.1395687.8 diff --git a/emb-norm-15k/060-module.33.mlp.dense_h_to_4h/events.out.tfevents.1637404970.r8i1n6.1395687.7 b/emb-norm-6.6k/060-module.33.mlp.dense_h_to_4h/events.out.tfevents.1637404970.r8i1n6.1395687.7 similarity index 100% rename from emb-norm-15k/060-module.33.mlp.dense_h_to_4h/events.out.tfevents.1637404970.r8i1n6.1395687.7 rename to emb-norm-6.6k/060-module.33.mlp.dense_h_to_4h/events.out.tfevents.1637404970.r8i1n6.1395687.7 diff --git a/emb-norm-15k/060-module.33.mlp/events.out.tfevents.1637404970.r8i1n6.1395687.9 b/emb-norm-6.6k/060-module.33.mlp/events.out.tfevents.1637404970.r8i1n6.1395687.9 similarity index 100% rename from emb-norm-15k/060-module.33.mlp/events.out.tfevents.1637404970.r8i1n6.1395687.9 rename to emb-norm-6.6k/060-module.33.mlp/events.out.tfevents.1637404970.r8i1n6.1395687.9 diff --git a/emb-norm-15k/060-module.33.post_attention_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.6 b/emb-norm-6.6k/060-module.33.post_attention_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.6 similarity index 100% rename from emb-norm-15k/060-module.33.post_attention_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.6 rename to emb-norm-6.6k/060-module.33.post_attention_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.6 diff --git a/emb-norm-15k/060-module.33.self_attention.attention_dropout/events.out.tfevents.1637404969.r8i1n6.1395687.3 b/emb-norm-6.6k/060-module.33.self_attention.attention_dropout/events.out.tfevents.1637404969.r8i1n6.1395687.3 similarity index 100% rename from emb-norm-15k/060-module.33.self_attention.attention_dropout/events.out.tfevents.1637404969.r8i1n6.1395687.3 rename to emb-norm-6.6k/060-module.33.self_attention.attention_dropout/events.out.tfevents.1637404969.r8i1n6.1395687.3 diff --git a/emb-norm-15k/060-module.33.self_attention.dense/events.out.tfevents.1637404969.r8i1n6.1395687.4 b/emb-norm-6.6k/060-module.33.self_attention.dense/events.out.tfevents.1637404969.r8i1n6.1395687.4 similarity index 100% rename from emb-norm-15k/060-module.33.self_attention.dense/events.out.tfevents.1637404969.r8i1n6.1395687.4 rename to emb-norm-6.6k/060-module.33.self_attention.dense/events.out.tfevents.1637404969.r8i1n6.1395687.4 diff --git a/emb-norm-15k/060-module.33.self_attention.query_key_value/events.out.tfevents.1637404969.r8i1n6.1395687.1 b/emb-norm-6.6k/060-module.33.self_attention.query_key_value/events.out.tfevents.1637404969.r8i1n6.1395687.1 similarity index 100% rename from emb-norm-15k/060-module.33.self_attention.query_key_value/events.out.tfevents.1637404969.r8i1n6.1395687.1 rename to emb-norm-6.6k/060-module.33.self_attention.query_key_value/events.out.tfevents.1637404969.r8i1n6.1395687.1 diff --git a/emb-norm-15k/060-module.33.self_attention.scale_mask_softmax/events.out.tfevents.1637404969.r8i1n6.1395687.2 b/emb-norm-6.6k/060-module.33.self_attention.scale_mask_softmax/events.out.tfevents.1637404969.r8i1n6.1395687.2 similarity index 100% rename from emb-norm-15k/060-module.33.self_attention.scale_mask_softmax/events.out.tfevents.1637404969.r8i1n6.1395687.2 rename to emb-norm-6.6k/060-module.33.self_attention.scale_mask_softmax/events.out.tfevents.1637404969.r8i1n6.1395687.2 diff --git a/emb-norm-15k/060-module.33.self_attention/events.out.tfevents.1637404969.r8i1n6.1395687.5 b/emb-norm-6.6k/060-module.33.self_attention/events.out.tfevents.1637404969.r8i1n6.1395687.5 similarity index 100% rename from emb-norm-15k/060-module.33.self_attention/events.out.tfevents.1637404969.r8i1n6.1395687.5 rename to emb-norm-6.6k/060-module.33.self_attention/events.out.tfevents.1637404969.r8i1n6.1395687.5 diff --git a/emb-norm-15k/060-module.33/events.out.tfevents.1637404970.r8i1n6.1395687.10 b/emb-norm-6.6k/060-module.33/events.out.tfevents.1637404970.r8i1n6.1395687.10 similarity index 100% rename from emb-norm-15k/060-module.33/events.out.tfevents.1637404970.r8i1n6.1395687.10 rename to emb-norm-6.6k/060-module.33/events.out.tfevents.1637404970.r8i1n6.1395687.10 diff --git a/emb-norm-15k/060-module.34.input_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.11 b/emb-norm-6.6k/060-module.34.input_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.11 similarity index 100% rename from emb-norm-15k/060-module.34.input_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.11 rename to emb-norm-6.6k/060-module.34.input_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.11 diff --git a/emb-norm-15k/060-module.34.mlp.dense_4h_to_h/events.out.tfevents.1637404970.r8i1n6.1395687.19 b/emb-norm-6.6k/060-module.34.mlp.dense_4h_to_h/events.out.tfevents.1637404970.r8i1n6.1395687.19 similarity index 100% rename from emb-norm-15k/060-module.34.mlp.dense_4h_to_h/events.out.tfevents.1637404970.r8i1n6.1395687.19 rename to emb-norm-6.6k/060-module.34.mlp.dense_4h_to_h/events.out.tfevents.1637404970.r8i1n6.1395687.19 diff --git a/emb-norm-15k/060-module.34.mlp.dense_h_to_4h/events.out.tfevents.1637404970.r8i1n6.1395687.18 b/emb-norm-6.6k/060-module.34.mlp.dense_h_to_4h/events.out.tfevents.1637404970.r8i1n6.1395687.18 similarity index 100% rename from emb-norm-15k/060-module.34.mlp.dense_h_to_4h/events.out.tfevents.1637404970.r8i1n6.1395687.18 rename to emb-norm-6.6k/060-module.34.mlp.dense_h_to_4h/events.out.tfevents.1637404970.r8i1n6.1395687.18 diff --git a/emb-norm-15k/060-module.34.mlp/events.out.tfevents.1637404970.r8i1n6.1395687.20 b/emb-norm-6.6k/060-module.34.mlp/events.out.tfevents.1637404970.r8i1n6.1395687.20 similarity index 100% rename from emb-norm-15k/060-module.34.mlp/events.out.tfevents.1637404970.r8i1n6.1395687.20 rename to emb-norm-6.6k/060-module.34.mlp/events.out.tfevents.1637404970.r8i1n6.1395687.20 diff --git a/emb-norm-15k/060-module.34.post_attention_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.17 b/emb-norm-6.6k/060-module.34.post_attention_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.17 similarity index 100% rename from emb-norm-15k/060-module.34.post_attention_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.17 rename to emb-norm-6.6k/060-module.34.post_attention_layernorm/events.out.tfevents.1637404970.r8i1n6.1395687.17 diff --git a/emb-norm-15k/060-module.34.self_attention.attention_dropout/events.out.tfevents.1637404970.r8i1n6.1395687.14 b/emb-norm-6.6k/060-module.34.self_attention.attention_dropout/events.out.tfevents.1637404970.r8i1n6.1395687.14 similarity index 100% rename from emb-norm-15k/060-module.34.self_attention.attention_dropout/events.out.tfevents.1637404970.r8i1n6.1395687.14 rename to emb-norm-6.6k/060-module.34.self_attention.attention_dropout/events.out.tfevents.1637404970.r8i1n6.1395687.14 diff --git a/emb-norm-15k/060-module.34.self_attention.dense/events.out.tfevents.1637404970.r8i1n6.1395687.15 b/emb-norm-6.6k/060-module.34.self_attention.dense/events.out.tfevents.1637404970.r8i1n6.1395687.15 similarity index 100% rename from emb-norm-15k/060-module.34.self_attention.dense/events.out.tfevents.1637404970.r8i1n6.1395687.15 rename to emb-norm-6.6k/060-module.34.self_attention.dense/events.out.tfevents.1637404970.r8i1n6.1395687.15 diff --git a/emb-norm-15k/060-module.34.self_attention.query_key_value/events.out.tfevents.1637404970.r8i1n6.1395687.12 b/emb-norm-6.6k/060-module.34.self_attention.query_key_value/events.out.tfevents.1637404970.r8i1n6.1395687.12 similarity index 100% rename from emb-norm-15k/060-module.34.self_attention.query_key_value/events.out.tfevents.1637404970.r8i1n6.1395687.12 rename to emb-norm-6.6k/060-module.34.self_attention.query_key_value/events.out.tfevents.1637404970.r8i1n6.1395687.12 diff --git a/emb-norm-15k/060-module.34.self_attention.scale_mask_softmax/events.out.tfevents.1637404970.r8i1n6.1395687.13 b/emb-norm-6.6k/060-module.34.self_attention.scale_mask_softmax/events.out.tfevents.1637404970.r8i1n6.1395687.13 similarity index 100% rename from emb-norm-15k/060-module.34.self_attention.scale_mask_softmax/events.out.tfevents.1637404970.r8i1n6.1395687.13 rename to emb-norm-6.6k/060-module.34.self_attention.scale_mask_softmax/events.out.tfevents.1637404970.r8i1n6.1395687.13 diff --git a/emb-norm-15k/060-module.34.self_attention/events.out.tfevents.1637404970.r8i1n6.1395687.16 b/emb-norm-6.6k/060-module.34.self_attention/events.out.tfevents.1637404970.r8i1n6.1395687.16 similarity index 100% rename from emb-norm-15k/060-module.34.self_attention/events.out.tfevents.1637404970.r8i1n6.1395687.16 rename to emb-norm-6.6k/060-module.34.self_attention/events.out.tfevents.1637404970.r8i1n6.1395687.16 diff --git a/emb-norm-15k/060-module.34/events.out.tfevents.1637404970.r8i1n6.1395687.21 b/emb-norm-6.6k/060-module.34/events.out.tfevents.1637404970.r8i1n6.1395687.21 similarity index 100% rename from emb-norm-15k/060-module.34/events.out.tfevents.1637404970.r8i1n6.1395687.21 rename to emb-norm-6.6k/060-module.34/events.out.tfevents.1637404970.r8i1n6.1395687.21 diff --git a/emb-norm-15k/060-module/events.out.tfevents.1637404970.r8i1n6.1395687.22 b/emb-norm-6.6k/060-module/events.out.tfevents.1637404970.r8i1n6.1395687.22 similarity index 100% rename from emb-norm-15k/060-module/events.out.tfevents.1637404970.r8i1n6.1395687.22 rename to emb-norm-6.6k/060-module/events.out.tfevents.1637404970.r8i1n6.1395687.22 diff --git a/emb-norm-15k/092-module.49.input_layernorm/events.out.tfevents.1637404982.r8i2n6.1525706.0 b/emb-norm-6.6k/092-module.49.input_layernorm/events.out.tfevents.1637404982.r8i2n6.1525706.0 similarity index 100% rename from emb-norm-15k/092-module.49.input_layernorm/events.out.tfevents.1637404982.r8i2n6.1525706.0 rename to emb-norm-6.6k/092-module.49.input_layernorm/events.out.tfevents.1637404982.r8i2n6.1525706.0 diff --git a/emb-norm-15k/092-module.49.mlp.dense_4h_to_h/events.out.tfevents.1637404984.r8i2n6.1525706.8 b/emb-norm-6.6k/092-module.49.mlp.dense_4h_to_h/events.out.tfevents.1637404984.r8i2n6.1525706.8 similarity index 100% rename from emb-norm-15k/092-module.49.mlp.dense_4h_to_h/events.out.tfevents.1637404984.r8i2n6.1525706.8 rename to emb-norm-6.6k/092-module.49.mlp.dense_4h_to_h/events.out.tfevents.1637404984.r8i2n6.1525706.8 diff --git a/emb-norm-15k/092-module.49.mlp.dense_h_to_4h/events.out.tfevents.1637404983.r8i2n6.1525706.7 b/emb-norm-6.6k/092-module.49.mlp.dense_h_to_4h/events.out.tfevents.1637404983.r8i2n6.1525706.7 similarity index 100% rename from emb-norm-15k/092-module.49.mlp.dense_h_to_4h/events.out.tfevents.1637404983.r8i2n6.1525706.7 rename to emb-norm-6.6k/092-module.49.mlp.dense_h_to_4h/events.out.tfevents.1637404983.r8i2n6.1525706.7 diff --git a/emb-norm-15k/092-module.49.mlp/events.out.tfevents.1637404984.r8i2n6.1525706.9 b/emb-norm-6.6k/092-module.49.mlp/events.out.tfevents.1637404984.r8i2n6.1525706.9 similarity index 100% rename from emb-norm-15k/092-module.49.mlp/events.out.tfevents.1637404984.r8i2n6.1525706.9 rename to emb-norm-6.6k/092-module.49.mlp/events.out.tfevents.1637404984.r8i2n6.1525706.9 diff --git a/emb-norm-15k/092-module.49.post_attention_layernorm/events.out.tfevents.1637404983.r8i2n6.1525706.6 b/emb-norm-6.6k/092-module.49.post_attention_layernorm/events.out.tfevents.1637404983.r8i2n6.1525706.6 similarity index 100% rename from emb-norm-15k/092-module.49.post_attention_layernorm/events.out.tfevents.1637404983.r8i2n6.1525706.6 rename to emb-norm-6.6k/092-module.49.post_attention_layernorm/events.out.tfevents.1637404983.r8i2n6.1525706.6 diff --git a/emb-norm-15k/092-module.49.self_attention.attention_dropout/events.out.tfevents.1637404983.r8i2n6.1525706.3 b/emb-norm-6.6k/092-module.49.self_attention.attention_dropout/events.out.tfevents.1637404983.r8i2n6.1525706.3 similarity index 100% rename from emb-norm-15k/092-module.49.self_attention.attention_dropout/events.out.tfevents.1637404983.r8i2n6.1525706.3 rename to emb-norm-6.6k/092-module.49.self_attention.attention_dropout/events.out.tfevents.1637404983.r8i2n6.1525706.3 diff --git a/emb-norm-15k/092-module.49.self_attention.dense/events.out.tfevents.1637404983.r8i2n6.1525706.4 b/emb-norm-6.6k/092-module.49.self_attention.dense/events.out.tfevents.1637404983.r8i2n6.1525706.4 similarity index 100% rename from emb-norm-15k/092-module.49.self_attention.dense/events.out.tfevents.1637404983.r8i2n6.1525706.4 rename to emb-norm-6.6k/092-module.49.self_attention.dense/events.out.tfevents.1637404983.r8i2n6.1525706.4 diff --git a/emb-norm-15k/092-module.49.self_attention.query_key_value/events.out.tfevents.1637404983.r8i2n6.1525706.1 b/emb-norm-6.6k/092-module.49.self_attention.query_key_value/events.out.tfevents.1637404983.r8i2n6.1525706.1 similarity index 100% rename from emb-norm-15k/092-module.49.self_attention.query_key_value/events.out.tfevents.1637404983.r8i2n6.1525706.1 rename to emb-norm-6.6k/092-module.49.self_attention.query_key_value/events.out.tfevents.1637404983.r8i2n6.1525706.1 diff --git a/emb-norm-15k/092-module.49.self_attention.scale_mask_softmax/events.out.tfevents.1637404983.r8i2n6.1525706.2 b/emb-norm-6.6k/092-module.49.self_attention.scale_mask_softmax/events.out.tfevents.1637404983.r8i2n6.1525706.2 similarity index 100% rename from emb-norm-15k/092-module.49.self_attention.scale_mask_softmax/events.out.tfevents.1637404983.r8i2n6.1525706.2 rename to emb-norm-6.6k/092-module.49.self_attention.scale_mask_softmax/events.out.tfevents.1637404983.r8i2n6.1525706.2 diff --git a/emb-norm-15k/092-module.49.self_attention/events.out.tfevents.1637404983.r8i2n6.1525706.5 b/emb-norm-6.6k/092-module.49.self_attention/events.out.tfevents.1637404983.r8i2n6.1525706.5 similarity index 100% rename from emb-norm-15k/092-module.49.self_attention/events.out.tfevents.1637404983.r8i2n6.1525706.5 rename to emb-norm-6.6k/092-module.49.self_attention/events.out.tfevents.1637404983.r8i2n6.1525706.5 diff --git a/emb-norm-15k/092-module.49/events.out.tfevents.1637404984.r8i2n6.1525706.10 b/emb-norm-6.6k/092-module.49/events.out.tfevents.1637404984.r8i2n6.1525706.10 similarity index 100% rename from emb-norm-15k/092-module.49/events.out.tfevents.1637404984.r8i2n6.1525706.10 rename to emb-norm-6.6k/092-module.49/events.out.tfevents.1637404984.r8i2n6.1525706.10 diff --git a/emb-norm-15k/092-module.50.input_layernorm/events.out.tfevents.1637404984.r8i2n6.1525706.11 b/emb-norm-6.6k/092-module.50.input_layernorm/events.out.tfevents.1637404984.r8i2n6.1525706.11 similarity index 100% rename from emb-norm-15k/092-module.50.input_layernorm/events.out.tfevents.1637404984.r8i2n6.1525706.11 rename to emb-norm-6.6k/092-module.50.input_layernorm/events.out.tfevents.1637404984.r8i2n6.1525706.11 diff --git a/emb-norm-15k/092-module.50.mlp.dense_4h_to_h/events.out.tfevents.1637404984.r8i2n6.1525706.19 b/emb-norm-6.6k/092-module.50.mlp.dense_4h_to_h/events.out.tfevents.1637404984.r8i2n6.1525706.19 similarity index 100% rename from emb-norm-15k/092-module.50.mlp.dense_4h_to_h/events.out.tfevents.1637404984.r8i2n6.1525706.19 rename to emb-norm-6.6k/092-module.50.mlp.dense_4h_to_h/events.out.tfevents.1637404984.r8i2n6.1525706.19 diff --git a/emb-norm-15k/092-module.50.mlp.dense_h_to_4h/events.out.tfevents.1637404984.r8i2n6.1525706.18 b/emb-norm-6.6k/092-module.50.mlp.dense_h_to_4h/events.out.tfevents.1637404984.r8i2n6.1525706.18 similarity index 100% rename from emb-norm-15k/092-module.50.mlp.dense_h_to_4h/events.out.tfevents.1637404984.r8i2n6.1525706.18 rename to emb-norm-6.6k/092-module.50.mlp.dense_h_to_4h/events.out.tfevents.1637404984.r8i2n6.1525706.18 diff --git a/emb-norm-15k/092-module.50.mlp/events.out.tfevents.1637404984.r8i2n6.1525706.20 b/emb-norm-6.6k/092-module.50.mlp/events.out.tfevents.1637404984.r8i2n6.1525706.20 similarity index 100% rename from emb-norm-15k/092-module.50.mlp/events.out.tfevents.1637404984.r8i2n6.1525706.20 rename to emb-norm-6.6k/092-module.50.mlp/events.out.tfevents.1637404984.r8i2n6.1525706.20 diff --git a/emb-norm-15k/092-module.50.post_attention_layernorm/events.out.tfevents.1637404984.r8i2n6.1525706.17 b/emb-norm-6.6k/092-module.50.post_attention_layernorm/events.out.tfevents.1637404984.r8i2n6.1525706.17 similarity index 100% rename from emb-norm-15k/092-module.50.post_attention_layernorm/events.out.tfevents.1637404984.r8i2n6.1525706.17 rename to emb-norm-6.6k/092-module.50.post_attention_layernorm/events.out.tfevents.1637404984.r8i2n6.1525706.17 diff --git a/emb-norm-15k/092-module.50.self_attention.attention_dropout/events.out.tfevents.1637404984.r8i2n6.1525706.14 b/emb-norm-6.6k/092-module.50.self_attention.attention_dropout/events.out.tfevents.1637404984.r8i2n6.1525706.14 similarity index 100% rename from emb-norm-15k/092-module.50.self_attention.attention_dropout/events.out.tfevents.1637404984.r8i2n6.1525706.14 rename to emb-norm-6.6k/092-module.50.self_attention.attention_dropout/events.out.tfevents.1637404984.r8i2n6.1525706.14 diff --git a/emb-norm-15k/092-module.50.self_attention.dense/events.out.tfevents.1637404984.r8i2n6.1525706.15 b/emb-norm-6.6k/092-module.50.self_attention.dense/events.out.tfevents.1637404984.r8i2n6.1525706.15 similarity index 100% rename from emb-norm-15k/092-module.50.self_attention.dense/events.out.tfevents.1637404984.r8i2n6.1525706.15 rename to emb-norm-6.6k/092-module.50.self_attention.dense/events.out.tfevents.1637404984.r8i2n6.1525706.15 diff --git a/emb-norm-15k/092-module.50.self_attention.query_key_value/events.out.tfevents.1637404984.r8i2n6.1525706.12 b/emb-norm-6.6k/092-module.50.self_attention.query_key_value/events.out.tfevents.1637404984.r8i2n6.1525706.12 similarity index 100% rename from emb-norm-15k/092-module.50.self_attention.query_key_value/events.out.tfevents.1637404984.r8i2n6.1525706.12 rename to emb-norm-6.6k/092-module.50.self_attention.query_key_value/events.out.tfevents.1637404984.r8i2n6.1525706.12 diff --git a/emb-norm-15k/092-module.50.self_attention.scale_mask_softmax/events.out.tfevents.1637404984.r8i2n6.1525706.13 b/emb-norm-6.6k/092-module.50.self_attention.scale_mask_softmax/events.out.tfevents.1637404984.r8i2n6.1525706.13 similarity index 100% rename from emb-norm-15k/092-module.50.self_attention.scale_mask_softmax/events.out.tfevents.1637404984.r8i2n6.1525706.13 rename to emb-norm-6.6k/092-module.50.self_attention.scale_mask_softmax/events.out.tfevents.1637404984.r8i2n6.1525706.13 diff --git a/emb-norm-15k/092-module.50.self_attention/events.out.tfevents.1637404984.r8i2n6.1525706.16 b/emb-norm-6.6k/092-module.50.self_attention/events.out.tfevents.1637404984.r8i2n6.1525706.16 similarity index 100% rename from emb-norm-15k/092-module.50.self_attention/events.out.tfevents.1637404984.r8i2n6.1525706.16 rename to emb-norm-6.6k/092-module.50.self_attention/events.out.tfevents.1637404984.r8i2n6.1525706.16 diff --git a/emb-norm-15k/092-module.50/events.out.tfevents.1637404984.r8i2n6.1525706.21 b/emb-norm-6.6k/092-module.50/events.out.tfevents.1637404984.r8i2n6.1525706.21 similarity index 100% rename from emb-norm-15k/092-module.50/events.out.tfevents.1637404984.r8i2n6.1525706.21 rename to emb-norm-6.6k/092-module.50/events.out.tfevents.1637404984.r8i2n6.1525706.21 diff --git a/emb-norm-15k/092-module/events.out.tfevents.1637404984.r8i2n6.1525706.22 b/emb-norm-6.6k/092-module/events.out.tfevents.1637404984.r8i2n6.1525706.22 similarity index 100% rename from emb-norm-15k/092-module/events.out.tfevents.1637404984.r8i2n6.1525706.22 rename to emb-norm-6.6k/092-module/events.out.tfevents.1637404984.r8i2n6.1525706.22 diff --git a/emb-norm-15k/124-module.65.input_layernorm/events.out.tfevents.1637404996.r9i7n1.414271.0 b/emb-norm-6.6k/124-module.65.input_layernorm/events.out.tfevents.1637404996.r9i7n1.414271.0 similarity index 100% rename from emb-norm-15k/124-module.65.input_layernorm/events.out.tfevents.1637404996.r9i7n1.414271.0 rename to emb-norm-6.6k/124-module.65.input_layernorm/events.out.tfevents.1637404996.r9i7n1.414271.0 diff --git a/emb-norm-15k/124-module.65.mlp.dense_4h_to_h/events.out.tfevents.1637404997.r9i7n1.414271.8 b/emb-norm-6.6k/124-module.65.mlp.dense_4h_to_h/events.out.tfevents.1637404997.r9i7n1.414271.8 similarity index 100% rename from emb-norm-15k/124-module.65.mlp.dense_4h_to_h/events.out.tfevents.1637404997.r9i7n1.414271.8 rename to emb-norm-6.6k/124-module.65.mlp.dense_4h_to_h/events.out.tfevents.1637404997.r9i7n1.414271.8 diff --git a/emb-norm-15k/124-module.65.mlp.dense_h_to_4h/events.out.tfevents.1637404997.r9i7n1.414271.7 b/emb-norm-6.6k/124-module.65.mlp.dense_h_to_4h/events.out.tfevents.1637404997.r9i7n1.414271.7 similarity index 100% rename from emb-norm-15k/124-module.65.mlp.dense_h_to_4h/events.out.tfevents.1637404997.r9i7n1.414271.7 rename to emb-norm-6.6k/124-module.65.mlp.dense_h_to_4h/events.out.tfevents.1637404997.r9i7n1.414271.7 diff --git a/emb-norm-15k/124-module.65.mlp/events.out.tfevents.1637404997.r9i7n1.414271.9 b/emb-norm-6.6k/124-module.65.mlp/events.out.tfevents.1637404997.r9i7n1.414271.9 similarity index 100% rename from emb-norm-15k/124-module.65.mlp/events.out.tfevents.1637404997.r9i7n1.414271.9 rename to emb-norm-6.6k/124-module.65.mlp/events.out.tfevents.1637404997.r9i7n1.414271.9 diff --git a/emb-norm-15k/124-module.65.post_attention_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.6 b/emb-norm-6.6k/124-module.65.post_attention_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.6 similarity index 100% rename from emb-norm-15k/124-module.65.post_attention_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.6 rename to emb-norm-6.6k/124-module.65.post_attention_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.6 diff --git a/emb-norm-15k/124-module.65.self_attention.attention_dropout/events.out.tfevents.1637404997.r9i7n1.414271.3 b/emb-norm-6.6k/124-module.65.self_attention.attention_dropout/events.out.tfevents.1637404997.r9i7n1.414271.3 similarity index 100% rename from emb-norm-15k/124-module.65.self_attention.attention_dropout/events.out.tfevents.1637404997.r9i7n1.414271.3 rename to emb-norm-6.6k/124-module.65.self_attention.attention_dropout/events.out.tfevents.1637404997.r9i7n1.414271.3 diff --git a/emb-norm-15k/124-module.65.self_attention.dense/events.out.tfevents.1637404997.r9i7n1.414271.4 b/emb-norm-6.6k/124-module.65.self_attention.dense/events.out.tfevents.1637404997.r9i7n1.414271.4 similarity index 100% rename from emb-norm-15k/124-module.65.self_attention.dense/events.out.tfevents.1637404997.r9i7n1.414271.4 rename to emb-norm-6.6k/124-module.65.self_attention.dense/events.out.tfevents.1637404997.r9i7n1.414271.4 diff --git a/emb-norm-15k/124-module.65.self_attention.query_key_value/events.out.tfevents.1637404997.r9i7n1.414271.1 b/emb-norm-6.6k/124-module.65.self_attention.query_key_value/events.out.tfevents.1637404997.r9i7n1.414271.1 similarity index 100% rename from emb-norm-15k/124-module.65.self_attention.query_key_value/events.out.tfevents.1637404997.r9i7n1.414271.1 rename to emb-norm-6.6k/124-module.65.self_attention.query_key_value/events.out.tfevents.1637404997.r9i7n1.414271.1 diff --git a/emb-norm-15k/124-module.65.self_attention.scale_mask_softmax/events.out.tfevents.1637404997.r9i7n1.414271.2 b/emb-norm-6.6k/124-module.65.self_attention.scale_mask_softmax/events.out.tfevents.1637404997.r9i7n1.414271.2 similarity index 100% rename from emb-norm-15k/124-module.65.self_attention.scale_mask_softmax/events.out.tfevents.1637404997.r9i7n1.414271.2 rename to emb-norm-6.6k/124-module.65.self_attention.scale_mask_softmax/events.out.tfevents.1637404997.r9i7n1.414271.2 diff --git a/emb-norm-15k/124-module.65.self_attention/events.out.tfevents.1637404997.r9i7n1.414271.5 b/emb-norm-6.6k/124-module.65.self_attention/events.out.tfevents.1637404997.r9i7n1.414271.5 similarity index 100% rename from emb-norm-15k/124-module.65.self_attention/events.out.tfevents.1637404997.r9i7n1.414271.5 rename to emb-norm-6.6k/124-module.65.self_attention/events.out.tfevents.1637404997.r9i7n1.414271.5 diff --git a/emb-norm-15k/124-module.65/events.out.tfevents.1637404997.r9i7n1.414271.10 b/emb-norm-6.6k/124-module.65/events.out.tfevents.1637404997.r9i7n1.414271.10 similarity index 100% rename from emb-norm-15k/124-module.65/events.out.tfevents.1637404997.r9i7n1.414271.10 rename to emb-norm-6.6k/124-module.65/events.out.tfevents.1637404997.r9i7n1.414271.10 diff --git a/emb-norm-15k/124-module.66.input_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.11 b/emb-norm-6.6k/124-module.66.input_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.11 similarity index 100% rename from emb-norm-15k/124-module.66.input_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.11 rename to emb-norm-6.6k/124-module.66.input_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.11 diff --git a/emb-norm-15k/124-module.66.mlp.dense_4h_to_h/events.out.tfevents.1637404997.r9i7n1.414271.19 b/emb-norm-6.6k/124-module.66.mlp.dense_4h_to_h/events.out.tfevents.1637404997.r9i7n1.414271.19 similarity index 100% rename from emb-norm-15k/124-module.66.mlp.dense_4h_to_h/events.out.tfevents.1637404997.r9i7n1.414271.19 rename to emb-norm-6.6k/124-module.66.mlp.dense_4h_to_h/events.out.tfevents.1637404997.r9i7n1.414271.19 diff --git a/emb-norm-15k/124-module.66.mlp.dense_h_to_4h/events.out.tfevents.1637404997.r9i7n1.414271.18 b/emb-norm-6.6k/124-module.66.mlp.dense_h_to_4h/events.out.tfevents.1637404997.r9i7n1.414271.18 similarity index 100% rename from emb-norm-15k/124-module.66.mlp.dense_h_to_4h/events.out.tfevents.1637404997.r9i7n1.414271.18 rename to emb-norm-6.6k/124-module.66.mlp.dense_h_to_4h/events.out.tfevents.1637404997.r9i7n1.414271.18 diff --git a/emb-norm-15k/124-module.66.mlp/events.out.tfevents.1637404997.r9i7n1.414271.20 b/emb-norm-6.6k/124-module.66.mlp/events.out.tfevents.1637404997.r9i7n1.414271.20 similarity index 100% rename from emb-norm-15k/124-module.66.mlp/events.out.tfevents.1637404997.r9i7n1.414271.20 rename to emb-norm-6.6k/124-module.66.mlp/events.out.tfevents.1637404997.r9i7n1.414271.20 diff --git a/emb-norm-15k/124-module.66.post_attention_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.17 b/emb-norm-6.6k/124-module.66.post_attention_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.17 similarity index 100% rename from emb-norm-15k/124-module.66.post_attention_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.17 rename to emb-norm-6.6k/124-module.66.post_attention_layernorm/events.out.tfevents.1637404997.r9i7n1.414271.17 diff --git a/emb-norm-15k/124-module.66.self_attention.attention_dropout/events.out.tfevents.1637404997.r9i7n1.414271.14 b/emb-norm-6.6k/124-module.66.self_attention.attention_dropout/events.out.tfevents.1637404997.r9i7n1.414271.14 similarity index 100% rename from emb-norm-15k/124-module.66.self_attention.attention_dropout/events.out.tfevents.1637404997.r9i7n1.414271.14 rename to emb-norm-6.6k/124-module.66.self_attention.attention_dropout/events.out.tfevents.1637404997.r9i7n1.414271.14 diff --git a/emb-norm-15k/124-module.66.self_attention.dense/events.out.tfevents.1637404997.r9i7n1.414271.15 b/emb-norm-6.6k/124-module.66.self_attention.dense/events.out.tfevents.1637404997.r9i7n1.414271.15 similarity index 100% rename from emb-norm-15k/124-module.66.self_attention.dense/events.out.tfevents.1637404997.r9i7n1.414271.15 rename to emb-norm-6.6k/124-module.66.self_attention.dense/events.out.tfevents.1637404997.r9i7n1.414271.15 diff --git a/emb-norm-15k/124-module.66.self_attention.query_key_value/events.out.tfevents.1637404997.r9i7n1.414271.12 b/emb-norm-6.6k/124-module.66.self_attention.query_key_value/events.out.tfevents.1637404997.r9i7n1.414271.12 similarity index 100% rename from emb-norm-15k/124-module.66.self_attention.query_key_value/events.out.tfevents.1637404997.r9i7n1.414271.12 rename to emb-norm-6.6k/124-module.66.self_attention.query_key_value/events.out.tfevents.1637404997.r9i7n1.414271.12 diff --git a/emb-norm-15k/124-module.66.self_attention.scale_mask_softmax/events.out.tfevents.1637404997.r9i7n1.414271.13 b/emb-norm-6.6k/124-module.66.self_attention.scale_mask_softmax/events.out.tfevents.1637404997.r9i7n1.414271.13 similarity index 100% rename from emb-norm-15k/124-module.66.self_attention.scale_mask_softmax/events.out.tfevents.1637404997.r9i7n1.414271.13 rename to emb-norm-6.6k/124-module.66.self_attention.scale_mask_softmax/events.out.tfevents.1637404997.r9i7n1.414271.13 diff --git a/emb-norm-15k/124-module.66.self_attention/events.out.tfevents.1637404997.r9i7n1.414271.16 b/emb-norm-6.6k/124-module.66.self_attention/events.out.tfevents.1637404997.r9i7n1.414271.16 similarity index 100% rename from emb-norm-15k/124-module.66.self_attention/events.out.tfevents.1637404997.r9i7n1.414271.16 rename to emb-norm-6.6k/124-module.66.self_attention/events.out.tfevents.1637404997.r9i7n1.414271.16 diff --git a/emb-norm-15k/124-module.66/events.out.tfevents.1637404997.r9i7n1.414271.21 b/emb-norm-6.6k/124-module.66/events.out.tfevents.1637404997.r9i7n1.414271.21 similarity index 100% rename from emb-norm-15k/124-module.66/events.out.tfevents.1637404997.r9i7n1.414271.21 rename to emb-norm-6.6k/124-module.66/events.out.tfevents.1637404997.r9i7n1.414271.21 diff --git a/emb-norm-15k/124-module.68/events.out.tfevents.1637404997.r9i7n1.414271.22 b/emb-norm-6.6k/124-module.68/events.out.tfevents.1637404997.r9i7n1.414271.22 similarity index 100% rename from emb-norm-15k/124-module.68/events.out.tfevents.1637404997.r9i7n1.414271.22 rename to emb-norm-6.6k/124-module.68/events.out.tfevents.1637404997.r9i7n1.414271.22 diff --git a/emb-norm-15k/124-module/events.out.tfevents.1637404997.r9i7n1.414271.23 b/emb-norm-6.6k/124-module/events.out.tfevents.1637404997.r9i7n1.414271.23 similarity index 100% rename from emb-norm-15k/124-module/events.out.tfevents.1637404997.r9i7n1.414271.23 rename to emb-norm-6.6k/124-module/events.out.tfevents.1637404997.r9i7n1.414271.23