fix
Browse filesThis view is limited to 50 files because it contains too many changes. Β
See raw diff
- {emb-norm-6k β emb-norm-14.6k}/000-module.3.input_layernorm/events.out.tfevents.1638234920.r6i3n2.1319219.5 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.13 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.12 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.3.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.14 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.3.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.11 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.8 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.3.self_attention.dense/events.out.tfevents.1638234920.r6i3n2.1319219.9 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.3.self_attention.query_key_value/events.out.tfevents.1638234920.r6i3n2.1319219.6 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638234920.r6i3n2.1319219.7 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.3.self_attention/events.out.tfevents.1638234920.r6i3n2.1319219.10 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.3/events.out.tfevents.1638234921.r6i3n2.1319219.15 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4.input_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.16 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.24 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.23 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.25 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.22 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638234921.r6i3n2.1319219.19 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4.self_attention.dense/events.out.tfevents.1638234921.r6i3n2.1319219.20 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4.self_attention.query_key_value/events.out.tfevents.1638234921.r6i3n2.1319219.17 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638234921.r6i3n2.1319219.18 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4.self_attention/events.out.tfevents.1638234921.r6i3n2.1319219.21 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.4/events.out.tfevents.1638234921.r6i3n2.1319219.26 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.3 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.2 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1638234920.r6i3n2.1319219.0 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.1 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module.tied_modules.embed/events.out.tfevents.1638234920.r6i3n2.1319219.4 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/000-module/events.out.tfevents.1638234921.r6i3n2.1319219.27 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17.input_layernorm/events.out.tfevents.1638234932.r6i5n3.61809.0 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.8 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.7 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17.mlp/events.out.tfevents.1638234933.r6i5n3.61809.9 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.6 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17.self_attention.attention_dropout/events.out.tfevents.1638234932.r6i5n3.61809.3 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17.self_attention.dense/events.out.tfevents.1638234932.r6i5n3.61809.4 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17.self_attention.query_key_value/events.out.tfevents.1638234932.r6i5n3.61809.1 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638234932.r6i5n3.61809.2 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17.self_attention/events.out.tfevents.1638234932.r6i5n3.61809.5 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.17/events.out.tfevents.1638234933.r6i5n3.61809.10 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18.input_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.11 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.19 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.18 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18.mlp/events.out.tfevents.1638234933.r6i5n3.61809.20 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.17 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18.self_attention.attention_dropout/events.out.tfevents.1638234933.r6i5n3.61809.14 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18.self_attention.dense/events.out.tfevents.1638234933.r6i5n3.61809.15 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18.self_attention.query_key_value/events.out.tfevents.1638234933.r6i5n3.61809.12 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638234933.r6i5n3.61809.13 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18.self_attention/events.out.tfevents.1638234933.r6i5n3.61809.16 +0 -0
- {emb-norm-6k β emb-norm-14.6k}/056-module.18/events.out.tfevents.1638234933.r6i5n3.61809.21 +0 -0
{emb-norm-6k β emb-norm-14.6k}/000-module.3.input_layernorm/events.out.tfevents.1638234920.r6i3n2.1319219.5
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.13
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.12
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.3.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.14
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.3.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.11
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.8
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.3.self_attention.dense/events.out.tfevents.1638234920.r6i3n2.1319219.9
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.3.self_attention.query_key_value/events.out.tfevents.1638234920.r6i3n2.1319219.6
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638234920.r6i3n2.1319219.7
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.3.self_attention/events.out.tfevents.1638234920.r6i3n2.1319219.10
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.3/events.out.tfevents.1638234921.r6i3n2.1319219.15
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4.input_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.16
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.24
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.23
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.25
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.22
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638234921.r6i3n2.1319219.19
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4.self_attention.dense/events.out.tfevents.1638234921.r6i3n2.1319219.20
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4.self_attention.query_key_value/events.out.tfevents.1638234921.r6i3n2.1319219.17
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638234921.r6i3n2.1319219.18
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4.self_attention/events.out.tfevents.1638234921.r6i3n2.1319219.21
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.4/events.out.tfevents.1638234921.r6i3n2.1319219.26
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.3
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.2
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1638234920.r6i3n2.1319219.0
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.1
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module.tied_modules.embed/events.out.tfevents.1638234920.r6i3n2.1319219.4
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/000-module/events.out.tfevents.1638234921.r6i3n2.1319219.27
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17.input_layernorm/events.out.tfevents.1638234932.r6i5n3.61809.0
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.8
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.7
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17.mlp/events.out.tfevents.1638234933.r6i5n3.61809.9
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.6
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17.self_attention.attention_dropout/events.out.tfevents.1638234932.r6i5n3.61809.3
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17.self_attention.dense/events.out.tfevents.1638234932.r6i5n3.61809.4
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17.self_attention.query_key_value/events.out.tfevents.1638234932.r6i5n3.61809.1
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638234932.r6i5n3.61809.2
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17.self_attention/events.out.tfevents.1638234932.r6i5n3.61809.5
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.17/events.out.tfevents.1638234933.r6i5n3.61809.10
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18.input_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.11
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.19
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.18
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18.mlp/events.out.tfevents.1638234933.r6i5n3.61809.20
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.17
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18.self_attention.attention_dropout/events.out.tfevents.1638234933.r6i5n3.61809.14
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18.self_attention.dense/events.out.tfevents.1638234933.r6i5n3.61809.15
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18.self_attention.query_key_value/events.out.tfevents.1638234933.r6i5n3.61809.12
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638234933.r6i5n3.61809.13
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18.self_attention/events.out.tfevents.1638234933.r6i5n3.61809.16
RENAMED
File without changes
|
{emb-norm-6k β emb-norm-14.6k}/056-module.18/events.out.tfevents.1638234933.r6i5n3.61809.21
RENAMED
File without changes
|