stas committed on
Commit
b97bd85
·
1 Parent(s): 3162d46
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.input_layernorm/events.out.tfevents.1638234920.r6i3n2.1319219.5 +0 -0
  2. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.13 +0 -0
  3. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.12 +0 -0
  4. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.14 +0 -0
  5. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.11 +0 -0
  6. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.8 +0 -0
  7. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.self_attention.dense/events.out.tfevents.1638234920.r6i3n2.1319219.9 +0 -0
  8. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.self_attention.query_key_value/events.out.tfevents.1638234920.r6i3n2.1319219.6 +0 -0
  9. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638234920.r6i3n2.1319219.7 +0 -0
  10. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.self_attention/events.out.tfevents.1638234920.r6i3n2.1319219.10 +0 -0
  11. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.3/events.out.tfevents.1638234921.r6i3n2.1319219.15 +0 -0
  12. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.input_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.16 +0 -0
  13. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.24 +0 -0
  14. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.23 +0 -0
  15. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.25 +0 -0
  16. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.22 +0 -0
  17. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638234921.r6i3n2.1319219.19 +0 -0
  18. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.self_attention.dense/events.out.tfevents.1638234921.r6i3n2.1319219.20 +0 -0
  19. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.self_attention.query_key_value/events.out.tfevents.1638234921.r6i3n2.1319219.17 +0 -0
  20. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638234921.r6i3n2.1319219.18 +0 -0
  21. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.self_attention/events.out.tfevents.1638234921.r6i3n2.1319219.21 +0 -0
  22. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.4/events.out.tfevents.1638234921.r6i3n2.1319219.26 +0 -0
  23. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.3 +0 -0
  24. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.2 +0 -0
  25. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1638234920.r6i3n2.1319219.0 +0 -0
  26. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.1 +0 -0
  27. {emb-norm-6k β†’ emb-norm-14.6k}/000-module.tied_modules.embed/events.out.tfevents.1638234920.r6i3n2.1319219.4 +0 -0
  28. {emb-norm-6k β†’ emb-norm-14.6k}/000-module/events.out.tfevents.1638234921.r6i3n2.1319219.27 +0 -0
  29. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.input_layernorm/events.out.tfevents.1638234932.r6i5n3.61809.0 +0 -0
  30. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.8 +0 -0
  31. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.7 +0 -0
  32. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.mlp/events.out.tfevents.1638234933.r6i5n3.61809.9 +0 -0
  33. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.6 +0 -0
  34. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.self_attention.attention_dropout/events.out.tfevents.1638234932.r6i5n3.61809.3 +0 -0
  35. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.self_attention.dense/events.out.tfevents.1638234932.r6i5n3.61809.4 +0 -0
  36. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.self_attention.query_key_value/events.out.tfevents.1638234932.r6i5n3.61809.1 +0 -0
  37. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638234932.r6i5n3.61809.2 +0 -0
  38. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.self_attention/events.out.tfevents.1638234932.r6i5n3.61809.5 +0 -0
  39. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.17/events.out.tfevents.1638234933.r6i5n3.61809.10 +0 -0
  40. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.input_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.11 +0 -0
  41. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.19 +0 -0
  42. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.18 +0 -0
  43. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.mlp/events.out.tfevents.1638234933.r6i5n3.61809.20 +0 -0
  44. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.17 +0 -0
  45. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.self_attention.attention_dropout/events.out.tfevents.1638234933.r6i5n3.61809.14 +0 -0
  46. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.self_attention.dense/events.out.tfevents.1638234933.r6i5n3.61809.15 +0 -0
  47. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.self_attention.query_key_value/events.out.tfevents.1638234933.r6i5n3.61809.12 +0 -0
  48. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638234933.r6i5n3.61809.13 +0 -0
  49. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.self_attention/events.out.tfevents.1638234933.r6i5n3.61809.16 +0 -0
  50. {emb-norm-6k β†’ emb-norm-14.6k}/056-module.18/events.out.tfevents.1638234933.r6i5n3.61809.21 +0 -0
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.input_layernorm/events.out.tfevents.1638234920.r6i3n2.1319219.5 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.13 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.12 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.14 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.11 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.8 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.self_attention.dense/events.out.tfevents.1638234920.r6i3n2.1319219.9 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.self_attention.query_key_value/events.out.tfevents.1638234920.r6i3n2.1319219.6 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638234920.r6i3n2.1319219.7 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3.self_attention/events.out.tfevents.1638234920.r6i3n2.1319219.10 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.3/events.out.tfevents.1638234921.r6i3n2.1319219.15 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.input_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.16 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638234921.r6i3n2.1319219.24 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638234921.r6i3n2.1319219.23 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.mlp/events.out.tfevents.1638234921.r6i3n2.1319219.25 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.post_attention_layernorm/events.out.tfevents.1638234921.r6i3n2.1319219.22 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638234921.r6i3n2.1319219.19 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.self_attention.dense/events.out.tfevents.1638234921.r6i3n2.1319219.20 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.self_attention.query_key_value/events.out.tfevents.1638234921.r6i3n2.1319219.17 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638234921.r6i3n2.1319219.18 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4.self_attention/events.out.tfevents.1638234921.r6i3n2.1319219.21 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.4/events.out.tfevents.1638234921.r6i3n2.1319219.26 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638234920.r6i3n2.1319219.3 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.2 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.tied_modules.embed.word_embeddings.norm/events.out.tfevents.1638234920.r6i3n2.1319219.0 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638234920.r6i3n2.1319219.1 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module.tied_modules.embed/events.out.tfevents.1638234920.r6i3n2.1319219.4 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/000-module/events.out.tfevents.1638234921.r6i3n2.1319219.27 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.input_layernorm/events.out.tfevents.1638234932.r6i5n3.61809.0 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.8 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.7 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.mlp/events.out.tfevents.1638234933.r6i5n3.61809.9 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.6 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.self_attention.attention_dropout/events.out.tfevents.1638234932.r6i5n3.61809.3 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.self_attention.dense/events.out.tfevents.1638234932.r6i5n3.61809.4 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.self_attention.query_key_value/events.out.tfevents.1638234932.r6i5n3.61809.1 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638234932.r6i5n3.61809.2 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17.self_attention/events.out.tfevents.1638234932.r6i5n3.61809.5 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.17/events.out.tfevents.1638234933.r6i5n3.61809.10 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.input_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.11 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638234933.r6i5n3.61809.19 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638234933.r6i5n3.61809.18 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.mlp/events.out.tfevents.1638234933.r6i5n3.61809.20 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.post_attention_layernorm/events.out.tfevents.1638234933.r6i5n3.61809.17 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.self_attention.attention_dropout/events.out.tfevents.1638234933.r6i5n3.61809.14 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.self_attention.dense/events.out.tfevents.1638234933.r6i5n3.61809.15 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.self_attention.query_key_value/events.out.tfevents.1638234933.r6i5n3.61809.12 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638234933.r6i5n3.61809.13 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18.self_attention/events.out.tfevents.1638234933.r6i5n3.61809.16 RENAMED
File without changes
{emb-norm-6k β†’ emb-norm-14.6k}/056-module.18/events.out.tfevents.1638234933.r6i5n3.61809.21 RENAMED
File without changes