ashanhr committed on
Commit
61049ff
1 Parent(s): cffc794

Training in progress, step 3200, checkpoint

Browse files
last-checkpoint/model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa3f8250eedc0ad91d9bd7bd29190dfcd30c24ddbb981802ff4398fb1b6f8ccb
3
  size 4978139416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bf71b0c4b5b42be2c849af7ec687de0ddfb09171ee59dc0c9b9e95435acb0ae
3
  size 4978139416
last-checkpoint/model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d61642ae37b7f2123a78d2dc95232dacaf674afbc5bc78d70d4b6245a6343788
3
  size 3659223436
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e23c99508fe49e7d270ef25d2b0bfddea927c361d4b4b369364b31eb5bfb76aa
3
  size 3659223436
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9aa0dc12fc4c549ade65217632d28f06d688771482b33353c8dcff908cd43500
3
  size 17241500333
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:794316e4b1b49164c3c1b912b03bc9e5c56a1bde3e75f18b56f92a8c3ef576cd
3
  size 17241500333
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b8972e9f2b0f288dfd8ade7d14f3387e82aa534b7b0691b69299c0919f543f0
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:caa8f6a1dd5101e10414474b080f8f573bd80f1bc9e5c32a51cbba518e254664
3
+ size 14567
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd47c81b0d91d48642f51b85203435f35325e0ebcfd794d4d6fa6f9f3a411358
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9caf1980567e30be4f62497610fa1f8c611b6eb31004cde77b37b2a91c8900c9
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.2628920227320564,
5
  "eval_steps": 100,
6
- "global_step": 3000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -487,6 +487,38 @@
487
  "eval_samples_per_second": 27.932,
488
  "eval_steps_per_second": 3.492,
489
  "step": 3000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
490
  }
491
  ],
492
  "logging_steps": 100,
@@ -494,7 +526,7 @@
494
  "num_input_tokens_seen": 0,
495
  "num_train_epochs": 30,
496
  "save_steps": 100,
497
- "total_flos": 3.298748154606821e+19,
498
  "train_batch_size": 8,
499
  "trial_name": null,
500
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.3470848242475268,
5
  "eval_steps": 100,
6
+ "global_step": 3200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
487
  "eval_samples_per_second": 27.932,
488
  "eval_steps_per_second": 3.492,
489
  "step": 3000
490
+ },
491
+ {
492
+ "epoch": 1.3,
493
+ "grad_norm": 3.9499669075012207,
494
+ "learning_rate": 4.816749116607774e-05,
495
+ "loss": 2.4353,
496
+ "step": 3100
497
+ },
498
+ {
499
+ "epoch": 1.3,
500
+ "eval_cer": 0.5479229400492746,
501
+ "eval_loss": 3.4527170658111572,
502
+ "eval_runtime": 354.1425,
503
+ "eval_samples_per_second": 26.763,
504
+ "eval_steps_per_second": 3.346,
505
+ "step": 3100
506
+ },
507
+ {
508
+ "epoch": 1.35,
509
+ "grad_norm": 2.9536569118499756,
510
+ "learning_rate": 4.809681978798587e-05,
511
+ "loss": 2.9787,
512
+ "step": 3200
513
+ },
514
+ {
515
+ "epoch": 1.35,
516
+ "eval_cer": 0.5677500879903015,
517
+ "eval_loss": 2.6674227714538574,
518
+ "eval_runtime": 344.0522,
519
+ "eval_samples_per_second": 27.548,
520
+ "eval_steps_per_second": 3.444,
521
+ "step": 3200
522
  }
523
  ],
524
  "logging_steps": 100,
 
526
  "num_input_tokens_seen": 0,
527
  "num_train_epochs": 30,
528
  "save_steps": 100,
529
+ "total_flos": 3.518283860575115e+19,
530
  "train_batch_size": 8,
531
  "trial_name": null,
532
  "trial_params": null