Training in progress, step 21000

Browse files

Files changed (9) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +123 -3
last-checkpoint/training_args.bin +1 -1
pytorch_model.bin +1 -1
training_args.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b7d8c9fb8208aa0e0d90ff9e6faa30e64692a370a85f4d8998eee25bca138e50
 size 2226478553

 version https://git-lfs.github.com/spec/v1
+oid sha256:39a351e6af26803f9eeacbdc3599fe7ba53df6f5641098b8daa5f7b9e0aa7b85
 size 2226478553

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ff61a403b3cfb6a54ffab03f89d73788332a1bacb81b51101f34eaa479906cb3
 size 1113252715

 version https://git-lfs.github.com/spec/v1
+oid sha256:59dcfd93fbced501dd096334a41c07a4b2e21743fa787c29c4db14612e8f084f
 size 1113252715

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ddb58e7fd295f3218fc9dda421b48419dac1c35f9f62dd226cd79272ce3149c8
 size 17563

 version https://git-lfs.github.com/spec/v1
+oid sha256:2427d3e67c681daaaba70098244ec32f3b70c7781145897a05d923a006eff520
 size 17563

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:766c4f37fdc6039a73178318ed142079f6cd59c61c3481cd6269f2a7cfa68325
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:88c633fcf373eeb32eac8eef8541ef4cf7ce7b0edbad3ac306cf7779b78afda6
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e5fd6c830f4df967d9f2291b54c56401f3e6ffddab3b4f1fcd21a88c860c00bf
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:7b337a80290075bf247d1150cdeaf1a5b708e8ccc1775639aea6fdc42b499e1c
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.7039331537933788,
-  "global_step": 20800,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -12486,11 +12486,131 @@
       "learning_rate": 1.5456564448620482e-05,
       "loss": 1.1033,
       "step": 20800
     }
   ],
   "max_steps": 24414,
   "num_train_epochs": 2,
-  "total_flos": 2.810210873905797e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.7203170279652253,
+  "global_step": 21000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.5456564448620482e-05,
       "loss": 1.1033,
       "step": 20800
+    },
+    {
+      "epoch": 1.7,
+      "learning_rate": 1.5413854958571797e-05,
+      "loss": 1.1021,
+      "step": 20810
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.5371145468523108e-05,
+      "loss": 1.0975,
+      "step": 20820
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.532843597847442e-05,
+      "loss": 1.0981,
+      "step": 20830
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.528572648842573e-05,
+      "loss": 1.1019,
+      "step": 20840
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.524301699837704e-05,
+      "loss": 1.1089,
+      "step": 20850
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.5200307508328351e-05,
+      "loss": 1.1111,
+      "step": 20860
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.5157598018279662e-05,
+      "loss": 1.1091,
+      "step": 20870
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.5114888528230975e-05,
+      "loss": 1.1001,
+      "step": 20880
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.5072179038182286e-05,
+      "loss": 1.0987,
+      "step": 20890
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.5029469548133595e-05,
+      "loss": 1.107,
+      "step": 20900
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.4986760058084906e-05,
+      "loss": 1.0973,
+      "step": 20910
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.494405056803622e-05,
+      "loss": 1.0978,
+      "step": 20920
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 1.490134107798753e-05,
+      "loss": 1.0993,
+      "step": 20930
+    },
+    {
+      "epoch": 1.72,
+      "learning_rate": 1.485863158793884e-05,
+      "loss": 1.093,
+      "step": 20940
+    },
+    {
+      "epoch": 1.72,
+      "learning_rate": 1.4815922097890153e-05,
+      "loss": 1.1091,
+      "step": 20950
+    },
+    {
+      "epoch": 1.72,
+      "learning_rate": 1.4773212607841464e-05,
+      "loss": 1.1066,
+      "step": 20960
+    },
+    {
+      "epoch": 1.72,
+      "learning_rate": 1.4730503117792775e-05,
+      "loss": 1.1056,
+      "step": 20970
+    },
+    {
+      "epoch": 1.72,
+      "learning_rate": 1.4687793627744084e-05,
+      "loss": 1.101,
+      "step": 20980
+    },
+    {
+      "epoch": 1.72,
+      "learning_rate": 1.4645084137695398e-05,
+      "loss": 1.1034,
+      "step": 20990
+    },
+    {
+      "epoch": 1.72,
+      "learning_rate": 1.4602374647646707e-05,
+      "loss": 1.0953,
+      "step": 21000
     }
   ],
   "max_steps": 24414,
   "num_train_epochs": 2,
+  "total_flos": 2.837232089174661e+18,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4f904905931c8a1fe154e57477d84e6e13f86ce2215774d32d1df579ae96fcbd
 size 3439

 version https://git-lfs.github.com/spec/v1
+oid sha256:6610c57ac1474bf5097bd000e69f982c66ca3a4b3ce31c1509196f6a47bc4144
 size 3439

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ff61a403b3cfb6a54ffab03f89d73788332a1bacb81b51101f34eaa479906cb3
 size 1113252715

 version https://git-lfs.github.com/spec/v1
+oid sha256:59dcfd93fbced501dd096334a41c07a4b2e21743fa787c29c4db14612e8f084f
 size 1113252715

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4f904905931c8a1fe154e57477d84e6e13f86ce2215774d32d1df579ae96fcbd
 size 3439

 version https://git-lfs.github.com/spec/v1
+oid sha256:6610c57ac1474bf5097bd000e69f982c66ca3a4b3ce31c1509196f6a47bc4144
 size 3439