sedrickkeh commited on
Commit
8a53969
·
verified ·
1 Parent(s): 51a02be

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4263bb12f6f7b00cc787ca42acd9f1e6041bdb37b46a99592b1d88d1273c92df
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f32be30d71ab482614b34cb7b9be6145b6db2ba168e6ccc0c787665f22a280d
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:065a237bd8ad8cf4066a0afbd6671f6cf69d55d76e49496adcc09264f8b3bbd6
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d54e0668796c376e3dde689708f25080420f11b6247b8030f5f573a477c961da
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b20f4b185827c975fe4e2de6775d96c941617e3f433e2eb70eade3664ee43cf
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecf2a138718acfc5cfb09c89cc5ac7ea6389b6f8b9e0bcbd686706f562551275
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a5c5a9e6108759a35e812818c4fd3367f3fc176e91d00d7c4bcb115b7790adc
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfd321f0abc60182ac54d4b174858fc24f49223ce88aba6ff17c7b3f4a2288af
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -33,3 +33,20 @@
33
  {"current_steps": 320, "total_steps": 501, "loss": 0.7196, "lr": 5e-06, "epoch": 1.9076005961251863, "percentage": 63.87, "elapsed_time": "5:12:41", "remaining_time": "2:56:51"}
34
  {"current_steps": 330, "total_steps": 501, "loss": 0.7274, "lr": 5e-06, "epoch": 1.9672131147540983, "percentage": 65.87, "elapsed_time": "5:22:20", "remaining_time": "2:47:01"}
35
  {"current_steps": 335, "total_steps": 501, "eval_loss": 0.7537275552749634, "epoch": 1.9970193740685542, "percentage": 66.87, "elapsed_time": "5:30:31", "remaining_time": "2:43:46"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  {"current_steps": 320, "total_steps": 501, "loss": 0.7196, "lr": 5e-06, "epoch": 1.9076005961251863, "percentage": 63.87, "elapsed_time": "5:12:41", "remaining_time": "2:56:51"}
34
  {"current_steps": 330, "total_steps": 501, "loss": 0.7274, "lr": 5e-06, "epoch": 1.9672131147540983, "percentage": 65.87, "elapsed_time": "5:22:20", "remaining_time": "2:47:01"}
35
  {"current_steps": 335, "total_steps": 501, "eval_loss": 0.7537275552749634, "epoch": 1.9970193740685542, "percentage": 66.87, "elapsed_time": "5:30:31", "remaining_time": "2:43:46"}
36
+ {"current_steps": 340, "total_steps": 501, "loss": 0.7213, "lr": 5e-06, "epoch": 2.0268256333830106, "percentage": 67.86, "elapsed_time": "5:36:05", "remaining_time": "2:39:08"}
37
+ {"current_steps": 350, "total_steps": 501, "loss": 0.6748, "lr": 5e-06, "epoch": 2.0864381520119224, "percentage": 69.86, "elapsed_time": "5:45:42", "remaining_time": "2:29:08"}
38
+ {"current_steps": 360, "total_steps": 501, "loss": 0.6786, "lr": 5e-06, "epoch": 2.1460506706408347, "percentage": 71.86, "elapsed_time": "5:55:20", "remaining_time": "2:19:10"}
39
+ {"current_steps": 370, "total_steps": 501, "loss": 0.6768, "lr": 5e-06, "epoch": 2.2056631892697465, "percentage": 73.85, "elapsed_time": "6:05:00", "remaining_time": "2:09:13"}
40
+ {"current_steps": 380, "total_steps": 501, "loss": 0.6779, "lr": 5e-06, "epoch": 2.2652757078986587, "percentage": 75.85, "elapsed_time": "6:14:38", "remaining_time": "1:59:17"}
41
+ {"current_steps": 390, "total_steps": 501, "loss": 0.6764, "lr": 5e-06, "epoch": 2.3248882265275705, "percentage": 77.84, "elapsed_time": "6:24:16", "remaining_time": "1:49:22"}
42
+ {"current_steps": 400, "total_steps": 501, "loss": 0.6782, "lr": 5e-06, "epoch": 2.384500745156483, "percentage": 79.84, "elapsed_time": "6:33:56", "remaining_time": "1:39:28"}
43
+ {"current_steps": 410, "total_steps": 501, "loss": 0.6723, "lr": 5e-06, "epoch": 2.444113263785395, "percentage": 81.84, "elapsed_time": "6:43:35", "remaining_time": "1:29:34"}
44
+ {"current_steps": 420, "total_steps": 501, "loss": 0.6771, "lr": 5e-06, "epoch": 2.503725782414307, "percentage": 83.83, "elapsed_time": "6:53:13", "remaining_time": "1:19:41"}
45
+ {"current_steps": 430, "total_steps": 501, "loss": 0.6772, "lr": 5e-06, "epoch": 2.563338301043219, "percentage": 85.83, "elapsed_time": "7:02:51", "remaining_time": "1:09:49"}
46
+ {"current_steps": 440, "total_steps": 501, "loss": 0.6771, "lr": 5e-06, "epoch": 2.6229508196721314, "percentage": 87.82, "elapsed_time": "7:12:30", "remaining_time": "0:59:57"}
47
+ {"current_steps": 450, "total_steps": 501, "loss": 0.6777, "lr": 5e-06, "epoch": 2.682563338301043, "percentage": 89.82, "elapsed_time": "7:22:08", "remaining_time": "0:50:06"}
48
+ {"current_steps": 460, "total_steps": 501, "loss": 0.6745, "lr": 5e-06, "epoch": 2.742175856929955, "percentage": 91.82, "elapsed_time": "7:31:48", "remaining_time": "0:40:16"}
49
+ {"current_steps": 470, "total_steps": 501, "loss": 0.6781, "lr": 5e-06, "epoch": 2.8017883755588673, "percentage": 93.81, "elapsed_time": "7:41:27", "remaining_time": "0:30:26"}
50
+ {"current_steps": 480, "total_steps": 501, "loss": 0.6794, "lr": 5e-06, "epoch": 2.8614008941877795, "percentage": 95.81, "elapsed_time": "7:51:06", "remaining_time": "0:20:36"}
51
+ {"current_steps": 490, "total_steps": 501, "loss": 0.6742, "lr": 5e-06, "epoch": 2.9210134128166914, "percentage": 97.8, "elapsed_time": "8:00:45", "remaining_time": "0:10:47"}
52
+ {"current_steps": 500, "total_steps": 501, "loss": 0.6854, "lr": 5e-06, "epoch": 2.9806259314456036, "percentage": 99.8, "elapsed_time": "8:10:22", "remaining_time": "0:00:58"}