jasmeeetsingh committed on
Commit
5dc6dba
·
1 Parent(s): ea47a6f

Training in progress, step 11000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1369b02d89701e28f033efb1fdfba6cd30f8ada70562c93809d9883be5b9de7
3
  size 2384440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c759ebf82040d6924a05c3ef4316882f71fdfc5e1b34d803d1cf5e7f577947dc
3
  size 2384440
last-checkpoint/global_step11000/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b61da4166d8014dfc824de70e94cd75e218a43aec48d563e391be2fdb8c64ad
3
+ size 3621285613
last-checkpoint/global_step11000/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c76796e0a5ad1b2741e9392873ac8fcd56fcd71393acdc19edd39fe901f98068
3
+ size 3542398
last-checkpoint/global_step11000/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe8299be7845efef45ca9388efd063c06646f5b0c0a5b383be3474ace2312202
3
+ size 3621285613
last-checkpoint/global_step11000/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c76286844f2e286577df0d98e4eb162c2424b7191d7a984fbcb663b5605cb436
3
+ size 3542398
last-checkpoint/global_step11000/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:991b3b749cca321f674ff5c8a87595c63e8a384a6eb2babd2ce9161a0479015b
3
+ size 3621285613
last-checkpoint/global_step11000/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92651aafa0d65b5221500ecd6317d6fbbeb6da3f3b19bad754f5a14adc0e1a55
3
+ size 3542398
last-checkpoint/global_step11000/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6991057ddb079a2d339379735329ec45f81b7d4122ed67df36e1a4b2cfc3b2e8
3
+ size 3621285613
last-checkpoint/global_step11000/zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bca9b920a2267bcce9d4e6237f4f19c59724abc2834eb2785811e14292717b1b
3
+ size 3542398
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step10000
 
1
+ global_step11000
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cfa02571e999b30d0d68db203d90860835ed576add579d94609958c91e7b09a3
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52a13920852463d3760190660bdbe29994e27158b7378d417b535b5ef21324ea
3
  size 17655
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5c248e07247a95e6c83e8ae323322b82a1e853159d5005510e323c697c46c54
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d89e2d388155ee26c42c6125f61bfc2ba203bd49f50c360d30f1c842192bf7
3
  size 17655
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84dc7dd2db4843621003e2ea8697005b3f04a7bc93e21bbb989f813c9486dc7c
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1165af8401156c8f098205da71e41b90fedaad3a533634c223b68d0f661152b
3
  size 17655
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:585e72b3001d4cb10eaaa2d832401b7dac69a6f6d999ec8b6d8ef0d97db02ad4
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cd048a9881e1fce04ccdea656f2f647f3f1bba4b88a2f3ad6be8c37959e86e6
3
  size 17655
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 7.818608287724785,
5
  "eval_steps": 500,
6
- "global_step": 10000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -67,13 +67,19 @@
67
  "learning_rate": 0.0001,
68
  "loss": 0.3771,
69
  "step": 10000
 
 
 
 
 
 
70
  }
71
  ],
72
  "logging_steps": 1000,
73
  "max_steps": 12790,
74
  "num_train_epochs": 10,
75
  "save_steps": 1000,
76
- "total_flos": 73042358173696.0,
77
  "trial_name": null,
78
  "trial_params": null
79
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 8.600469116497264,
5
  "eval_steps": 500,
6
+ "global_step": 11000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
67
  "learning_rate": 0.0001,
68
  "loss": 0.3771,
69
  "step": 10000
70
+ },
71
+ {
72
+ "epoch": 8.6,
73
+ "learning_rate": 0.0001,
74
+ "loss": 0.371,
75
+ "step": 11000
76
  }
77
  ],
78
  "logging_steps": 1000,
79
  "max_steps": 12790,
80
  "num_train_epochs": 10,
81
  "save_steps": 1000,
82
+ "total_flos": 80322346614784.0,
83
  "trial_name": null,
84
  "trial_params": null
85
  }