jasmeeetsingh committed on
Commit
dd5941e
·
1 Parent(s): 139a1ab

Training in progress, step 2000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3552a00edec5e3ff885856bf37262282090bb542f8d1760897ace37c5e58bbf
3
  size 2384440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fed3d0a014b7ac5bbf1f83a3a549bc3b56211d657c975c53a4f07f6dde47d01b
3
  size 2384440
last-checkpoint/global_step2000/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83a8db9056f93d8166aeb3dabf792534fee73deae21a9732cfe0be4dbc951e89
3
+ size 3621285613
last-checkpoint/global_step2000/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62466777353879028fa9199f790aca543323055373baea8f5481a394086e44ad
3
+ size 3542398
last-checkpoint/global_step2000/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b49072a49b5cf08c50b5afbc4b66502decc83d71ba3b72e39d5c1992d66e384
3
+ size 3621285613
last-checkpoint/global_step2000/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8da23ac94cc745c58226f91a78aaa9d4270963cffe2fda97e3d1ef10e386f4a
3
+ size 3542398
last-checkpoint/global_step2000/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9890a111a29adf26a2148ec38224c8dcc558785e1491da276c00b622defde960
3
+ size 3621285613
last-checkpoint/global_step2000/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9bcbe6c9f2ee4ad9118a6ef11427e612f7201233ce70829463bd79630fd8b72
3
+ size 3542398
last-checkpoint/global_step2000/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:613b8488c940aef26b63d29a51b45f2cb0a8d150bb0c26fe859aa40728877a49
3
+ size 3621285613
last-checkpoint/global_step2000/zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ca8cf67963e6c43e10b8e779d985cafcfb4ff01e3dcbbe5fbfb804eed5f03b0
3
+ size 3542398
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step1000
 
1
+ global_step2000
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f441efbee3751a48833c647ff7d9a17d0114136b3ca4f2bafd39cf7bd78767c
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6978e908c92772fe19c7d622c0523251d41ab05aaef529e7acd2caf4d0eafcb5
3
  size 17655
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cb547d05ff943109defb3515810f7a467d12cc0d4cc7b6de3b6c232503fe80d
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e3cd3cde36f4529c33ca348673132abd387870ddc25d7664ce7bed468955d89
3
  size 17655
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d539268bb0b2ffae38169e0f3b017e8c70f43c956e06e386aa3765f6857b15d8
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1d69d053ab98fad68ae2c8253970f3b7496f23830112d8923e49b3ccba17590
3
  size 17655
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d1f517289c7a91414eb73765e692a98606f4b5b073550a2851d53f1b603795b
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec44e66877bdf688eefe2444b516fec47140ba260f54ef402b4b8193b6a7f35b
3
  size 17655
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.7818608287724785,
5
  "eval_steps": 500,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -13,13 +13,19 @@
13
  "learning_rate": 0.0001,
14
  "loss": 0.6904,
15
  "step": 1000
 
 
 
 
 
 
16
  }
17
  ],
18
  "logging_steps": 1000,
19
  "max_steps": 12790,
20
  "num_train_epochs": 10,
21
  "save_steps": 1000,
22
- "total_flos": 7272076410880.0,
23
  "trial_name": null,
24
  "trial_params": null
25
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.5637216575449568,
5
  "eval_steps": 500,
6
+ "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
13
  "learning_rate": 0.0001,
14
  "loss": 0.6904,
15
  "step": 1000
16
+ },
17
+ {
18
+ "epoch": 1.56,
19
+ "learning_rate": 0.0001,
20
+ "loss": 0.5373,
21
+ "step": 2000
22
  }
23
  ],
24
  "logging_steps": 1000,
25
  "max_steps": 12790,
26
  "num_train_epochs": 10,
27
  "save_steps": 1000,
28
+ "total_flos": 14607257174016.0,
29
  "trial_name": null,
30
  "trial_params": null
31
  }