naman1011 committed on
Commit
91a05ed
·
1 Parent(s): 24541ff

Training in progress, step 2000, checkpoint

Browse files
last-checkpoint/global_step2000/zero_pp_rank_0_mp_rank_00_model_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c631555bb216228fd776c70fdb0e256ee4e31d790108950abfa77b028c501d3
3
- size 3369573916
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f77aa4b2756dfa4ffe04430a21cbf190e731d9a25d70b84b6af14fdd079577ac
3
+ size 77125
last-checkpoint/global_step2000/zero_pp_rank_0_mp_rank_00_optim_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3080ba6a4f448c0f1f9e781443c976f2fd5a79ea723a6a49542f4c026632d021
3
- size 3149677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b8456ae654ac85c7fe868407ce73c183217554c658fdcc4ab255743f110e767
3
+ size 181523565
last-checkpoint/global_step2000/zero_pp_rank_1_mp_rank_00_model_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be005c1c969525d4152a78bec86f4a9dbe8b58678eb89bb1bffa0b9953b40ba3
3
- size 3369573916
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:728bb222faac3c947ca5539282b110677e3dcbc2bf7b634c4d73fc517df9b319
3
+ size 76997
last-checkpoint/global_step2000/zero_pp_rank_1_mp_rank_00_optim_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc4c18a4ef0f9857edeb68da455dc4e7080151c87a75e93f7b1ce4cbf4ab2461
3
- size 3149677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c65958d00da74a9cc659cf20ecc61919fb9685a657b21ec9101a7375c51001c3
3
+ size 181523565
last-checkpoint/global_step2000/zero_pp_rank_2_mp_rank_00_model_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7169575885257a5886f2a16d9e9ac0ec0650b4840c49e3cf46173bb490042a1f
3
- size 3369573916
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37db7f8f1c899ab6031d7b9a7a9d7f4d13c375f2e5ef89dfa01b7e672aa7ddb0
3
+ size 76997
last-checkpoint/global_step2000/zero_pp_rank_2_mp_rank_00_optim_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a397d278e62116e1535866690747e07fcc337e68d0d6a1bc83659b5bce2d0fc8
3
- size 3149677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c4c3325b64ec89ef8ed79f9b3801f51bcba3ccf24530e611e172e7155998248
3
+ size 181523565
last-checkpoint/global_step2000/zero_pp_rank_3_mp_rank_00_model_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93bf1650107328c65c26fa2f710cf3bf59bb92597b39fbc8120f97a1c8179044
3
- size 3369573916
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f97f66ab01e2047b7ee2764c66b669ecb4a6fe23c8445c4ea0aae397721c98e
3
+ size 76997
last-checkpoint/global_step2000/zero_pp_rank_3_mp_rank_00_optim_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a216e45206c382e0569c4be9c261a3ff128aafd1935e65cab66c418f586fd578
3
- size 3149677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe3a4ec221f98936dedf0ae1db8ba950a1f667b9d0013965bb835d6561d482ec
3
+ size 181523565
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step1500
 
1
+ global_step2000
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:194af0302478c97171645454a5eb846b0fc5f8e392d4e3959fa03596fc8e4026
3
  size 242070038
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17769a6403d15a70cb9712603c4ec5dd4be70332def23aa0b13ea3bda8a1a7a1
3
  size 242070038
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d3cf537aeb636d74260ac33f9ee9f5f5488cd868e57c67412d317e90d714583
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9f6b0d8f8f3c7c672a3e4ec564e590a67d25f6a49a376b2b9d0d8236bb5ca89
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f46e6b131c11a49aaf40dd0567abef518102c7a1352bb71be9e97f08d2acdd07
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:077d38406025d335a1423c2a3b5123be5c0cbb86249376bb98772d98985b4106
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af26ea8cc81928ae6c96810dd49af32aaee79970eeeea540d94edd0eded31879
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86e2e9b2214a9712f049f41b02d665d19d9548d57de7aee006787e9507288ac8
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28da90f216354525bfc6e2c4fb7d9537e9448788220df6cdda43e8d5ba71d985
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bb3902c2fcdb3573e92153da7d553c4d6b893a789269e48961d6e7c05faeacc
3
  size 15024
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 6.0,
5
  "eval_steps": 500,
6
- "global_step": 1500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -25,13 +25,19 @@
25
  "learning_rate": 0.01,
26
  "loss": 0.1689,
27
  "step": 1500
 
 
 
 
 
 
28
  }
29
  ],
30
  "logging_steps": 500,
31
  "max_steps": 2500,
32
  "num_train_epochs": 10,
33
  "save_steps": 500,
34
- "total_flos": 253548232704.0,
35
  "trial_name": null,
36
  "trial_params": null
37
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 8.0,
5
  "eval_steps": 500,
6
+ "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
25
  "learning_rate": 0.01,
26
  "loss": 0.1689,
27
  "step": 1500
28
+ },
29
+ {
30
+ "epoch": 8.0,
31
+ "learning_rate": 0.01,
32
+ "loss": 0.1537,
33
+ "step": 2000
34
  }
35
  ],
36
  "logging_steps": 500,
37
  "max_steps": 2500,
38
  "num_train_epochs": 10,
39
  "save_steps": 500,
40
+ "total_flos": 338064310272.0,
41
  "trial_name": null,
42
  "trial_params": null
43
  }