Transformers
PyTorch
English
pixel
pretraining
plip commited on
Commit
ab34e00
·
1 Parent(s): 4d3b7a9

Training in progress, step 660000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa92f0e8b9e69e1553d8b13a15bb13ce9949137fccf0723c1cf598ce83f198b0
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d1b9c3dadef4c83eaa6444ae31d8e46ec85073c61b37dd61844f05913236e16
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b48d3a0bd417c9af2fc7e229c4f39167675dca2415013cbeac1e6dc95824f669
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2fc5b645a51764da4f8ff98e3c407a8e3b54b7f2ebf4044514e81a387a44685
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e055e902e7363a164e2d5682ba553c77cec859581fb13cd45150bf96f1a362c
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdc9f2d6c7b188b0a4e60257b0a8bd84c335d50dfde13a7917d3ec48da9a1694
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:436765cf8b9dcd2a96469489c52342b1fc2a8edf0ab7af7b53c1cbd1ff9932a6
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f55bf132d9f9827e3128928d8dd16bab60642cd4846a79818e1304f0d9048138
3
+ size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ee8f18ff63c361ce90d137b232b2607444382342857d71c811d9abe82e89eeb
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c250144fe49ffdfe7647f695a0d687d07a9a35cdce7fa106343ed4f42beb24af
3
+ size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:106d03af9d874407e7a0086ddb94edb099a500fa25e66c11a4dedce8d45fc7e2
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d99a97fa7df68e7130dee285dc72156e57930a619ecb49b136dff7611919aa2
3
+ size 14439
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b544465929a51046e9a52e629bd463b9098d69ff8cc60ad2e18003214dae8858
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e668d5f010f36e9bc3681300c074ae1cd82ec8d3466f5c0bcb0eb7c6db53f6b
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 9.925634095316628,
5
- "global_step": 650000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -4816,11 +4816,85 @@
4816
  "eval_samples_per_second": 965.164,
4817
  "eval_steps_per_second": 15.443,
4818
  "step": 650000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4819
  }
4820
  ],
4821
  "max_steps": 1000000,
4822
  "num_train_epochs": 16,
4823
- "total_flos": 4.556511053359226e+22,
4824
  "trial_name": null,
4825
  "trial_params": null
4826
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 10.078336158321498,
5
+ "global_step": 660000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
4816
  "eval_samples_per_second": 965.164,
4817
  "eval_steps_per_second": 15.443,
4818
  "step": 650000
4819
+ },
4820
+ {
4821
+ "epoch": 9.94,
4822
+ "learning_rate": 5.166948591359489e-05,
4823
+ "loss": 0.2493,
4824
+ "step": 651000
4825
+ },
4826
+ {
4827
+ "epoch": 9.96,
4828
+ "learning_rate": 5.145796137086076e-05,
4829
+ "loss": 0.2493,
4830
+ "step": 652000
4831
+ },
4832
+ {
4833
+ "epoch": 9.97,
4834
+ "learning_rate": 5.124674895928823e-05,
4835
+ "loss": 0.2493,
4836
+ "step": 653000
4837
+ },
4838
+ {
4839
+ "epoch": 9.99,
4840
+ "learning_rate": 5.103585098866237e-05,
4841
+ "loss": 0.2491,
4842
+ "step": 654000
4843
+ },
4844
+ {
4845
+ "epoch": 10.0,
4846
+ "learning_rate": 5.082526976532968e-05,
4847
+ "loss": 0.249,
4848
+ "step": 655000
4849
+ },
4850
+ {
4851
+ "epoch": 10.0,
4852
+ "eval_runtime": 1.0267,
4853
+ "eval_samples_per_second": 974.027,
4854
+ "eval_steps_per_second": 15.584,
4855
+ "step": 655000
4856
+ },
4857
+ {
4858
+ "epoch": 10.02,
4859
+ "learning_rate": 5.061500759217261e-05,
4860
+ "loss": 0.2494,
4861
+ "step": 656000
4862
+ },
4863
+ {
4864
+ "epoch": 10.03,
4865
+ "learning_rate": 5.04050667685846e-05,
4866
+ "loss": 0.2487,
4867
+ "step": 657000
4868
+ },
4869
+ {
4870
+ "epoch": 10.05,
4871
+ "learning_rate": 5.01954495904449e-05,
4872
+ "loss": 0.2485,
4873
+ "step": 658000
4874
+ },
4875
+ {
4876
+ "epoch": 10.06,
4877
+ "learning_rate": 4.998615835009339e-05,
4878
+ "loss": 0.2488,
4879
+ "step": 659000
4880
+ },
4881
+ {
4882
+ "epoch": 10.08,
4883
+ "learning_rate": 4.97771953363055e-05,
4884
+ "loss": 0.2489,
4885
+ "step": 660000
4886
+ },
4887
+ {
4888
+ "epoch": 10.08,
4889
+ "eval_runtime": 1.0445,
4890
+ "eval_samples_per_second": 957.361,
4891
+ "eval_steps_per_second": 15.318,
4892
+ "step": 660000
4893
  }
4894
  ],
4895
  "max_steps": 1000000,
4896
  "num_train_epochs": 16,
4897
+ "total_flos": 4.626610657321424e+22,
4898
  "trial_name": null,
4899
  "trial_params": null
4900
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b48d3a0bd417c9af2fc7e229c4f39167675dca2415013cbeac1e6dc95824f669
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2fc5b645a51764da4f8ff98e3c407a8e3b54b7f2ebf4044514e81a387a44685
3
  size 449471589