dima806 committed on
Commit
3dbad02
1 Parent(s): 67227a1

Upload folder using huggingface_hub

Browse files
checkpoint-3571/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c9d79a31dfd6cc06d7b238be742f88936198c7eee75656dd34ae40a20abb172
3
  size 343223968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b38e7d3de2be44b224cb4cffe881a0c4b75f7283c5d4a2017fbadd58bd41fdef
3
  size 343223968
checkpoint-3571/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bfc71d18a94aa67c691a6d2b42ea911711e1200bc1ace883a77a8f1c2bebe06c
3
  size 686568453
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f79103d18f35fce10ed3263f681c4583d0852f6a22a308dc9202b63818c1675c
3
  size 686568453
checkpoint-3571/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d8ae862eb872ca63527a4196c92bcd9af2aa0565512f1d314a5f0e3bed16f6f
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb0c7d2df9e3c7eddd2ddf2bb0658eca3700ed3c06e49ec653e14f162ce50e2c
3
  size 627
checkpoint-3571/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.022927358746528625,
3
  "best_model_checkpoint": "deepfake_vs_real_image_detection/checkpoint-3571",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,67 +10,67 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.14,
13
- "grad_norm": 0.26625385880470276,
14
- "learning_rate": 8.721953990343652e-07,
15
- "loss": 0.0944,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.28,
20
- "grad_norm": 0.4247075319290161,
21
- "learning_rate": 7.301902868503266e-07,
22
- "loss": 0.0715,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.42,
27
- "grad_norm": 7.891324520111084,
28
- "learning_rate": 5.881851746662879e-07,
29
- "loss": 0.069,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.56,
34
- "grad_norm": 6.847803115844727,
35
- "learning_rate": 4.461800624822493e-07,
36
- "loss": 0.0658,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.7,
41
- "grad_norm": 2.0988214015960693,
42
- "learning_rate": 3.041749502982107e-07,
43
- "loss": 0.0632,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.84,
48
- "grad_norm": 6.4862895011901855,
49
- "learning_rate": 1.621698381141721e-07,
50
- "loss": 0.0698,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.98,
55
- "grad_norm": 0.6512278914451599,
56
- "learning_rate": 2.0164725930133484e-08,
57
- "loss": 0.0587,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 1.0,
62
- "eval_accuracy": 0.9926865456073318,
63
- "eval_loss": 0.022927358746528625,
64
- "eval_runtime": 773.2123,
65
- "eval_samples_per_second": 98.499,
66
- "eval_steps_per_second": 12.314,
67
  "step": 3571
68
  }
69
  ],
70
  "logging_steps": 500,
71
- "max_steps": 3571,
72
  "num_input_tokens_seen": 0,
73
- "num_train_epochs": 1,
74
  "save_steps": 500,
75
  "total_flos": 8.852762385560605e+18,
76
  "train_batch_size": 32,
 
1
  {
2
+ "best_metric": 0.02310723066329956,
3
  "best_model_checkpoint": "deepfake_vs_real_image_detection/checkpoint-3571",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.14,
13
+ "grad_norm": 6.2275071144104,
14
+ "learning_rate": 9.365482233502537e-07,
15
+ "loss": 0.0626,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.28,
20
+ "grad_norm": 10.569954872131348,
21
+ "learning_rate": 8.660462492949803e-07,
22
+ "loss": 0.0574,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.42,
27
+ "grad_norm": 10.928681373596191,
28
+ "learning_rate": 7.955442752397067e-07,
29
+ "loss": 0.0657,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.56,
34
+ "grad_norm": 1.1176731586456299,
35
+ "learning_rate": 7.250423011844331e-07,
36
+ "loss": 0.0568,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.7,
41
+ "grad_norm": 9.849133491516113,
42
+ "learning_rate": 6.545403271291596e-07,
43
+ "loss": 0.0546,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.84,
48
+ "grad_norm": 2.835080862045288,
49
+ "learning_rate": 5.840383530738861e-07,
50
+ "loss": 0.0552,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.98,
55
+ "grad_norm": 0.03996190056204796,
56
+ "learning_rate": 5.135363790186125e-07,
57
+ "loss": 0.0603,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 1.0,
62
+ "eval_accuracy": 0.9927259358464305,
63
+ "eval_loss": 0.02310723066329956,
64
+ "eval_runtime": 806.2331,
65
+ "eval_samples_per_second": 94.465,
66
+ "eval_steps_per_second": 11.809,
67
  "step": 3571
68
  }
69
  ],
70
  "logging_steps": 500,
71
+ "max_steps": 7142,
72
  "num_input_tokens_seen": 0,
73
+ "num_train_epochs": 2,
74
  "save_steps": 500,
75
  "total_flos": 8.852762385560605e+18,
76
  "train_batch_size": 32,
checkpoint-3571/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:992d4bc7f07ddce259b1dd27aeca6e78641e1544cdefa763b060e959db4c8f00
3
  size 4411
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43f6d25546b8da26ab17504f529643fe71525e1a77fe75ca99c8e672a1e11a7c
3
  size 4411
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c9d79a31dfd6cc06d7b238be742f88936198c7eee75656dd34ae40a20abb172
3
  size 343223968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b38e7d3de2be44b224cb4cffe881a0c4b75f7283c5d4a2017fbadd58bd41fdef
3
  size 343223968
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:992d4bc7f07ddce259b1dd27aeca6e78641e1544cdefa763b060e959db4c8f00
3
  size 4411
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43f6d25546b8da26ab17504f529643fe71525e1a77fe75ca99c8e672a1e11a7c
3
  size 4411