upload ViV1T model checkpoints, each trained with a different seed.
Browse files
- 001/args.yaml +87 -0
- 001/ckpt/model_state.pt +3 -0
- 001/evaluation.yaml +3 -0
- 001/model.txt +143 -0
- 001/output.log +816 -0
- 002/args.yaml +87 -0
- 002/ckpt/model_state.pt +3 -0
- 002/evaluation.yaml +3 -0
- 002/model.txt +143 -0
- 002/output.log +942 -0
- 003/args.yaml +87 -0
- 003/ckpt/model_state.pt +3 -0
- 003/evaluation.yaml +3 -0
- 003/model.txt +143 -0
- 003/output.log +789 -0
- 004/args.yaml +87 -0
- 004/ckpt/model_state.pt +3 -0
- 004/evaluation.yaml +3 -0
- 004/model.txt +143 -0
- 004/output.log +770 -0
- 005/args.yaml +87 -0
- 005/ckpt/model_state.pt +3 -0
- 005/evaluation.yaml +3 -0
- 005/model.txt +143 -0
- 005/output.log +822 -0
001/args.yaml
ADDED
@@ -0,0 +1,87 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
adam_beta1: 0.9
|
2 |
+
adam_beta2: 0.999
|
3 |
+
adam_eps: 1e-08
|
4 |
+
batch_size: 6
|
5 |
+
cache_data: false
|
6 |
+
center_crop: 1.0
|
7 |
+
clear_output_dir: true
|
8 |
+
core: vivit
|
9 |
+
core_behavior_mode: 2
|
10 |
+
core_compile: false
|
11 |
+
core_drop_path: 0.0505
|
12 |
+
core_emb_dim: 112
|
13 |
+
core_ff_activation: gelu
|
14 |
+
core_ff_dropout: 0.0592
|
15 |
+
core_flash_attention: 1
|
16 |
+
core_head_dim: 48
|
17 |
+
core_lr: 0.0048
|
18 |
+
core_mha_dropout: 0.358
|
19 |
+
core_mlp_dim: 136
|
20 |
+
core_norm_qk: false
|
21 |
+
core_num_heads: 11
|
22 |
+
core_p_dropout: 0.1338
|
23 |
+
core_parallel_attention: true
|
24 |
+
core_patch_mode: 0
|
25 |
+
core_pos_encoding: 3
|
26 |
+
core_spatial_depth: 3
|
27 |
+
core_spatial_patch_size: 7
|
28 |
+
core_spatial_patch_stride: 2
|
29 |
+
core_temporal_depth: 5
|
30 |
+
core_temporal_patch_size: 25
|
31 |
+
core_temporal_patch_stride: 1
|
32 |
+
core_weight_decay: 0.1789
|
33 |
+
criterion: poisson_correlation
|
34 |
+
critic_mode: 0
|
35 |
+
crop_frame: 140
|
36 |
+
data: /home/storage/sensorium
|
37 |
+
deterministic: false
|
38 |
+
device: cuda
|
39 |
+
dpi: 120
|
40 |
+
ds_mode: 3
|
41 |
+
ds_scale: 1
|
42 |
+
epochs: 400
|
43 |
+
format: svg
|
44 |
+
git_hash: 1033c29
|
45 |
+
grad_checkpointing: 0
|
46 |
+
grad_norm: null
|
47 |
+
input_shapes:
|
48 |
+
behavior: [2, 140]
|
49 |
+
pupil_center: [2, 140]
|
50 |
+
video: [1, 140, 36, 64]
|
51 |
+
limit_data: null
|
52 |
+
lr: 0.0036
|
53 |
+
max_frame: 300
|
54 |
+
micro_batch_size: 6
|
55 |
+
modulator_mode: 0
|
56 |
+
mouse_ids: [A, B, C, D, E, F, G, H, I, J]
|
57 |
+
num_workers: 2
|
58 |
+
output_dir: /home/storage/runs/001
|
59 |
+
output_mode: 1
|
60 |
+
output_shapes:
|
61 |
+
A: [7440, 140]
|
62 |
+
B: [7928, 140]
|
63 |
+
C: [8285, 140]
|
64 |
+
D: [7671, 140]
|
65 |
+
E: [7495, 140]
|
66 |
+
F: [7863, 140]
|
67 |
+
G: [7908, 140]
|
68 |
+
H: [8202, 140]
|
69 |
+
I: [7939, 140]
|
70 |
+
J: [8122, 140]
|
71 |
+
precision: "32"
|
72 |
+
pretrain_core: null
|
73 |
+
readout: gaussian2d
|
74 |
+
readout_bias_mode: 2
|
75 |
+
readout_dropout: 0.0
|
76 |
+
readout_grid_mode: 1
|
77 |
+
restore: null
|
78 |
+
save_plots: false
|
79 |
+
seed: 2
|
80 |
+
shifter_layers: 3
|
81 |
+
shifter_mode: 1
|
82 |
+
shifter_size: 5
|
83 |
+
stat_mode: 1
|
84 |
+
trainable_params: 12278365
|
85 |
+
transform_mode: 2
|
86 |
+
verbose: 1
|
87 |
+
weight_decay: 0.3939
|
001/ckpt/model_state.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86ee492503a0f995686aba27eb0db7f8d759dd2c4b491a692740b3be3241f14a
|
3 |
+
size 148268583
|
001/evaluation.yaml
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
validation: {A: 0.24868205189704895, B: 0.2788656949996948, C: 0.271991103887558,
|
2 |
+
D: 0.2340584099292755, E: 0.23670722544193268, F: 0.23395685851573944, G: 0.25554871559143066,
|
3 |
+
H: 0.23508135974407196, I: 0.25329142808914185, J: 0.2589012682437897, average: 0.25070841163396834}
|
001/model.txt
ADDED
@@ -0,0 +1,143 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
=======================================================================================================================================
|
2 |
+
Layer (type:depth-idx) Input Shape Output Shape Param #
|
3 |
+
=======================================================================================================================================
|
4 |
+
Model -- [1, 7440, 116] --
|
5 |
+
├─ViViTCore: 1-1 -- [1, 112, 116, 15, 29] --
|
6 |
+
│ └─ViViT: 2-1 [1, 5, 140, 36, 64] [1, 112, 116, 15, 29] --
|
7 |
+
│ │ └─Tokenizer: 3-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] 79,632
|
8 |
+
│ │ │ └─Sequential: 4-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] --
|
9 |
+
│ │ │ │ └─Unfold3d: 5-1 [1, 5, 140, 36, 64] [1, 116, 435, 6125] --
|
10 |
+
│ │ │ │ └─LayerNorm: 5-2 [1, 116, 435, 6125] [1, 116, 435, 6125] 12,250
|
11 |
+
│ │ │ │ └─Linear: 5-3 [1, 116, 435, 6125] [1, 116, 435, 112] 686,112
|
12 |
+
│ │ │ │ └─LayerNorm: 5-4 [1, 116, 435, 112] [1, 116, 435, 112] 224
|
13 |
+
│ │ │ │ └─Dropout: 5-5 [1, 116, 435, 112] [1, 116, 435, 112] --
|
14 |
+
│ │ └─Transformer: 3-2 [116, 435, 112] [116, 435, 112] --
|
15 |
+
│ │ │ └─ModuleList: 4-2 -- -- --
|
16 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-6 [116, 435, 112] [116, 435, 112] --
|
17 |
+
│ │ │ │ │ └─LayerNorm: 6-1 [116, 435, 112] [116, 435, 112] 224
|
18 |
+
│ │ │ │ │ └─Linear: 6-2 [116, 435, 112] [116, 435, 1720] 192,640
|
19 |
+
│ │ │ │ │ └─Linear: 6-3 [116, 435, 528] [116, 435, 112] 59,136
|
20 |
+
│ │ │ │ │ └─DropPath: 6-4 [116, 435, 112] [116, 435, 112] --
|
21 |
+
│ │ │ │ │ └─Sequential: 6-5 [116, 435, 136] [116, 435, 112] --
|
22 |
+
│ │ │ │ │ │ └─GELU: 7-1 [116, 435, 136] [116, 435, 136] --
|
23 |
+
│ │ │ │ │ │ └─Dropout: 7-2 [116, 435, 136] [116, 435, 136] --
|
24 |
+
│ │ │ │ │ │ └─Linear: 7-3 [116, 435, 136] [116, 435, 112] 15,232
|
25 |
+
│ │ │ │ │ └─DropPath: 6-6 [116, 435, 112] [116, 435, 112] --
|
26 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-7 [116, 435, 112] [116, 435, 112] --
|
27 |
+
│ │ │ │ │ └─LayerNorm: 6-7 [116, 435, 112] [116, 435, 112] 224
|
28 |
+
│ │ │ │ │ └─Linear: 6-8 [116, 435, 112] [116, 435, 1720] 192,640
|
29 |
+
│ │ │ │ │ └─Linear: 6-9 [116, 435, 528] [116, 435, 112] 59,136
|
30 |
+
│ │ │ │ │ └─DropPath: 6-10 [116, 435, 112] [116, 435, 112] --
|
31 |
+
│ │ │ │ │ └─Sequential: 6-11 [116, 435, 136] [116, 435, 112] --
|
32 |
+
│ │ │ │ │ │ └─GELU: 7-4 [116, 435, 136] [116, 435, 136] --
|
33 |
+
│ │ │ │ │ │ └─Dropout: 7-5 [116, 435, 136] [116, 435, 136] --
|
34 |
+
│ │ │ │ │ │ └─Linear: 7-6 [116, 435, 136] [116, 435, 112] 15,232
|
35 |
+
│ │ │ │ │ └─DropPath: 6-12 [116, 435, 112] [116, 435, 112] --
|
36 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-8 [116, 435, 112] [116, 435, 112] --
|
37 |
+
│ │ │ │ │ └─LayerNorm: 6-13 [116, 435, 112] [116, 435, 112] 224
|
38 |
+
│ │ │ │ │ └─Linear: 6-14 [116, 435, 112] [116, 435, 1720] 192,640
|
39 |
+
│ │ │ │ │ └─Linear: 6-15 [116, 435, 528] [116, 435, 112] 59,136
|
40 |
+
│ │ │ │ │ └─DropPath: 6-16 [116, 435, 112] [116, 435, 112] --
|
41 |
+
│ │ │ │ │ └─Sequential: 6-17 [116, 435, 136] [116, 435, 112] --
|
42 |
+
│ │ │ │ │ │ └─GELU: 7-7 [116, 435, 136] [116, 435, 136] --
|
43 |
+
│ │ │ │ │ │ └─Dropout: 7-8 [116, 435, 136] [116, 435, 136] --
|
44 |
+
│ │ │ │ │ │ └─Linear: 7-9 [116, 435, 136] [116, 435, 112] 15,232
|
45 |
+
│ │ │ │ │ └─DropPath: 6-18 [116, 435, 112] [116, 435, 112] --
|
46 |
+
│ │ └─Transformer: 3-3 [435, 116, 112] [435, 116, 112] --
|
47 |
+
│ │ │ └─ModuleList: 4-3 -- -- --
|
48 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-9 [435, 116, 112] [435, 116, 112] --
|
49 |
+
│ │ │ │ │ └─LayerNorm: 6-19 [435, 116, 112] [435, 116, 112] 224
|
50 |
+
│ │ │ │ │ └─Linear: 6-20 [435, 116, 112] [435, 116, 1720] 192,640
|
51 |
+
│ │ │ │ │ └─Linear: 6-21 [435, 116, 528] [435, 116, 112] 59,136
|
52 |
+
│ │ │ │ │ └─DropPath: 6-22 [435, 116, 112] [435, 116, 112] --
|
53 |
+
│ │ │ │ │ └─Sequential: 6-23 [435, 116, 136] [435, 116, 112] --
|
54 |
+
│ │ │ │ │ │ └─GELU: 7-10 [435, 116, 136] [435, 116, 136] --
|
55 |
+
│ │ │ │ │ │ └─Dropout: 7-11 [435, 116, 136] [435, 116, 136] --
|
56 |
+
│ │ │ │ │ │ └─Linear: 7-12 [435, 116, 136] [435, 116, 112] 15,232
|
57 |
+
│ │ │ │ │ └─DropPath: 6-24 [435, 116, 112] [435, 116, 112] --
|
58 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-10 [435, 116, 112] [435, 116, 112] --
|
59 |
+
│ │ │ │ │ └─LayerNorm: 6-25 [435, 116, 112] [435, 116, 112] 224
|
60 |
+
│ │ │ │ │ └─Linear: 6-26 [435, 116, 112] [435, 116, 1720] 192,640
|
61 |
+
│ │ │ │ │ └─Linear: 6-27 [435, 116, 528] [435, 116, 112] 59,136
|
62 |
+
│ │ │ │ │ └─DropPath: 6-28 [435, 116, 112] [435, 116, 112] --
|
63 |
+
│ │ │ │ │ └─Sequential: 6-29 [435, 116, 136] [435, 116, 112] --
|
64 |
+
│ │ │ │ │ │ └─GELU: 7-13 [435, 116, 136] [435, 116, 136] --
|
65 |
+
│ │ │ │ │ │ └─Dropout: 7-14 [435, 116, 136] [435, 116, 136] --
|
66 |
+
│ │ │ │ │ │ └─Linear: 7-15 [435, 116, 136] [435, 116, 112] 15,232
|
67 |
+
│ │ │ │ │ └─DropPath: 6-30 [435, 116, 112] [435, 116, 112] --
|
68 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-11 [435, 116, 112] [435, 116, 112] --
|
69 |
+
│ │ │ │ │ └─LayerNorm: 6-31 [435, 116, 112] [435, 116, 112] 224
|
70 |
+
│ │ │ │ │ └─Linear: 6-32 [435, 116, 112] [435, 116, 1720] 192,640
|
71 |
+
│ │ │ │ │ └─Linear: 6-33 [435, 116, 528] [435, 116, 112] 59,136
|
72 |
+
│ │ │ │ │ └─DropPath: 6-34 [435, 116, 112] [435, 116, 112] --
|
73 |
+
│ │ │ │ │ └─Sequential: 6-35 [435, 116, 136] [435, 116, 112] --
|
74 |
+
│ │ │ │ │ │ └─GELU: 7-16 [435, 116, 136] [435, 116, 136] --
|
75 |
+
│ │ │ │ │ │ └─Dropout: 7-17 [435, 116, 136] [435, 116, 136] --
|
76 |
+
│ │ │ │ │ │ └─Linear: 7-18 [435, 116, 136] [435, 116, 112] 15,232
|
77 |
+
│ │ │ │ │ └─DropPath: 6-36 [435, 116, 112] [435, 116, 112] --
|
78 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-12 [435, 116, 112] [435, 116, 112] --
|
79 |
+
│ │ │ │ │ └─LayerNorm: 6-37 [435, 116, 112] [435, 116, 112] 224
|
80 |
+
│ │ │ │ │ └─Linear: 6-38 [435, 116, 112] [435, 116, 1720] 192,640
|
81 |
+
│ │ │ │ │ └─Linear: 6-39 [435, 116, 528] [435, 116, 112] 59,136
|
82 |
+
│ │ │ │ │ └─DropPath: 6-40 [435, 116, 112] [435, 116, 112] --
|
83 |
+
│ │ │ │ │ └─Sequential: 6-41 [435, 116, 136] [435, 116, 112] --
|
84 |
+
│ │ │ │ │ │ └─GELU: 7-19 [435, 116, 136] [435, 116, 136] --
|
85 |
+
│ │ │ │ │ │ └─Dropout: 7-20 [435, 116, 136] [435, 116, 136] --
|
86 |
+
│ │ │ │ │ │ └─Linear: 7-21 [435, 116, 136] [435, 116, 112] 15,232
|
87 |
+
│ │ │ │ │ └─DropPath: 6-42 [435, 116, 112] [435, 116, 112] --
|
88 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-13 [435, 116, 112] [435, 116, 112] --
|
89 |
+
│ │ │ │ │ └─LayerNorm: 6-43 [435, 116, 112] [435, 116, 112] 224
|
90 |
+
│ │ │ │ │ └─Linear: 6-44 [435, 116, 112] [435, 116, 1720] 192,640
|
91 |
+
│ │ │ │ │ └─Linear: 6-45 [435, 116, 528] [435, 116, 112] 59,136
|
92 |
+
│ │ │ │ │ └─DropPath: 6-46 [435, 116, 112] [435, 116, 112] --
|
93 |
+
│ │ │ │ │ └─Sequential: 6-47 [435, 116, 136] [435, 116, 112] --
|
94 |
+
│ │ │ │ │ │ └─GELU: 7-22 [435, 116, 136] [435, 116, 136] --
|
95 |
+
│ │ │ │ │ │ └─Dropout: 7-23 [435, 116, 136] [435, 116, 136] --
|
96 |
+
│ │ │ │ │ │ └─Linear: 7-24 [435, 116, 136] [435, 116, 112] 15,232
|
97 |
+
│ │ │ │ │ └─DropPath: 6-48 [435, 116, 112] [435, 116, 112] --
|
98 |
+
│ │ └─Rearrange: 3-4 [1, 116, 435, 112] [1, 112, 116, 15, 29] --
|
99 |
+
├─MLPShifters: 1-2 -- [1, 2, 116] 513
|
100 |
+
│ └─MLPShifter: 2-2 [116, 2] [116, 2] --
|
101 |
+
│ │ └─Sequential: 3-5 [116, 2] [116, 2] --
|
102 |
+
│ │ │ └─Linear: 4-4 [116, 2] [116, 5] 15
|
103 |
+
│ │ │ └─Tanh: 4-5 [116, 5] [116, 5] --
|
104 |
+
│ │ │ └─Linear: 4-6 [116, 5] [116, 5] 30
|
105 |
+
│ │ │ └─Tanh: 4-7 [116, 5] [116, 5] --
|
106 |
+
│ │ │ └─Linear: 4-8 [116, 5] [116, 2] 12
|
107 |
+
│ │ │ └─Tanh: 4-9 [116, 2] [116, 2] --
|
108 |
+
├─Readouts: 1-3 [1, 112, 116, 15, 29] [1, 7440, 116] 8,477,649
|
109 |
+
│ └─Gaussian2DReadout2: 2-3 [1, 112, 116, 15, 29] [1, 7440, 116] 870,480
|
110 |
+
│ │ └─Sequential: 3-6 [7440, 2] [7440, 2] --
|
111 |
+
│ │ │ └─Linear: 4-10 [7440, 2] [7440, 30] 90
|
112 |
+
│ │ │ └─ELU: 4-11 [7440, 30] [7440, 30] --
|
113 |
+
│ │ │ └─Linear: 4-12 [7440, 30] [7440, 2] 62
|
114 |
+
│ │ │ └─Tanh: 4-13 [7440, 2] [7440, 2] --
|
115 |
+
│ │ └─Sequential: 3-7 [7440, 2] [7440, 2] (recursive)
|
116 |
+
│ │ │ └─Linear: 4-14 [7440, 2] [7440, 30] (recursive)
|
117 |
+
│ │ │ └─ELU: 4-15 [7440, 30] [7440, 30] --
|
118 |
+
│ │ │ └─Linear: 4-16 [7440, 30] [7440, 2] (recursive)
|
119 |
+
│ │ │ └─Tanh: 4-17 [7440, 2] [7440, 2] --
|
120 |
+
│ │ └─Sequential: 3-8 [7440, 2] [7440, 2] (recursive)
|
121 |
+
│ │ │ └─Linear: 4-18 [7440, 2] [7440, 30] (recursive)
|
122 |
+
│ │ │ └─ELU: 4-19 [7440, 30] [7440, 30] --
|
123 |
+
│ │ │ └─Linear: 4-20 [7440, 30] [7440, 2] (recursive)
|
124 |
+
│ │ │ └─Tanh: 4-21 [7440, 2] [7440, 2] --
|
125 |
+
│ │ └─Sequential: 3-9 [116, 4] [116, 112] --
|
126 |
+
│ │ │ └─Linear: 4-22 [116, 4] [116, 112] 560
|
127 |
+
│ │ │ └─LayerNorm: 4-23 [116, 112] [116, 112] 224
|
128 |
+
│ │ │ └─GELU: 4-24 [116, 112] [116, 112] --
|
129 |
+
│ │ │ └─Dropout: 4-25 [116, 112] [116, 112] --
|
130 |
+
│ │ │ └─Linear: 4-26 [116, 112] [116, 112] 12,656
|
131 |
+
│ │ │ └─Tanh: 4-27 [116, 112] [116, 112] --
|
132 |
+
├─Exponential: 1-4 [1, 7440, 116] [1, 7440, 116] --
|
133 |
+
=======================================================================================================================================
|
134 |
+
Total params: 12,278,365
|
135 |
+
Trainable params: 12,278,365
|
136 |
+
Non-trainable params: 0
|
137 |
+
Total mult-adds (Units.MEGABYTES): 679.88
|
138 |
+
=======================================================================================================================================
|
139 |
+
Input size (MB): 1.29
|
140 |
+
Forward/backward pass size (MB): 9208.73
|
141 |
+
Params size (MB): 11.40
|
142 |
+
Estimated Total Size (MB): 9221.42
|
143 |
+
=======================================================================================================================================
|
001/output.log
ADDED
@@ -0,0 +1,816 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Use bfloat16 for core module.
|
2 |
+
Use parallel attention and MLP in ViViT.
|
3 |
+
|
4 |
+
Epoch 001/400
|
5 |
+
Train loss: 113924008.00 correlation: 0.0107
|
6 |
+
Validation loss: 200107760.00 correlation: 0.0263
|
7 |
+
Elapse: 605.46s
|
8 |
+
|
9 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
10 |
+
|
11 |
+
Epoch 002/400
|
12 |
+
Train loss: 97896768.00 correlation: 0.0340
|
13 |
+
Validation loss: 199235856.00 correlation: 0.0378
|
14 |
+
Elapse: 556.86s
|
15 |
+
|
16 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
17 |
+
|
18 |
+
Epoch 003/400
|
19 |
+
Train loss: 96883144.00 correlation: 0.0443
|
20 |
+
Validation loss: 198767200.00 correlation: 0.0405
|
21 |
+
Elapse: 560.31s
|
22 |
+
|
23 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
24 |
+
|
25 |
+
Epoch 004/400
|
26 |
+
Train loss: 96317000.00 correlation: 0.0499
|
27 |
+
Validation loss: 198194576.00 correlation: 0.0449
|
28 |
+
Elapse: 560.78s
|
29 |
+
|
30 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
31 |
+
|
32 |
+
Epoch 005/400
|
33 |
+
Train loss: 95592096.00 correlation: 0.0577
|
34 |
+
Validation loss: 197382576.00 correlation: 0.0493
|
35 |
+
Elapse: 563.47s
|
36 |
+
|
37 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
38 |
+
|
39 |
+
Epoch 006/400
|
40 |
+
Train loss: 94455696.00 correlation: 0.0692
|
41 |
+
Validation loss: 195917728.00 correlation: 0.0602
|
42 |
+
Elapse: 565.83s
|
43 |
+
|
44 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
45 |
+
|
46 |
+
Epoch 007/400
|
47 |
+
Train loss: 93257144.00 correlation: 0.0821
|
48 |
+
Validation loss: 193956304.00 correlation: 0.0721
|
49 |
+
Elapse: 566.60s
|
50 |
+
|
51 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
52 |
+
|
53 |
+
Epoch 008/400
|
54 |
+
Train loss: 92014728.00 correlation: 0.0951
|
55 |
+
Validation loss: 192039424.00 correlation: 0.0839
|
56 |
+
Elapse: 566.05s
|
57 |
+
|
58 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
59 |
+
|
60 |
+
Epoch 009/400
|
61 |
+
Train loss: 91067848.00 correlation: 0.1053
|
62 |
+
Validation loss: 190701360.00 correlation: 0.0935
|
63 |
+
Elapse: 563.36s
|
64 |
+
|
65 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
66 |
+
|
67 |
+
Epoch 010/400
|
68 |
+
Train loss: 90106464.00 correlation: 0.1149
|
69 |
+
Validation loss: 189259712.00 correlation: 0.1026
|
70 |
+
Elapse: 562.44s
|
71 |
+
|
72 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
73 |
+
|
74 |
+
Epoch 011/400
|
75 |
+
Train loss: 89183952.00 correlation: 0.1243
|
76 |
+
Validation loss: 187589920.00 correlation: 0.1130
|
77 |
+
Elapse: 560.31s
|
78 |
+
|
79 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
80 |
+
|
81 |
+
Epoch 012/400
|
82 |
+
Train loss: 88171952.00 correlation: 0.1348
|
83 |
+
Validation loss: 186131232.00 correlation: 0.1219
|
84 |
+
Elapse: 559.08s
|
85 |
+
|
86 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
87 |
+
|
88 |
+
Epoch 013/400
|
89 |
+
Train loss: 87220088.00 correlation: 0.1442
|
90 |
+
Validation loss: 184294144.00 correlation: 0.1328
|
91 |
+
Elapse: 564.57s
|
92 |
+
|
93 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
94 |
+
|
95 |
+
Epoch 014/400
|
96 |
+
Train loss: 86305888.00 correlation: 0.1535
|
97 |
+
Validation loss: 182766432.00 correlation: 0.1425
|
98 |
+
Elapse: 564.31s
|
99 |
+
|
100 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
101 |
+
|
102 |
+
Epoch 015/400
|
103 |
+
Train loss: 85306032.00 correlation: 0.1632
|
104 |
+
Validation loss: 181567952.00 correlation: 0.1505
|
105 |
+
Elapse: 562.48s
|
106 |
+
|
107 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
108 |
+
|
109 |
+
Epoch 016/400
|
110 |
+
Train loss: 84622736.00 correlation: 0.1701
|
111 |
+
Validation loss: 180351280.00 correlation: 0.1587
|
112 |
+
Elapse: 561.75s
|
113 |
+
|
114 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
115 |
+
|
116 |
+
Epoch 017/400
|
117 |
+
Train loss: 83839824.00 correlation: 0.1780
|
118 |
+
Validation loss: 179434864.00 correlation: 0.1644
|
119 |
+
Elapse: 561.90s
|
120 |
+
|
121 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
122 |
+
|
123 |
+
Epoch 018/400
|
124 |
+
Train loss: 83213000.00 correlation: 0.1840
|
125 |
+
Validation loss: 178816208.00 correlation: 0.1695
|
126 |
+
Elapse: 562.07s
|
127 |
+
|
128 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
129 |
+
|
130 |
+
Epoch 019/400
|
131 |
+
Train loss: 82673560.00 correlation: 0.1895
|
132 |
+
Validation loss: 178169568.00 correlation: 0.1740
|
133 |
+
Elapse: 562.05s
|
134 |
+
|
135 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
136 |
+
|
137 |
+
Epoch 020/400
|
138 |
+
Train loss: 82081376.00 correlation: 0.1949
|
139 |
+
Validation loss: 177435600.00 correlation: 0.1787
|
140 |
+
Elapse: 561.87s
|
141 |
+
|
142 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
143 |
+
|
144 |
+
Epoch 021/400
|
145 |
+
Train loss: 81644440.00 correlation: 0.1992
|
146 |
+
Validation loss: 176873408.00 correlation: 0.1824
|
147 |
+
Elapse: 562.31s
|
148 |
+
|
149 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
150 |
+
|
151 |
+
Epoch 022/400
|
152 |
+
Train loss: 81300944.00 correlation: 0.2027
|
153 |
+
Validation loss: 176298464.00 correlation: 0.1855
|
154 |
+
Elapse: 562.57s
|
155 |
+
|
156 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
157 |
+
|
158 |
+
Epoch 023/400
|
159 |
+
Train loss: 80864992.00 correlation: 0.2072
|
160 |
+
Validation loss: 175630304.00 correlation: 0.1905
|
161 |
+
Elapse: 562.55s
|
162 |
+
|
163 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
164 |
+
|
165 |
+
Epoch 024/400
|
166 |
+
Train loss: 80516536.00 correlation: 0.2102
|
167 |
+
Validation loss: 175099184.00 correlation: 0.1937
|
168 |
+
Elapse: 561.74s
|
169 |
+
|
170 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
171 |
+
|
172 |
+
Epoch 025/400
|
173 |
+
Train loss: 80141312.00 correlation: 0.2140
|
174 |
+
Validation loss: 174953952.00 correlation: 0.1954
|
175 |
+
Elapse: 563.63s
|
176 |
+
|
177 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
178 |
+
|
179 |
+
Epoch 026/400
|
180 |
+
Train loss: 79914320.00 correlation: 0.2162
|
181 |
+
Validation loss: 174397456.00 correlation: 0.1975
|
182 |
+
Elapse: 563.20s
|
183 |
+
|
184 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
185 |
+
|
186 |
+
Epoch 027/400
|
187 |
+
Train loss: 79520984.00 correlation: 0.2200
|
188 |
+
Validation loss: 174134560.00 correlation: 0.2014
|
189 |
+
Elapse: 562.71s
|
190 |
+
|
191 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
192 |
+
|
193 |
+
Epoch 028/400
|
194 |
+
Train loss: 79212208.00 correlation: 0.2229
|
195 |
+
Validation loss: 173471920.00 correlation: 0.2046
|
196 |
+
Elapse: 562.79s
|
197 |
+
|
198 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
199 |
+
|
200 |
+
Epoch 029/400
|
201 |
+
Train loss: 78973040.00 correlation: 0.2252
|
202 |
+
Validation loss: 173183520.00 correlation: 0.2064
|
203 |
+
Elapse: 563.08s
|
204 |
+
|
205 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
206 |
+
|
207 |
+
Epoch 030/400
|
208 |
+
Train loss: 78870784.00 correlation: 0.2264
|
209 |
+
Validation loss: 172775088.00 correlation: 0.2096
|
210 |
+
Elapse: 562.82s
|
211 |
+
|
212 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
213 |
+
|
214 |
+
Epoch 031/400
|
215 |
+
Train loss: 78490200.00 correlation: 0.2296
|
216 |
+
Validation loss: 172664992.00 correlation: 0.2107
|
217 |
+
Elapse: 563.05s
|
218 |
+
|
219 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
220 |
+
|
221 |
+
Epoch 032/400
|
222 |
+
Train loss: 78317200.00 correlation: 0.2318
|
223 |
+
Validation loss: 172019824.00 correlation: 0.2132
|
224 |
+
Elapse: 562.89s
|
225 |
+
|
226 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
227 |
+
|
228 |
+
Epoch 033/400
|
229 |
+
Train loss: 78137128.00 correlation: 0.2333
|
230 |
+
Validation loss: 171897024.00 correlation: 0.2150
|
231 |
+
Elapse: 562.71s
|
232 |
+
|
233 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
234 |
+
|
235 |
+
Epoch 034/400
|
236 |
+
Train loss: 77950032.00 correlation: 0.2354
|
237 |
+
Validation loss: 171802656.00 correlation: 0.2157
|
238 |
+
Elapse: 562.68s
|
239 |
+
|
240 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
241 |
+
|
242 |
+
Epoch 035/400
|
243 |
+
Train loss: 77766832.00 correlation: 0.2367
|
244 |
+
Validation loss: 171322160.00 correlation: 0.2180
|
245 |
+
Elapse: 561.92s
|
246 |
+
|
247 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
248 |
+
|
249 |
+
Epoch 036/400
|
250 |
+
Train loss: 77637216.00 correlation: 0.2384
|
251 |
+
Validation loss: 171034880.00 correlation: 0.2209
|
252 |
+
Elapse: 562.15s
|
253 |
+
|
254 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
255 |
+
|
256 |
+
Epoch 037/400
|
257 |
+
Train loss: 77482304.00 correlation: 0.2397
|
258 |
+
Validation loss: 171174608.00 correlation: 0.2203
|
259 |
+
Elapse: 564.93s
|
260 |
+
|
261 |
+
Epoch 038/400
|
262 |
+
Train loss: 77429408.00 correlation: 0.2402
|
263 |
+
Validation loss: 170815888.00 correlation: 0.2218
|
264 |
+
Elapse: 564.45s
|
265 |
+
|
266 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
267 |
+
|
268 |
+
Epoch 039/400
|
269 |
+
Train loss: 77292792.00 correlation: 0.2412
|
270 |
+
Validation loss: 170692576.00 correlation: 0.2224
|
271 |
+
Elapse: 563.94s
|
272 |
+
|
273 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
274 |
+
|
275 |
+
Epoch 040/400
|
276 |
+
Train loss: 77122352.00 correlation: 0.2426
|
277 |
+
Validation loss: 170492064.00 correlation: 0.2256
|
278 |
+
Elapse: 565.03s
|
279 |
+
|
280 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
281 |
+
|
282 |
+
Epoch 041/400
|
283 |
+
Train loss: 77124456.00 correlation: 0.2430
|
284 |
+
Validation loss: 170532256.00 correlation: 0.2245
|
285 |
+
Elapse: 564.39s
|
286 |
+
|
287 |
+
Epoch 042/400
|
288 |
+
Train loss: 76964592.00 correlation: 0.2445
|
289 |
+
Validation loss: 170406688.00 correlation: 0.2257
|
290 |
+
Elapse: 565.12s
|
291 |
+
|
292 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
293 |
+
|
294 |
+
Epoch 043/400
|
295 |
+
Train loss: 76869008.00 correlation: 0.2454
|
296 |
+
Validation loss: 170592080.00 correlation: 0.2248
|
297 |
+
Elapse: 563.98s
|
298 |
+
|
299 |
+
Epoch 044/400
|
300 |
+
Train loss: 76798544.00 correlation: 0.2461
|
301 |
+
Validation loss: 170285664.00 correlation: 0.2253
|
302 |
+
Elapse: 564.88s
|
303 |
+
|
304 |
+
Epoch 045/400
|
305 |
+
Train loss: 76706736.00 correlation: 0.2469
|
306 |
+
Validation loss: 170137504.00 correlation: 0.2276
|
307 |
+
Elapse: 564.78s
|
308 |
+
|
309 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
310 |
+
|
311 |
+
Epoch 046/400
|
312 |
+
Train loss: 76661312.00 correlation: 0.2474
|
313 |
+
Validation loss: 170203360.00 correlation: 0.2258
|
314 |
+
Elapse: 563.90s
|
315 |
+
|
316 |
+
Epoch 047/400
|
317 |
+
Train loss: 76653904.00 correlation: 0.2479
|
318 |
+
Validation loss: 169920448.00 correlation: 0.2283
|
319 |
+
Elapse: 565.79s
|
320 |
+
|
321 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
322 |
+
|
323 |
+
Epoch 048/400
|
324 |
+
Train loss: 76510704.00 correlation: 0.2491
|
325 |
+
Validation loss: 169954384.00 correlation: 0.2279
|
326 |
+
Elapse: 566.41s
|
327 |
+
|
328 |
+
Epoch 049/400
|
329 |
+
Train loss: 76493416.00 correlation: 0.2492
|
330 |
+
Validation loss: 169840224.00 correlation: 0.2290
|
331 |
+
Elapse: 566.13s
|
332 |
+
|
333 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
334 |
+
|
335 |
+
Epoch 050/400
|
336 |
+
Train loss: 76429016.00 correlation: 0.2495
|
337 |
+
Validation loss: 170036560.00 correlation: 0.2272
|
338 |
+
Elapse: 567.15s
|
339 |
+
|
340 |
+
Epoch 051/400
|
341 |
+
Train loss: 76434184.00 correlation: 0.2500
|
342 |
+
Validation loss: 169668848.00 correlation: 0.2298
|
343 |
+
Elapse: 563.78s
|
344 |
+
|
345 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
346 |
+
|
347 |
+
Epoch 052/400
|
348 |
+
Train loss: 76368824.00 correlation: 0.2505
|
349 |
+
Validation loss: 169862640.00 correlation: 0.2292
|
350 |
+
Elapse: 563.52s
|
351 |
+
|
352 |
+
Epoch 053/400
|
353 |
+
Train loss: 76235120.00 correlation: 0.2516
|
354 |
+
Validation loss: 169524560.00 correlation: 0.2315
|
355 |
+
Elapse: 565.24s
|
356 |
+
|
357 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
358 |
+
|
359 |
+
Epoch 054/400
|
360 |
+
Train loss: 76236176.00 correlation: 0.2518
|
361 |
+
Validation loss: 169235696.00 correlation: 0.2324
|
362 |
+
Elapse: 564.43s
|
363 |
+
|
364 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
365 |
+
|
366 |
+
Epoch 055/400
|
367 |
+
Train loss: 76272208.00 correlation: 0.2514
|
368 |
+
Validation loss: 169566032.00 correlation: 0.2303
|
369 |
+
Elapse: 564.62s
|
370 |
+
|
371 |
+
Epoch 056/400
|
372 |
+
Train loss: 76095872.00 correlation: 0.2528
|
373 |
+
Validation loss: 169257008.00 correlation: 0.2329
|
374 |
+
Elapse: 564.52s
|
375 |
+
|
376 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
377 |
+
|
378 |
+
Epoch 057/400
|
379 |
+
Train loss: 76150160.00 correlation: 0.2523
|
380 |
+
Validation loss: 169306656.00 correlation: 0.2323
|
381 |
+
Elapse: 564.42s
|
382 |
+
|
383 |
+
Epoch 058/400
|
384 |
+
Train loss: 75971168.00 correlation: 0.2540
|
385 |
+
Validation loss: 169281824.00 correlation: 0.2326
|
386 |
+
Elapse: 565.79s
|
387 |
+
|
388 |
+
Epoch 059/400
|
389 |
+
Train loss: 76016632.00 correlation: 0.2537
|
390 |
+
Validation loss: 169175984.00 correlation: 0.2330
|
391 |
+
Elapse: 567.53s
|
392 |
+
|
393 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
394 |
+
|
395 |
+
Epoch 060/400
|
396 |
+
Train loss: 75961288.00 correlation: 0.2543
|
397 |
+
Validation loss: 169244832.00 correlation: 0.2312
|
398 |
+
Elapse: 564.74s
|
399 |
+
|
400 |
+
Epoch 061/400
|
401 |
+
Train loss: 75918368.00 correlation: 0.2545
|
402 |
+
Validation loss: 169277088.00 correlation: 0.2310
|
403 |
+
Elapse: 564.73s
|
404 |
+
|
405 |
+
Epoch 062/400
|
406 |
+
Train loss: 75869072.00 correlation: 0.2550
|
407 |
+
Validation loss: 169328944.00 correlation: 0.2320
|
408 |
+
Elapse: 564.39s
|
409 |
+
|
410 |
+
Epoch 063/400
|
411 |
+
Train loss: 75762192.00 correlation: 0.2561
|
412 |
+
Validation loss: 169258112.00 correlation: 0.2316
|
413 |
+
Elapse: 564.19s
|
414 |
+
|
415 |
+
Epoch 064/400
|
416 |
+
Train loss: 75825328.00 correlation: 0.2556
|
417 |
+
Validation loss: 169071840.00 correlation: 0.2332
|
418 |
+
Elapse: 564.93s
|
419 |
+
|
420 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
421 |
+
|
422 |
+
Epoch 065/400
|
423 |
+
Train loss: 75713256.00 correlation: 0.2566
|
424 |
+
Validation loss: 169214000.00 correlation: 0.2329
|
425 |
+
Elapse: 564.84s
|
426 |
+
|
427 |
+
Epoch 066/400
|
428 |
+
Train loss: 75745160.00 correlation: 0.2561
|
429 |
+
Validation loss: 169041248.00 correlation: 0.2327
|
430 |
+
Elapse: 564.78s
|
431 |
+
|
432 |
+
Epoch 067/400
|
433 |
+
Train loss: 75648152.00 correlation: 0.2572
|
434 |
+
Validation loss: 169051616.00 correlation: 0.2327
|
435 |
+
Elapse: 565.20s
|
436 |
+
|
437 |
+
Epoch 068/400
|
438 |
+
Train loss: 75614368.00 correlation: 0.2577
|
439 |
+
Validation loss: 169221120.00 correlation: 0.2327
|
440 |
+
Elapse: 564.71s
|
441 |
+
|
442 |
+
Epoch 069/400
|
443 |
+
Train loss: 75625776.00 correlation: 0.2574
|
444 |
+
Validation loss: 169122256.00 correlation: 0.2330
|
445 |
+
Elapse: 564.46s
|
446 |
+
|
447 |
+
Loaded checkpoint from epoch 64 (correlation: 0.2332).
|
448 |
+
|
449 |
+
Reduce learning rate of core to 1.4400e-03 (num. reduce: 1).
|
450 |
+
Reduce learning rate of readouts to 1.0800e-03 (num. reduce: 1).
|
451 |
+
Reduce learning rate of shifters to 1.0800e-03 (num. reduce: 1).
|
452 |
+
|
453 |
+
Epoch 070/400
|
454 |
+
Train loss: 73759920.00 correlation: 0.2731
|
455 |
+
Validation loss: 167411552.00 correlation: 0.2444
|
456 |
+
Elapse: 565.27s
|
457 |
+
|
458 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
459 |
+
|
460 |
+
Epoch 071/400
|
461 |
+
Train loss: 73162624.00 correlation: 0.2785
|
462 |
+
Validation loss: 167276400.00 correlation: 0.2454
|
463 |
+
Elapse: 565.31s
|
464 |
+
|
465 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
466 |
+
|
467 |
+
Epoch 072/400
|
468 |
+
Train loss: 73062080.00 correlation: 0.2797
|
469 |
+
Validation loss: 167303840.00 correlation: 0.2453
|
470 |
+
Elapse: 565.70s
|
471 |
+
|
472 |
+
Epoch 073/400
|
473 |
+
Train loss: 72859248.00 correlation: 0.2818
|
474 |
+
Validation loss: 167279840.00 correlation: 0.2448
|
475 |
+
Elapse: 566.21s
|
476 |
+
|
477 |
+
Epoch 074/400
|
478 |
+
Train loss: 72867944.00 correlation: 0.2819
|
479 |
+
Validation loss: 167328304.00 correlation: 0.2445
|
480 |
+
Elapse: 566.10s
|
481 |
+
|
482 |
+
Epoch 075/400
|
483 |
+
Train loss: 72806064.00 correlation: 0.2823
|
484 |
+
Validation loss: 167367392.00 correlation: 0.2443
|
485 |
+
Elapse: 566.39s
|
486 |
+
|
487 |
+
Epoch 076/400
|
488 |
+
Train loss: 72707504.00 correlation: 0.2836
|
489 |
+
Validation loss: 167176992.00 correlation: 0.2450
|
490 |
+
Elapse: 566.85s
|
491 |
+
|
492 |
+
Loaded checkpoint from epoch 71 (correlation: 0.2454).
|
493 |
+
|
494 |
+
Reduce learning rate of core to 4.3200e-04 (num. reduce: 1).
|
495 |
+
Reduce learning rate of readouts to 3.2400e-04 (num. reduce: 1).
|
496 |
+
Reduce learning rate of shifters to 3.2400e-04 (num. reduce: 1).
|
497 |
+
|
498 |
+
Epoch 077/400
|
499 |
+
Train loss: 72382144.00 correlation: 0.2856
|
500 |
+
Validation loss: 166842576.00 correlation: 0.2479
|
501 |
+
Elapse: 566.50s
|
502 |
+
|
503 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
504 |
+
|
505 |
+
Epoch 078/400
|
506 |
+
Train loss: 72078376.00 correlation: 0.2881
|
507 |
+
Validation loss: 166822496.00 correlation: 0.2483
|
508 |
+
Elapse: 567.42s
|
509 |
+
|
510 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
511 |
+
|
512 |
+
Epoch 079/400
|
513 |
+
Train loss: 71958248.00 correlation: 0.2896
|
514 |
+
Validation loss: 166738624.00 correlation: 0.2488
|
515 |
+
Elapse: 567.48s
|
516 |
+
|
517 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
518 |
+
|
519 |
+
Epoch 080/400
|
520 |
+
Train loss: 71895880.00 correlation: 0.2900
|
521 |
+
Validation loss: 166642640.00 correlation: 0.2490
|
522 |
+
Elapse: 567.47s
|
523 |
+
|
524 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
525 |
+
|
526 |
+
Epoch 081/400
|
527 |
+
Train loss: 71789800.00 correlation: 0.2911
|
528 |
+
Validation loss: 166705248.00 correlation: 0.2491
|
529 |
+
Elapse: 566.97s
|
530 |
+
|
531 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
532 |
+
|
533 |
+
Epoch 082/400
|
534 |
+
Train loss: 71770424.00 correlation: 0.2915
|
535 |
+
Validation loss: 166628368.00 correlation: 0.2487
|
536 |
+
Elapse: 567.08s
|
537 |
+
|
538 |
+
Epoch 083/400
|
539 |
+
Train loss: 71742960.00 correlation: 0.2915
|
540 |
+
Validation loss: 166623744.00 correlation: 0.2491
|
541 |
+
Elapse: 567.32s
|
542 |
+
|
543 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
544 |
+
|
545 |
+
Epoch 084/400
|
546 |
+
Train loss: 71726080.00 correlation: 0.2915
|
547 |
+
Validation loss: 166593008.00 correlation: 0.2489
|
548 |
+
Elapse: 566.52s
|
549 |
+
|
550 |
+
Epoch 085/400
|
551 |
+
Train loss: 71608472.00 correlation: 0.2930
|
552 |
+
Validation loss: 166582448.00 correlation: 0.2494
|
553 |
+
Elapse: 566.39s
|
554 |
+
|
555 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
556 |
+
|
557 |
+
Epoch 086/400
|
558 |
+
Train loss: 71622656.00 correlation: 0.2929
|
559 |
+
Validation loss: 166651488.00 correlation: 0.2488
|
560 |
+
Elapse: 567.27s
|
561 |
+
|
562 |
+
Epoch 087/400
|
563 |
+
Train loss: 71550640.00 correlation: 0.2936
|
564 |
+
Validation loss: 166630768.00 correlation: 0.2490
|
565 |
+
Elapse: 566.70s
|
566 |
+
|
567 |
+
Epoch 088/400
|
568 |
+
Train loss: 71491864.00 correlation: 0.2941
|
569 |
+
Validation loss: 166610080.00 correlation: 0.2493
|
570 |
+
Elapse: 567.65s
|
571 |
+
|
572 |
+
Epoch 089/400
|
573 |
+
Train loss: 71458584.00 correlation: 0.2944
|
574 |
+
Validation loss: 166546464.00 correlation: 0.2492
|
575 |
+
Elapse: 566.68s
|
576 |
+
|
577 |
+
Epoch 090/400
|
578 |
+
Train loss: 71462792.00 correlation: 0.2945
|
579 |
+
Validation loss: 166668320.00 correlation: 0.2492
|
580 |
+
Elapse: 566.84s
|
581 |
+
|
582 |
+
Loaded checkpoint from epoch 85 (correlation: 0.2494).
|
583 |
+
|
584 |
+
Reduce learning rate of core to 1.2960e-04 (num. reduce: 1).
|
585 |
+
Reduce learning rate of readouts to 9.7200e-05 (num. reduce: 1).
|
586 |
+
Reduce learning rate of shifters to 9.7200e-05 (num. reduce: 1).
|
587 |
+
|
588 |
+
Epoch 091/400
|
589 |
+
Train loss: 71288968.00 correlation: 0.2953
|
590 |
+
Validation loss: 166494880.00 correlation: 0.2500
|
591 |
+
Elapse: 567.12s
|
592 |
+
|
593 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
594 |
+
|
595 |
+
Epoch 092/400
|
596 |
+
Train loss: 71275904.00 correlation: 0.2958
|
597 |
+
Validation loss: 166504256.00 correlation: 0.2498
|
598 |
+
Elapse: 566.80s
|
599 |
+
|
600 |
+
Epoch 093/400
|
601 |
+
Train loss: 71229392.00 correlation: 0.2962
|
602 |
+
Validation loss: 166490080.00 correlation: 0.2502
|
603 |
+
Elapse: 567.91s
|
604 |
+
|
605 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
606 |
+
|
607 |
+
Epoch 094/400
|
608 |
+
Train loss: 71289360.00 correlation: 0.2955
|
609 |
+
Validation loss: 166481824.00 correlation: 0.2501
|
610 |
+
Elapse: 567.35s
|
611 |
+
|
612 |
+
Epoch 095/400
|
613 |
+
Train loss: 71209928.00 correlation: 0.2962
|
614 |
+
Validation loss: 166463984.00 correlation: 0.2501
|
615 |
+
Elapse: 567.29s
|
616 |
+
|
617 |
+
Epoch 096/400
|
618 |
+
Train loss: 71155936.00 correlation: 0.2969
|
619 |
+
Validation loss: 166447504.00 correlation: 0.2502
|
620 |
+
Elapse: 567.66s
|
621 |
+
|
622 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
623 |
+
|
624 |
+
Epoch 097/400
|
625 |
+
Train loss: 71163080.00 correlation: 0.2967
|
626 |
+
Validation loss: 166476448.00 correlation: 0.2501
|
627 |
+
Elapse: 567.23s
|
628 |
+
|
629 |
+
Epoch 098/400
|
630 |
+
Train loss: 71090216.00 correlation: 0.2976
|
631 |
+
Validation loss: 166447952.00 correlation: 0.2502
|
632 |
+
Elapse: 567.15s
|
633 |
+
|
634 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
635 |
+
|
636 |
+
Epoch 099/400
|
637 |
+
Train loss: 71146160.00 correlation: 0.2971
|
638 |
+
Validation loss: 166436720.00 correlation: 0.2504
|
639 |
+
Elapse: 566.92s
|
640 |
+
|
641 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
642 |
+
|
643 |
+
Epoch 100/400
|
644 |
+
Train loss: 71064016.00 correlation: 0.2977
|
645 |
+
Validation loss: 166422944.00 correlation: 0.2502
|
646 |
+
Elapse: 567.03s
|
647 |
+
|
648 |
+
Epoch 101/400
|
649 |
+
Train loss: 71056432.00 correlation: 0.2979
|
650 |
+
Validation loss: 166403840.00 correlation: 0.2505
|
651 |
+
Elapse: 567.52s
|
652 |
+
|
653 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
654 |
+
|
655 |
+
Epoch 102/400
|
656 |
+
Train loss: 71051576.00 correlation: 0.2978
|
657 |
+
Validation loss: 166443872.00 correlation: 0.2504
|
658 |
+
Elapse: 567.13s
|
659 |
+
|
660 |
+
Epoch 103/400
|
661 |
+
Train loss: 71046608.00 correlation: 0.2979
|
662 |
+
Validation loss: 166479680.00 correlation: 0.2502
|
663 |
+
Elapse: 566.67s
|
664 |
+
|
665 |
+
Epoch 104/400
|
666 |
+
Train loss: 71038120.00 correlation: 0.2981
|
667 |
+
Validation loss: 166454112.00 correlation: 0.2501
|
668 |
+
Elapse: 564.93s
|
669 |
+
|
670 |
+
Epoch 105/400
|
671 |
+
Train loss: 70978192.00 correlation: 0.2988
|
672 |
+
Validation loss: 166414432.00 correlation: 0.2503
|
673 |
+
Elapse: 564.91s
|
674 |
+
|
675 |
+
Epoch 106/400
|
676 |
+
Train loss: 70976960.00 correlation: 0.2990
|
677 |
+
Validation loss: 166474720.00 correlation: 0.2500
|
678 |
+
Elapse: 566.07s
|
679 |
+
|
680 |
+
Loaded checkpoint from epoch 101 (correlation: 0.2505).
|
681 |
+
|
682 |
+
Reduce learning rate of core to 3.8880e-05 (num. reduce: 1).
|
683 |
+
Reduce learning rate of readouts to 2.9160e-05 (num. reduce: 1).
|
684 |
+
Reduce learning rate of shifters to 2.9160e-05 (num. reduce: 1).
|
685 |
+
|
686 |
+
Epoch 107/400
|
687 |
+
Train loss: 70972624.00 correlation: 0.2986
|
688 |
+
Validation loss: 166398144.00 correlation: 0.2506
|
689 |
+
Elapse: 566.75s
|
690 |
+
|
691 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
692 |
+
|
693 |
+
Epoch 108/400
|
694 |
+
Train loss: 70964176.00 correlation: 0.2987
|
695 |
+
Validation loss: 166382512.00 correlation: 0.2506
|
696 |
+
Elapse: 566.44s
|
697 |
+
|
698 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
699 |
+
|
700 |
+
Epoch 109/400
|
701 |
+
Train loss: 70976968.00 correlation: 0.2987
|
702 |
+
Validation loss: 166404432.00 correlation: 0.2505
|
703 |
+
Elapse: 567.32s
|
704 |
+
|
705 |
+
Epoch 110/400
|
706 |
+
Train loss: 70951736.00 correlation: 0.2985
|
707 |
+
Validation loss: 166396896.00 correlation: 0.2506
|
708 |
+
Elapse: 567.77s
|
709 |
+
|
710 |
+
Epoch 111/400
|
711 |
+
Train loss: 70895944.00 correlation: 0.2997
|
712 |
+
Validation loss: 166385856.00 correlation: 0.2506
|
713 |
+
Elapse: 566.89s
|
714 |
+
|
715 |
+
Epoch 112/400
|
716 |
+
Train loss: 70880200.00 correlation: 0.2995
|
717 |
+
Validation loss: 166380672.00 correlation: 0.2507
|
718 |
+
Elapse: 566.94s
|
719 |
+
|
720 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
|
721 |
+
|
722 |
+
Epoch 113/400
|
723 |
+
Train loss: 70861304.00 correlation: 0.2998
|
724 |
+
Validation loss: 166391184.00 correlation: 0.2506
|
725 |
+
Elapse: 566.54s
|
726 |
+
|
727 |
+
Epoch 114/400
|
728 |
+
Train loss: 70921912.00 correlation: 0.2989
|
729 |
+
Validation loss: 166417776.00 correlation: 0.2504
|
730 |
+
Elapse: 567.26s
|
731 |
+
|
732 |
+
Epoch 115/400
|
733 |
+
Train loss: 70914312.00 correlation: 0.2989
|
734 |
+
Validation loss: 166403376.00 correlation: 0.2506
|
735 |
+
Elapse: 566.92s
|
736 |
+
|
737 |
+
Epoch 116/400
|
738 |
+
Train loss: 70903784.00 correlation: 0.2992
|
739 |
+
Validation loss: 166403360.00 correlation: 0.2506
|
740 |
+
Elapse: 567.11s
|
741 |
+
|
742 |
+
Epoch 117/400
|
743 |
+
Train loss: 70866896.00 correlation: 0.2994
|
744 |
+
Validation loss: 166382688.00 correlation: 0.2505
|
745 |
+
Elapse: 566.94s
|
746 |
+
|
747 |
+
Loaded checkpoint from epoch 112 (correlation: 0.2507).
|
748 |
+
|
749 |
+
Reduce learning rate of core to 1.1664e-05 (num. reduce: 1).
|
750 |
+
Reduce learning rate of readouts to 8.7480e-06 (num. reduce: 1).
|
751 |
+
Reduce learning rate of shifters to 8.7480e-06 (num. reduce: 1).
|
752 |
+
|
753 |
+
Epoch 118/400
|
754 |
+
Train loss: 70926000.00 correlation: 0.2989
|
755 |
+
Validation loss: 166380768.00 correlation: 0.2506
|
756 |
+
Elapse: 567.50s
|
757 |
+
|
758 |
+
Epoch 119/400
|
759 |
+
Train loss: 70900808.00 correlation: 0.2993
|
760 |
+
Validation loss: 166386016.00 correlation: 0.2506
|
761 |
+
Elapse: 567.35s
|
762 |
+
|
763 |
+
Epoch 120/400
|
764 |
+
Train loss: 70881328.00 correlation: 0.2993
|
765 |
+
Validation loss: 166387568.00 correlation: 0.2506
|
766 |
+
Elapse: 567.65s
|
767 |
+
|
768 |
+
Epoch 121/400
|
769 |
+
Train loss: 70937256.00 correlation: 0.2984
|
770 |
+
Validation loss: 166393568.00 correlation: 0.2506
|
771 |
+
Elapse: 566.97s
|
772 |
+
|
773 |
+
Epoch 122/400
|
774 |
+
Train loss: 70855888.00 correlation: 0.2996
|
775 |
+
Validation loss: 166378592.00 correlation: 0.2507
|
776 |
+
Elapse: 567.50s
|
777 |
+
|
778 |
+
Loaded checkpoint from epoch 112 (correlation: 0.2507).
|
779 |
+
|
780 |
+
Reduce learning rate of core to 3.4992e-06 (num. reduce: 2).
|
781 |
+
Reduce learning rate of readouts to 2.6244e-06 (num. reduce: 2).
|
782 |
+
Reduce learning rate of shifters to 2.6244e-06 (num. reduce: 2).
|
783 |
+
|
784 |
+
Epoch 123/400
|
785 |
+
Train loss: 70938496.00 correlation: 0.2988
|
786 |
+
Validation loss: 166375792.00 correlation: 0.2507
|
787 |
+
Elapse: 567.50s
|
788 |
+
|
789 |
+
Epoch 124/400
|
790 |
+
Train loss: 70966320.00 correlation: 0.2986
|
791 |
+
Validation loss: 166383664.00 correlation: 0.2506
|
792 |
+
Elapse: 567.77s
|
793 |
+
|
794 |
+
Epoch 125/400
|
795 |
+
Train loss: 70872080.00 correlation: 0.2990
|
796 |
+
Validation loss: 166383328.00 correlation: 0.2506
|
797 |
+
Elapse: 567.87s
|
798 |
+
|
799 |
+
Epoch 126/400
|
800 |
+
Train loss: 70866264.00 correlation: 0.2997
|
801 |
+
Validation loss: 166383136.00 correlation: 0.2506
|
802 |
+
Elapse: 567.21s
|
803 |
+
|
804 |
+
Epoch 127/400
|
805 |
+
Train loss: 70836352.00 correlation: 0.2996
|
806 |
+
Validation loss: 166386816.00 correlation: 0.2506
|
807 |
+
Elapse: 566.90s
|
808 |
+
|
809 |
+
Model has not improved after 2 LR reductions.
|
810 |
+
|
811 |
+
Loaded checkpoint from epoch 112 (correlation: 0.2507).
|
812 |
+
|
813 |
+
|
814 |
+
ValidationA: 0.2487 B: 0.2789 C: 0.2720 D: 0.2341 E: 0.2367 F: 0.2340 G: 0.2555 H: 0.2351 I: 0.2533 J: 0.2589 average: 0.2507
|
815 |
+
|
816 |
+
Results saved to /home/storage/runs/vivit_ensemble/002.
|
002/args.yaml
ADDED
@@ -0,0 +1,87 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
adam_beta1: 0.9
|
2 |
+
adam_beta2: 0.999
|
3 |
+
adam_eps: 1e-08
|
4 |
+
batch_size: 6
|
5 |
+
cache_data: false
|
6 |
+
center_crop: 1.0
|
7 |
+
clear_output_dir: true
|
8 |
+
core: vivit
|
9 |
+
core_behavior_mode: 2
|
10 |
+
core_compile: false
|
11 |
+
core_drop_path: 0.0505
|
12 |
+
core_emb_dim: 112
|
13 |
+
core_ff_activation: gelu
|
14 |
+
core_ff_dropout: 0.0592
|
15 |
+
core_flash_attention: 1
|
16 |
+
core_head_dim: 48
|
17 |
+
core_lr: 0.0048
|
18 |
+
core_mha_dropout: 0.358
|
19 |
+
core_mlp_dim: 136
|
20 |
+
core_norm_qk: false
|
21 |
+
core_num_heads: 11
|
22 |
+
core_p_dropout: 0.1338
|
23 |
+
core_parallel_attention: true
|
24 |
+
core_patch_mode: 0
|
25 |
+
core_pos_encoding: 3
|
26 |
+
core_spatial_depth: 3
|
27 |
+
core_spatial_patch_size: 7
|
28 |
+
core_spatial_patch_stride: 2
|
29 |
+
core_temporal_depth: 5
|
30 |
+
core_temporal_patch_size: 25
|
31 |
+
core_temporal_patch_stride: 1
|
32 |
+
core_weight_decay: 0.1789
|
33 |
+
criterion: poisson_correlation
|
34 |
+
critic_mode: 0
|
35 |
+
crop_frame: 140
|
36 |
+
data: /home/sensorium2023
|
37 |
+
deterministic: false
|
38 |
+
device: cuda
|
39 |
+
dpi: 120
|
40 |
+
ds_mode: 3
|
41 |
+
ds_scale: 1
|
42 |
+
epochs: 400
|
43 |
+
format: svg
|
44 |
+
git_hash: 1033c29
|
45 |
+
grad_checkpointing: 0
|
46 |
+
grad_norm: null
|
47 |
+
input_shapes:
|
48 |
+
behavior: [2, 140]
|
49 |
+
pupil_center: [2, 140]
|
50 |
+
video: [1, 140, 36, 64]
|
51 |
+
limit_data: null
|
52 |
+
lr: 0.0036
|
53 |
+
max_frame: 300
|
54 |
+
micro_batch_size: 6
|
55 |
+
modulator_mode: 0
|
56 |
+
mouse_ids: [A, B, C, D, E, F, G, H, I, J]
|
57 |
+
num_workers: 2
|
58 |
+
output_dir: /home/storage/runs/002
|
59 |
+
output_mode: 1
|
60 |
+
output_shapes:
|
61 |
+
A: [7440, 140]
|
62 |
+
B: [7928, 140]
|
63 |
+
C: [8285, 140]
|
64 |
+
D: [7671, 140]
|
65 |
+
E: [7495, 140]
|
66 |
+
F: [7863, 140]
|
67 |
+
G: [7908, 140]
|
68 |
+
H: [8202, 140]
|
69 |
+
I: [7939, 140]
|
70 |
+
J: [8122, 140]
|
71 |
+
precision: "32"
|
72 |
+
pretrain_core: null
|
73 |
+
readout: gaussian2d
|
74 |
+
readout_bias_mode: 2
|
75 |
+
readout_dropout: 0.0
|
76 |
+
readout_grid_mode: 1
|
77 |
+
restore: null
|
78 |
+
save_plots: false
|
79 |
+
seed: 9
|
80 |
+
shifter_layers: 3
|
81 |
+
shifter_mode: 1
|
82 |
+
shifter_size: 5
|
83 |
+
stat_mode: 1
|
84 |
+
trainable_params: 12278365
|
85 |
+
transform_mode: 2
|
86 |
+
verbose: 1
|
87 |
+
weight_decay: 0.3939
|
002/ckpt/model_state.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:beef5725438551d35727d0a1a42f996cce8ce0c760b74e7f7228171b34283e11
|
3 |
+
size 148268583
|
002/evaluation.yaml
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
validation: {A: 0.25081300735473633, B: 0.2804259657859802, C: 0.27504464983940125,
|
2 |
+
D: 0.23932193219661713, E: 0.23903165757656097, F: 0.23461945354938507, G: 0.25730910897254944,
|
3 |
+
H: 0.2378837764263153, I: 0.2555205523967743, J: 0.25993871688842773, average: 0.25299088209867476}
|
002/model.txt
ADDED
@@ -0,0 +1,143 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
=======================================================================================================================================
|
2 |
+
Layer (type:depth-idx) Input Shape Output Shape Param #
|
3 |
+
=======================================================================================================================================
|
4 |
+
Model -- [1, 7440, 116] --
|
5 |
+
├─ViViTCore: 1-1 -- [1, 112, 116, 15, 29] --
|
6 |
+
│ └─ViViT: 2-1 [1, 5, 140, 36, 64] [1, 112, 116, 15, 29] --
|
7 |
+
│ │ └─Tokenizer: 3-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] 79,632
|
8 |
+
│ │ │ └─Sequential: 4-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] --
|
9 |
+
│ │ │ │ └─Unfold3d: 5-1 [1, 5, 140, 36, 64] [1, 116, 435, 6125] --
|
10 |
+
│ │ │ │ └─LayerNorm: 5-2 [1, 116, 435, 6125] [1, 116, 435, 6125] 12,250
|
11 |
+
│ │ │ │ └─Linear: 5-3 [1, 116, 435, 6125] [1, 116, 435, 112] 686,112
|
12 |
+
│ │ │ │ └─LayerNorm: 5-4 [1, 116, 435, 112] [1, 116, 435, 112] 224
|
13 |
+
│ │ │ │ └─Dropout: 5-5 [1, 116, 435, 112] [1, 116, 435, 112] --
|
14 |
+
│ │ └─Transformer: 3-2 [116, 435, 112] [116, 435, 112] --
|
15 |
+
│ │ │ └─ModuleList: 4-2 -- -- --
|
16 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-6 [116, 435, 112] [116, 435, 112] --
|
17 |
+
│ │ │ │ │ └─LayerNorm: 6-1 [116, 435, 112] [116, 435, 112] 224
|
18 |
+
│ │ │ │ │ └─Linear: 6-2 [116, 435, 112] [116, 435, 1720] 192,640
|
19 |
+
│ │ │ │ │ └─Linear: 6-3 [116, 435, 528] [116, 435, 112] 59,136
|
20 |
+
│ │ │ │ │ └─DropPath: 6-4 [116, 435, 112] [116, 435, 112] --
|
21 |
+
│ │ │ │ │ └─Sequential: 6-5 [116, 435, 136] [116, 435, 112] --
|
22 |
+
│ │ │ │ │ │ └─GELU: 7-1 [116, 435, 136] [116, 435, 136] --
|
23 |
+
│ │ │ │ │ │ └─Dropout: 7-2 [116, 435, 136] [116, 435, 136] --
|
24 |
+
│ │ │ │ │ │ └─Linear: 7-3 [116, 435, 136] [116, 435, 112] 15,232
|
25 |
+
│ │ │ │ │ └─DropPath: 6-6 [116, 435, 112] [116, 435, 112] --
|
26 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-7 [116, 435, 112] [116, 435, 112] --
|
27 |
+
│ │ │ │ │ └─LayerNorm: 6-7 [116, 435, 112] [116, 435, 112] 224
|
28 |
+
│ │ │ │ │ └─Linear: 6-8 [116, 435, 112] [116, 435, 1720] 192,640
|
29 |
+
│ │ │ │ │ └─Linear: 6-9 [116, 435, 528] [116, 435, 112] 59,136
|
30 |
+
│ │ │ │ │ └─DropPath: 6-10 [116, 435, 112] [116, 435, 112] --
|
31 |
+
│ │ │ │ │ └─Sequential: 6-11 [116, 435, 136] [116, 435, 112] --
|
32 |
+
│ │ │ │ │ │ └─GELU: 7-4 [116, 435, 136] [116, 435, 136] --
|
33 |
+
│ │ │ │ │ │ └─Dropout: 7-5 [116, 435, 136] [116, 435, 136] --
|
34 |
+
│ │ │ │ │ │ └─Linear: 7-6 [116, 435, 136] [116, 435, 112] 15,232
|
35 |
+
│ │ │ │ │ └─DropPath: 6-12 [116, 435, 112] [116, 435, 112] --
|
36 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-8 [116, 435, 112] [116, 435, 112] --
|
37 |
+
│ │ │ │ │ └─LayerNorm: 6-13 [116, 435, 112] [116, 435, 112] 224
|
38 |
+
│ │ │ │ │ └─Linear: 6-14 [116, 435, 112] [116, 435, 1720] 192,640
|
39 |
+
│ │ │ │ │ └─Linear: 6-15 [116, 435, 528] [116, 435, 112] 59,136
|
40 |
+
│ │ │ │ │ └─DropPath: 6-16 [116, 435, 112] [116, 435, 112] --
|
41 |
+
│ │ │ │ │ └─Sequential: 6-17 [116, 435, 136] [116, 435, 112] --
|
42 |
+
│ │ │ │ │ │ └─GELU: 7-7 [116, 435, 136] [116, 435, 136] --
|
43 |
+
│ │ │ │ │ │ └─Dropout: 7-8 [116, 435, 136] [116, 435, 136] --
|
44 |
+
│ │ │ │ │ │ └─Linear: 7-9 [116, 435, 136] [116, 435, 112] 15,232
|
45 |
+
│ │ │ │ │ └─DropPath: 6-18 [116, 435, 112] [116, 435, 112] --
|
46 |
+
│ │ └─Transformer: 3-3 [435, 116, 112] [435, 116, 112] --
|
47 |
+
│ │ │ └─ModuleList: 4-3 -- -- --
|
48 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-9 [435, 116, 112] [435, 116, 112] --
|
49 |
+
│ │ │ │ │ └─LayerNorm: 6-19 [435, 116, 112] [435, 116, 112] 224
|
50 |
+
│ │ │ │ │ └─Linear: 6-20 [435, 116, 112] [435, 116, 1720] 192,640
|
51 |
+
│ │ │ │ │ └─Linear: 6-21 [435, 116, 528] [435, 116, 112] 59,136
|
52 |
+
│ │ │ │ │ └─DropPath: 6-22 [435, 116, 112] [435, 116, 112] --
|
53 |
+
│ │ │ │ │ └─Sequential: 6-23 [435, 116, 136] [435, 116, 112] --
|
54 |
+
│ │ │ │ │ │ └─GELU: 7-10 [435, 116, 136] [435, 116, 136] --
|
55 |
+
│ │ │ │ │ │ └─Dropout: 7-11 [435, 116, 136] [435, 116, 136] --
|
56 |
+
│ │ │ │ │ │ └─Linear: 7-12 [435, 116, 136] [435, 116, 112] 15,232
|
57 |
+
│ │ │ │ │ └─DropPath: 6-24 [435, 116, 112] [435, 116, 112] --
|
58 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-10 [435, 116, 112] [435, 116, 112] --
|
59 |
+
│ │ │ │ │ └─LayerNorm: 6-25 [435, 116, 112] [435, 116, 112] 224
|
60 |
+
│ │ │ │ │ └─Linear: 6-26 [435, 116, 112] [435, 116, 1720] 192,640
|
61 |
+
│ │ │ │ │ └─Linear: 6-27 [435, 116, 528] [435, 116, 112] 59,136
|
62 |
+
│ │ │ │ │ └─DropPath: 6-28 [435, 116, 112] [435, 116, 112] --
|
63 |
+
│ │ │ │ │ └─Sequential: 6-29 [435, 116, 136] [435, 116, 112] --
|
64 |
+
│ │ │ │ │ │ └─GELU: 7-13 [435, 116, 136] [435, 116, 136] --
|
65 |
+
│ │ │ │ │ │ └─Dropout: 7-14 [435, 116, 136] [435, 116, 136] --
|
66 |
+
│ │ │ │ │ │ └─Linear: 7-15 [435, 116, 136] [435, 116, 112] 15,232
|
67 |
+
│ │ │ │ │ └─DropPath: 6-30 [435, 116, 112] [435, 116, 112] --
|
68 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-11 [435, 116, 112] [435, 116, 112] --
|
69 |
+
│ │ │ │ │ └─LayerNorm: 6-31 [435, 116, 112] [435, 116, 112] 224
|
70 |
+
│ │ │ │ │ └─Linear: 6-32 [435, 116, 112] [435, 116, 1720] 192,640
|
71 |
+
│ │ │ │ │ └─Linear: 6-33 [435, 116, 528] [435, 116, 112] 59,136
|
72 |
+
│ │ │ │ │ └─DropPath: 6-34 [435, 116, 112] [435, 116, 112] --
|
73 |
+
│ │ │ │ │ └─Sequential: 6-35 [435, 116, 136] [435, 116, 112] --
|
74 |
+
│ │ │ │ │ │ └─GELU: 7-16 [435, 116, 136] [435, 116, 136] --
|
75 |
+
│ │ │ │ │ │ └─Dropout: 7-17 [435, 116, 136] [435, 116, 136] --
|
76 |
+
│ │ │ │ │ │ └─Linear: 7-18 [435, 116, 136] [435, 116, 112] 15,232
|
77 |
+
│ │ │ │ │ └─DropPath: 6-36 [435, 116, 112] [435, 116, 112] --
|
78 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-12 [435, 116, 112] [435, 116, 112] --
|
79 |
+
│ │ │ │ │ └─LayerNorm: 6-37 [435, 116, 112] [435, 116, 112] 224
|
80 |
+
│ │ │ │ │ └─Linear: 6-38 [435, 116, 112] [435, 116, 1720] 192,640
|
81 |
+
│ │ │ │ │ └─Linear: 6-39 [435, 116, 528] [435, 116, 112] 59,136
|
82 |
+
│ │ │ │ │ └─DropPath: 6-40 [435, 116, 112] [435, 116, 112] --
|
83 |
+
│ │ │ │ │ └─Sequential: 6-41 [435, 116, 136] [435, 116, 112] --
|
84 |
+
│ │ │ │ │ │ └─GELU: 7-19 [435, 116, 136] [435, 116, 136] --
|
85 |
+
│ │ │ │ │ │ └─Dropout: 7-20 [435, 116, 136] [435, 116, 136] --
|
86 |
+
│ │ │ │ │ │ └─Linear: 7-21 [435, 116, 136] [435, 116, 112] 15,232
|
87 |
+
│ │ │ │ │ └─DropPath: 6-42 [435, 116, 112] [435, 116, 112] --
|
88 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-13 [435, 116, 112] [435, 116, 112] --
|
89 |
+
│ │ │ │ │ └─LayerNorm: 6-43 [435, 116, 112] [435, 116, 112] 224
|
90 |
+
│ │ │ │ │ └─Linear: 6-44 [435, 116, 112] [435, 116, 1720] 192,640
|
91 |
+
│ │ │ │ │ └─Linear: 6-45 [435, 116, 528] [435, 116, 112] 59,136
|
92 |
+
│ │ │ │ │ └─DropPath: 6-46 [435, 116, 112] [435, 116, 112] --
|
93 |
+
│ │ │ │ │ └─Sequential: 6-47 [435, 116, 136] [435, 116, 112] --
|
94 |
+
│ │ │ │ │ │ └─GELU: 7-22 [435, 116, 136] [435, 116, 136] --
|
95 |
+
│ │ │ │ │ │ └─Dropout: 7-23 [435, 116, 136] [435, 116, 136] --
|
96 |
+
│ │ │ │ │ │ └─Linear: 7-24 [435, 116, 136] [435, 116, 112] 15,232
|
97 |
+
│ │ │ │ │ └─DropPath: 6-48 [435, 116, 112] [435, 116, 112] --
|
98 |
+
│ │ └─Rearrange: 3-4 [1, 116, 435, 112] [1, 112, 116, 15, 29] --
|
99 |
+
├─MLPShifters: 1-2 -- [1, 2, 116] 513
|
100 |
+
│ └─MLPShifter: 2-2 [116, 2] [116, 2] --
|
101 |
+
│ │ └─Sequential: 3-5 [116, 2] [116, 2] --
|
102 |
+
│ │ │ └─Linear: 4-4 [116, 2] [116, 5] 15
|
103 |
+
│ │ │ └─Tanh: 4-5 [116, 5] [116, 5] --
|
104 |
+
│ │ │ └─Linear: 4-6 [116, 5] [116, 5] 30
|
105 |
+
│ │ │ └─Tanh: 4-7 [116, 5] [116, 5] --
|
106 |
+
│ │ │ └─Linear: 4-8 [116, 5] [116, 2] 12
|
107 |
+
│ │ │ └─Tanh: 4-9 [116, 2] [116, 2] --
|
108 |
+
├─Readouts: 1-3 [1, 112, 116, 15, 29] [1, 7440, 116] 8,477,649
|
109 |
+
│ └─Gaussian2DReadout2: 2-3 [1, 112, 116, 15, 29] [1, 7440, 116] 870,480
|
110 |
+
│ │ └─Sequential: 3-6 [7440, 2] [7440, 2] --
|
111 |
+
│ │ │ └─Linear: 4-10 [7440, 2] [7440, 30] 90
|
112 |
+
│ │ │ └─ELU: 4-11 [7440, 30] [7440, 30] --
|
113 |
+
│ │ │ └─Linear: 4-12 [7440, 30] [7440, 2] 62
|
114 |
+
│ │ │ └─Tanh: 4-13 [7440, 2] [7440, 2] --
|
115 |
+
│ │ └─Sequential: 3-7 [7440, 2] [7440, 2] (recursive)
|
116 |
+
│ │ │ └─Linear: 4-14 [7440, 2] [7440, 30] (recursive)
|
117 |
+
│ │ │ └─ELU: 4-15 [7440, 30] [7440, 30] --
|
118 |
+
│ │ │ └─Linear: 4-16 [7440, 30] [7440, 2] (recursive)
|
119 |
+
│ │ │ └─Tanh: 4-17 [7440, 2] [7440, 2] --
|
120 |
+
│ │ └─Sequential: 3-8 [7440, 2] [7440, 2] (recursive)
|
121 |
+
│ │ │ └─Linear: 4-18 [7440, 2] [7440, 30] (recursive)
|
122 |
+
│ │ │ └─ELU: 4-19 [7440, 30] [7440, 30] --
|
123 |
+
│ │ │ └─Linear: 4-20 [7440, 30] [7440, 2] (recursive)
|
124 |
+
│ │ │ └─Tanh: 4-21 [7440, 2] [7440, 2] --
|
125 |
+
│ │ └─Sequential: 3-9 [116, 4] [116, 112] --
|
126 |
+
│ │ │ └─Linear: 4-22 [116, 4] [116, 112] 560
|
127 |
+
│ │ │ └─LayerNorm: 4-23 [116, 112] [116, 112] 224
|
128 |
+
│ │ │ └─GELU: 4-24 [116, 112] [116, 112] --
|
129 |
+
│ │ │ └─Dropout: 4-25 [116, 112] [116, 112] --
|
130 |
+
│ │ │ └─Linear: 4-26 [116, 112] [116, 112] 12,656
|
131 |
+
│ │ │ └─Tanh: 4-27 [116, 112] [116, 112] --
|
132 |
+
├─Exponential: 1-4 [1, 7440, 116] [1, 7440, 116] --
|
133 |
+
=======================================================================================================================================
|
134 |
+
Total params: 12,278,365
|
135 |
+
Trainable params: 12,278,365
|
136 |
+
Non-trainable params: 0
|
137 |
+
Total mult-adds (Units.MEGABYTES): 679.88
|
138 |
+
=======================================================================================================================================
|
139 |
+
Input size (MB): 1.29
|
140 |
+
Forward/backward pass size (MB): 9208.73
|
141 |
+
Params size (MB): 11.40
|
142 |
+
Estimated Total Size (MB): 9221.42
|
143 |
+
=======================================================================================================================================
|
002/output.log
ADDED
@@ -0,0 +1,942 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Use bfloat16 for core module.
|
2 |
+
Use parallel attention and MLP in ViViT.
|
3 |
+
|
4 |
+
Epoch 001/400
|
5 |
+
Train loss: 121388096.00 correlation: 0.0109
|
6 |
+
Validation loss: 200734000.00 correlation: 0.0221
|
7 |
+
Elapse: 522.91s
|
8 |
+
|
9 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
10 |
+
|
11 |
+
Epoch 002/400
|
12 |
+
Train loss: 98318960.00 correlation: 0.0308
|
13 |
+
Validation loss: 199955104.00 correlation: 0.0339
|
14 |
+
Elapse: 525.64s
|
15 |
+
|
16 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
17 |
+
|
18 |
+
Epoch 003/400
|
19 |
+
Train loss: 97097640.00 correlation: 0.0413
|
20 |
+
Validation loss: 199270752.00 correlation: 0.0396
|
21 |
+
Elapse: 531.95s
|
22 |
+
|
23 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
24 |
+
|
25 |
+
Epoch 004/400
|
26 |
+
Train loss: 96457752.00 correlation: 0.0479
|
27 |
+
Validation loss: 198723456.00 correlation: 0.0421
|
28 |
+
Elapse: 536.86s
|
29 |
+
|
30 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
31 |
+
|
32 |
+
Epoch 005/400
|
33 |
+
Train loss: 95920056.00 correlation: 0.0541
|
34 |
+
Validation loss: 197835248.00 correlation: 0.0461
|
35 |
+
Elapse: 538.89s
|
36 |
+
|
37 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
38 |
+
|
39 |
+
Epoch 006/400
|
40 |
+
Train loss: 95131240.00 correlation: 0.0621
|
41 |
+
Validation loss: 196873360.00 correlation: 0.0519
|
42 |
+
Elapse: 542.34s
|
43 |
+
|
44 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
45 |
+
|
46 |
+
Epoch 007/400
|
47 |
+
Train loss: 94226616.00 correlation: 0.0710
|
48 |
+
Validation loss: 195726576.00 correlation: 0.0578
|
49 |
+
Elapse: 541.43s
|
50 |
+
|
51 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
52 |
+
|
53 |
+
Epoch 008/400
|
54 |
+
Train loss: 93506680.00 correlation: 0.0783
|
55 |
+
Validation loss: 194520016.00 correlation: 0.0654
|
56 |
+
Elapse: 541.56s
|
57 |
+
|
58 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
59 |
+
|
60 |
+
Epoch 009/400
|
61 |
+
Train loss: 92727504.00 correlation: 0.0871
|
62 |
+
Validation loss: 193465776.00 correlation: 0.0716
|
63 |
+
Elapse: 543.31s
|
64 |
+
|
65 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
66 |
+
|
67 |
+
Epoch 010/400
|
68 |
+
Train loss: 91843728.00 correlation: 0.0966
|
69 |
+
Validation loss: 192176672.00 correlation: 0.0791
|
70 |
+
Elapse: 541.68s
|
71 |
+
|
72 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
73 |
+
|
74 |
+
Epoch 011/400
|
75 |
+
Train loss: 90936304.00 correlation: 0.1063
|
76 |
+
Validation loss: 190695968.00 correlation: 0.0928
|
77 |
+
Elapse: 540.29s
|
78 |
+
|
79 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
80 |
+
|
81 |
+
Epoch 012/400
|
82 |
+
Train loss: 90051912.00 correlation: 0.1153
|
83 |
+
Validation loss: 189604784.00 correlation: 0.1011
|
84 |
+
Elapse: 542.29s
|
85 |
+
|
86 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
87 |
+
|
88 |
+
Epoch 013/400
|
89 |
+
Train loss: 89180568.00 correlation: 0.1245
|
90 |
+
Validation loss: 188031648.00 correlation: 0.1112
|
91 |
+
Elapse: 542.62s
|
92 |
+
|
93 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
94 |
+
|
95 |
+
Epoch 014/400
|
96 |
+
Train loss: 88307792.00 correlation: 0.1337
|
97 |
+
Validation loss: 186159440.00 correlation: 0.1226
|
98 |
+
Elapse: 540.81s
|
99 |
+
|
100 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
101 |
+
|
102 |
+
Epoch 015/400
|
103 |
+
Train loss: 87278960.00 correlation: 0.1436
|
104 |
+
Validation loss: 184683440.00 correlation: 0.1313
|
105 |
+
Elapse: 543.63s
|
106 |
+
|
107 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
108 |
+
|
109 |
+
Epoch 016/400
|
110 |
+
Train loss: 86609264.00 correlation: 0.1505
|
111 |
+
Validation loss: 183679264.00 correlation: 0.1374
|
112 |
+
Elapse: 544.07s
|
113 |
+
|
114 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
115 |
+
|
116 |
+
Epoch 017/400
|
117 |
+
Train loss: 85933704.00 correlation: 0.1573
|
118 |
+
Validation loss: 182858960.00 correlation: 0.1427
|
119 |
+
Elapse: 543.60s
|
120 |
+
|
121 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
122 |
+
|
123 |
+
Epoch 018/400
|
124 |
+
Train loss: 85316224.00 correlation: 0.1634
|
125 |
+
Validation loss: 181758608.00 correlation: 0.1502
|
126 |
+
Elapse: 543.09s
|
127 |
+
|
128 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
129 |
+
|
130 |
+
Epoch 019/400
|
131 |
+
Train loss: 84800144.00 correlation: 0.1686
|
132 |
+
Validation loss: 181267248.00 correlation: 0.1538
|
133 |
+
Elapse: 545.10s
|
134 |
+
|
135 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
136 |
+
|
137 |
+
Epoch 020/400
|
138 |
+
Train loss: 84276656.00 correlation: 0.1737
|
139 |
+
Validation loss: 180435344.00 correlation: 0.1578
|
140 |
+
Elapse: 545.34s
|
141 |
+
|
142 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
143 |
+
|
144 |
+
Epoch 021/400
|
145 |
+
Train loss: 83717728.00 correlation: 0.1793
|
146 |
+
Validation loss: 179796752.00 correlation: 0.1639
|
147 |
+
Elapse: 545.93s
|
148 |
+
|
149 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
150 |
+
|
151 |
+
Epoch 022/400
|
152 |
+
Train loss: 83306056.00 correlation: 0.1836
|
153 |
+
Validation loss: 178887952.00 correlation: 0.1689
|
154 |
+
Elapse: 545.45s
|
155 |
+
|
156 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
157 |
+
|
158 |
+
Epoch 023/400
|
159 |
+
Train loss: 82787680.00 correlation: 0.1887
|
160 |
+
Validation loss: 177999440.00 correlation: 0.1749
|
161 |
+
Elapse: 545.47s
|
162 |
+
|
163 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
164 |
+
|
165 |
+
Epoch 024/400
|
166 |
+
Train loss: 82335960.00 correlation: 0.1933
|
167 |
+
Validation loss: 177650256.00 correlation: 0.1774
|
168 |
+
Elapse: 545.75s
|
169 |
+
|
170 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
171 |
+
|
172 |
+
Epoch 025/400
|
173 |
+
Train loss: 82013392.00 correlation: 0.1962
|
174 |
+
Validation loss: 177572752.00 correlation: 0.1786
|
175 |
+
Elapse: 545.69s
|
176 |
+
|
177 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
178 |
+
|
179 |
+
Epoch 026/400
|
180 |
+
Train loss: 81675472.00 correlation: 0.1996
|
181 |
+
Validation loss: 176845120.00 correlation: 0.1841
|
182 |
+
Elapse: 545.58s
|
183 |
+
|
184 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
185 |
+
|
186 |
+
Epoch 027/400
|
187 |
+
Train loss: 81393008.00 correlation: 0.2025
|
188 |
+
Validation loss: 176056032.00 correlation: 0.1886
|
189 |
+
Elapse: 545.76s
|
190 |
+
|
191 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
192 |
+
|
193 |
+
Epoch 028/400
|
194 |
+
Train loss: 80972248.00 correlation: 0.2065
|
195 |
+
Validation loss: 175799008.00 correlation: 0.1898
|
196 |
+
Elapse: 545.76s
|
197 |
+
|
198 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
199 |
+
|
200 |
+
Epoch 029/400
|
201 |
+
Train loss: 80749744.00 correlation: 0.2086
|
202 |
+
Validation loss: 175376608.00 correlation: 0.1918
|
203 |
+
Elapse: 546.06s
|
204 |
+
|
205 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
206 |
+
|
207 |
+
Epoch 030/400
|
208 |
+
Train loss: 80453840.00 correlation: 0.2117
|
209 |
+
Validation loss: 174830400.00 correlation: 0.1967
|
210 |
+
Elapse: 546.10s
|
211 |
+
|
212 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
213 |
+
|
214 |
+
Epoch 031/400
|
215 |
+
Train loss: 80186704.00 correlation: 0.2145
|
216 |
+
Validation loss: 174322544.00 correlation: 0.1984
|
217 |
+
Elapse: 545.45s
|
218 |
+
|
219 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
220 |
+
|
221 |
+
Epoch 032/400
|
222 |
+
Train loss: 79856432.00 correlation: 0.2176
|
223 |
+
Validation loss: 174104672.00 correlation: 0.2003
|
224 |
+
Elapse: 545.77s
|
225 |
+
|
226 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
227 |
+
|
228 |
+
Epoch 033/400
|
229 |
+
Train loss: 79589576.00 correlation: 0.2200
|
230 |
+
Validation loss: 173607248.00 correlation: 0.2031
|
231 |
+
Elapse: 545.80s
|
232 |
+
|
233 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
234 |
+
|
235 |
+
Epoch 034/400
|
236 |
+
Train loss: 79380120.00 correlation: 0.2221
|
237 |
+
Validation loss: 173319472.00 correlation: 0.2055
|
238 |
+
Elapse: 545.70s
|
239 |
+
|
240 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
241 |
+
|
242 |
+
Epoch 035/400
|
243 |
+
Train loss: 79158640.00 correlation: 0.2243
|
244 |
+
Validation loss: 172901472.00 correlation: 0.2089
|
245 |
+
Elapse: 545.61s
|
246 |
+
|
247 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
248 |
+
|
249 |
+
Epoch 036/400
|
250 |
+
Train loss: 78927200.00 correlation: 0.2266
|
251 |
+
Validation loss: 172636560.00 correlation: 0.2097
|
252 |
+
Elapse: 546.53s
|
253 |
+
|
254 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
255 |
+
|
256 |
+
Epoch 037/400
|
257 |
+
Train loss: 78682176.00 correlation: 0.2288
|
258 |
+
Validation loss: 172407184.00 correlation: 0.2118
|
259 |
+
Elapse: 545.83s
|
260 |
+
|
261 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
262 |
+
|
263 |
+
Epoch 038/400
|
264 |
+
Train loss: 78582504.00 correlation: 0.2299
|
265 |
+
Validation loss: 172238496.00 correlation: 0.2137
|
266 |
+
Elapse: 542.71s
|
267 |
+
|
268 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
269 |
+
|
270 |
+
Epoch 039/400
|
271 |
+
Train loss: 78397632.00 correlation: 0.2314
|
272 |
+
Validation loss: 171969648.00 correlation: 0.2147
|
273 |
+
Elapse: 545.53s
|
274 |
+
|
275 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
276 |
+
|
277 |
+
Epoch 040/400
|
278 |
+
Train loss: 78234600.00 correlation: 0.2330
|
279 |
+
Validation loss: 171758000.00 correlation: 0.2170
|
280 |
+
Elapse: 545.77s
|
281 |
+
|
282 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
283 |
+
|
284 |
+
Epoch 041/400
|
285 |
+
Train loss: 78047656.00 correlation: 0.2349
|
286 |
+
Validation loss: 171651168.00 correlation: 0.2175
|
287 |
+
Elapse: 545.10s
|
288 |
+
|
289 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
290 |
+
|
291 |
+
Epoch 042/400
|
292 |
+
Train loss: 77868808.00 correlation: 0.2362
|
293 |
+
Validation loss: 171537312.00 correlation: 0.2173
|
294 |
+
Elapse: 545.58s
|
295 |
+
|
296 |
+
Epoch 043/400
|
297 |
+
Train loss: 77839128.00 correlation: 0.2370
|
298 |
+
Validation loss: 171300016.00 correlation: 0.2185
|
299 |
+
Elapse: 546.30s
|
300 |
+
|
301 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
302 |
+
|
303 |
+
Epoch 044/400
|
304 |
+
Train loss: 77629288.00 correlation: 0.2390
|
305 |
+
Validation loss: 171374944.00 correlation: 0.2191
|
306 |
+
Elapse: 546.42s
|
307 |
+
|
308 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
309 |
+
|
310 |
+
Epoch 045/400
|
311 |
+
Train loss: 77550776.00 correlation: 0.2396
|
312 |
+
Validation loss: 171207344.00 correlation: 0.2194
|
313 |
+
Elapse: 545.96s
|
314 |
+
|
315 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
316 |
+
|
317 |
+
Epoch 046/400
|
318 |
+
Train loss: 77437640.00 correlation: 0.2408
|
319 |
+
Validation loss: 171176240.00 correlation: 0.2198
|
320 |
+
Elapse: 546.38s
|
321 |
+
|
322 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
323 |
+
|
324 |
+
Epoch 047/400
|
325 |
+
Train loss: 77397712.00 correlation: 0.2412
|
326 |
+
Validation loss: 170808800.00 correlation: 0.2224
|
327 |
+
Elapse: 545.84s
|
328 |
+
|
329 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
330 |
+
|
331 |
+
Epoch 048/400
|
332 |
+
Train loss: 77307432.00 correlation: 0.2422
|
333 |
+
Validation loss: 170735520.00 correlation: 0.2233
|
334 |
+
Elapse: 546.33s
|
335 |
+
|
336 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
337 |
+
|
338 |
+
Epoch 049/400
|
339 |
+
Train loss: 77119432.00 correlation: 0.2439
|
340 |
+
Validation loss: 170442368.00 correlation: 0.2245
|
341 |
+
Elapse: 545.45s
|
342 |
+
|
343 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
344 |
+
|
345 |
+
Epoch 050/400
|
346 |
+
Train loss: 76988832.00 correlation: 0.2449
|
347 |
+
Validation loss: 170672960.00 correlation: 0.2232
|
348 |
+
Elapse: 544.34s
|
349 |
+
|
350 |
+
Epoch 051/400
|
351 |
+
Train loss: 76992464.00 correlation: 0.2450
|
352 |
+
Validation loss: 170562112.00 correlation: 0.2244
|
353 |
+
Elapse: 545.56s
|
354 |
+
|
355 |
+
Epoch 052/400
|
356 |
+
Train loss: 76925112.00 correlation: 0.2452
|
357 |
+
Validation loss: 170404016.00 correlation: 0.2248
|
358 |
+
Elapse: 545.72s
|
359 |
+
|
360 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
361 |
+
|
362 |
+
Epoch 053/400
|
363 |
+
Train loss: 76844464.00 correlation: 0.2460
|
364 |
+
Validation loss: 170137952.00 correlation: 0.2261
|
365 |
+
Elapse: 545.92s
|
366 |
+
|
367 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
368 |
+
|
369 |
+
Epoch 054/400
|
370 |
+
Train loss: 76812920.00 correlation: 0.2469
|
371 |
+
Validation loss: 170023120.00 correlation: 0.2259
|
372 |
+
Elapse: 545.56s
|
373 |
+
|
374 |
+
Epoch 055/400
|
375 |
+
Train loss: 76702536.00 correlation: 0.2475
|
376 |
+
Validation loss: 170054384.00 correlation: 0.2263
|
377 |
+
Elapse: 544.95s
|
378 |
+
|
379 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
380 |
+
|
381 |
+
Epoch 056/400
|
382 |
+
Train loss: 76612752.00 correlation: 0.2485
|
383 |
+
Validation loss: 170032864.00 correlation: 0.2272
|
384 |
+
Elapse: 545.49s
|
385 |
+
|
386 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
387 |
+
|
388 |
+
Epoch 057/400
|
389 |
+
Train loss: 76617696.00 correlation: 0.2485
|
390 |
+
Validation loss: 169630816.00 correlation: 0.2293
|
391 |
+
Elapse: 545.90s
|
392 |
+
|
393 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
394 |
+
|
395 |
+
Epoch 058/400
|
396 |
+
Train loss: 76465880.00 correlation: 0.2499
|
397 |
+
Validation loss: 169825600.00 correlation: 0.2283
|
398 |
+
Elapse: 545.37s
|
399 |
+
|
400 |
+
Epoch 059/400
|
401 |
+
Train loss: 76456912.00 correlation: 0.2499
|
402 |
+
Validation loss: 169766688.00 correlation: 0.2284
|
403 |
+
Elapse: 545.61s
|
404 |
+
|
405 |
+
Epoch 060/400
|
406 |
+
Train loss: 76426872.00 correlation: 0.2501
|
407 |
+
Validation loss: 169651072.00 correlation: 0.2298
|
408 |
+
Elapse: 545.66s
|
409 |
+
|
410 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
411 |
+
|
412 |
+
Epoch 061/400
|
413 |
+
Train loss: 76272176.00 correlation: 0.2515
|
414 |
+
Validation loss: 169694896.00 correlation: 0.2290
|
415 |
+
Elapse: 544.26s
|
416 |
+
|
417 |
+
Epoch 062/400
|
418 |
+
Train loss: 76381040.00 correlation: 0.2506
|
419 |
+
Validation loss: 169396208.00 correlation: 0.2316
|
420 |
+
Elapse: 544.91s
|
421 |
+
|
422 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
423 |
+
|
424 |
+
Epoch 063/400
|
425 |
+
Train loss: 76206744.00 correlation: 0.2523
|
426 |
+
Validation loss: 169683888.00 correlation: 0.2297
|
427 |
+
Elapse: 544.69s
|
428 |
+
|
429 |
+
Epoch 064/400
|
430 |
+
Train loss: 76167792.00 correlation: 0.2527
|
431 |
+
Validation loss: 169194928.00 correlation: 0.2329
|
432 |
+
Elapse: 545.55s
|
433 |
+
|
434 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
435 |
+
|
436 |
+
Epoch 065/400
|
437 |
+
Train loss: 76127384.00 correlation: 0.2528
|
438 |
+
Validation loss: 169763808.00 correlation: 0.2287
|
439 |
+
Elapse: 545.54s
|
440 |
+
|
441 |
+
Epoch 066/400
|
442 |
+
Train loss: 76104336.00 correlation: 0.2531
|
443 |
+
Validation loss: 169165280.00 correlation: 0.2327
|
444 |
+
Elapse: 545.65s
|
445 |
+
|
446 |
+
Epoch 067/400
|
447 |
+
Train loss: 76021512.00 correlation: 0.2539
|
448 |
+
Validation loss: 169219872.00 correlation: 0.2317
|
449 |
+
Elapse: 545.30s
|
450 |
+
|
451 |
+
Epoch 068/400
|
452 |
+
Train loss: 76148160.00 correlation: 0.2528
|
453 |
+
Validation loss: 169344656.00 correlation: 0.2314
|
454 |
+
Elapse: 545.59s
|
455 |
+
|
456 |
+
Epoch 069/400
|
457 |
+
Train loss: 75939984.00 correlation: 0.2545
|
458 |
+
Validation loss: 169043376.00 correlation: 0.2339
|
459 |
+
Elapse: 545.18s
|
460 |
+
|
461 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
462 |
+
|
463 |
+
Epoch 070/400
|
464 |
+
Train loss: 75822872.00 correlation: 0.2557
|
465 |
+
Validation loss: 169167760.00 correlation: 0.2328
|
466 |
+
Elapse: 544.88s
|
467 |
+
|
468 |
+
Epoch 071/400
|
469 |
+
Train loss: 75873072.00 correlation: 0.2551
|
470 |
+
Validation loss: 169123712.00 correlation: 0.2336
|
471 |
+
Elapse: 545.60s
|
472 |
+
|
473 |
+
Epoch 072/400
|
474 |
+
Train loss: 75867984.00 correlation: 0.2552
|
475 |
+
Validation loss: 168947232.00 correlation: 0.2344
|
476 |
+
Elapse: 545.61s
|
477 |
+
|
478 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
479 |
+
|
480 |
+
Epoch 073/400
|
481 |
+
Train loss: 75840912.00 correlation: 0.2555
|
482 |
+
Validation loss: 169026784.00 correlation: 0.2348
|
483 |
+
Elapse: 545.60s
|
484 |
+
|
485 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
486 |
+
|
487 |
+
Epoch 074/400
|
488 |
+
Train loss: 75855384.00 correlation: 0.2555
|
489 |
+
Validation loss: 168842592.00 correlation: 0.2341
|
490 |
+
Elapse: 545.99s
|
491 |
+
|
492 |
+
Epoch 075/400
|
493 |
+
Train loss: 75737744.00 correlation: 0.2565
|
494 |
+
Validation loss: 168971312.00 correlation: 0.2336
|
495 |
+
Elapse: 545.40s
|
496 |
+
|
497 |
+
Epoch 076/400
|
498 |
+
Train loss: 75735656.00 correlation: 0.2565
|
499 |
+
Validation loss: 168829920.00 correlation: 0.2338
|
500 |
+
Elapse: 546.00s
|
501 |
+
|
502 |
+
Epoch 077/400
|
503 |
+
Train loss: 75607888.00 correlation: 0.2576
|
504 |
+
Validation loss: 168935968.00 correlation: 0.2349
|
505 |
+
Elapse: 545.47s
|
506 |
+
|
507 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
508 |
+
|
509 |
+
Epoch 078/400
|
510 |
+
Train loss: 75679128.00 correlation: 0.2571
|
511 |
+
Validation loss: 168987280.00 correlation: 0.2328
|
512 |
+
Elapse: 545.11s
|
513 |
+
|
514 |
+
Epoch 079/400
|
515 |
+
Train loss: 75621152.00 correlation: 0.2574
|
516 |
+
Validation loss: 168822512.00 correlation: 0.2347
|
517 |
+
Elapse: 545.59s
|
518 |
+
|
519 |
+
Epoch 080/400
|
520 |
+
Train loss: 75483728.00 correlation: 0.2590
|
521 |
+
Validation loss: 168774416.00 correlation: 0.2347
|
522 |
+
Elapse: 545.47s
|
523 |
+
|
524 |
+
Epoch 081/400
|
525 |
+
Train loss: 75531304.00 correlation: 0.2586
|
526 |
+
Validation loss: 169126304.00 correlation: 0.2331
|
527 |
+
Elapse: 545.29s
|
528 |
+
|
529 |
+
Epoch 082/400
|
530 |
+
Train loss: 75558736.00 correlation: 0.2583
|
531 |
+
Validation loss: 168670160.00 correlation: 0.2354
|
532 |
+
Elapse: 545.72s
|
533 |
+
|
534 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
535 |
+
|
536 |
+
Epoch 083/400
|
537 |
+
Train loss: 75590176.00 correlation: 0.2579
|
538 |
+
Validation loss: 169091472.00 correlation: 0.2330
|
539 |
+
Elapse: 545.76s
|
540 |
+
|
541 |
+
Epoch 084/400
|
542 |
+
Train loss: 75406416.00 correlation: 0.2595
|
543 |
+
Validation loss: 169084192.00 correlation: 0.2329
|
544 |
+
Elapse: 545.78s
|
545 |
+
|
546 |
+
Epoch 085/400
|
547 |
+
Train loss: 75376912.00 correlation: 0.2599
|
548 |
+
Validation loss: 168861952.00 correlation: 0.2341
|
549 |
+
Elapse: 545.89s
|
550 |
+
|
551 |
+
Epoch 086/400
|
552 |
+
Train loss: 75349048.00 correlation: 0.2604
|
553 |
+
Validation loss: 168882304.00 correlation: 0.2349
|
554 |
+
Elapse: 545.73s
|
555 |
+
|
556 |
+
Epoch 087/400
|
557 |
+
Train loss: 75302984.00 correlation: 0.2607
|
558 |
+
Validation loss: 169006784.00 correlation: 0.2333
|
559 |
+
Elapse: 545.26s
|
560 |
+
|
561 |
+
Loaded checkpoint from epoch 82 (correlation: 0.2354).
|
562 |
+
|
563 |
+
Reduce learning rate of core to 1.4400e-03 (num. reduce: 1).
|
564 |
+
Reduce learning rate of readouts to 1.0800e-03 (num. reduce: 1).
|
565 |
+
Reduce learning rate of shifters to 1.0800e-03 (num. reduce: 1).
|
566 |
+
|
567 |
+
Epoch 088/400
|
568 |
+
Train loss: 73472912.00 correlation: 0.2760
|
569 |
+
Validation loss: 166967968.00 correlation: 0.2466
|
570 |
+
Elapse: 546.46s
|
571 |
+
|
572 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
573 |
+
|
574 |
+
Epoch 089/400
|
575 |
+
Train loss: 72834528.00 correlation: 0.2820
|
576 |
+
Validation loss: 166834160.00 correlation: 0.2485
|
577 |
+
Elapse: 546.50s
|
578 |
+
|
579 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
580 |
+
|
581 |
+
Epoch 090/400
|
582 |
+
Train loss: 72607408.00 correlation: 0.2844
|
583 |
+
Validation loss: 166764992.00 correlation: 0.2490
|
584 |
+
Elapse: 546.18s
|
585 |
+
|
586 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
587 |
+
|
588 |
+
Epoch 091/400
|
589 |
+
Train loss: 72571872.00 correlation: 0.2846
|
590 |
+
Validation loss: 166824368.00 correlation: 0.2476
|
591 |
+
Elapse: 546.25s
|
592 |
+
|
593 |
+
Epoch 092/400
|
594 |
+
Train loss: 72491600.00 correlation: 0.2854
|
595 |
+
Validation loss: 166791872.00 correlation: 0.2474
|
596 |
+
Elapse: 545.90s
|
597 |
+
|
598 |
+
Epoch 093/400
|
599 |
+
Train loss: 72479560.00 correlation: 0.2856
|
600 |
+
Validation loss: 166900064.00 correlation: 0.2473
|
601 |
+
Elapse: 546.88s
|
602 |
+
|
603 |
+
Epoch 094/400
|
604 |
+
Train loss: 72391640.00 correlation: 0.2867
|
605 |
+
Validation loss: 166895872.00 correlation: 0.2471
|
606 |
+
Elapse: 546.67s
|
607 |
+
|
608 |
+
Epoch 095/400
|
609 |
+
Train loss: 72406800.00 correlation: 0.2865
|
610 |
+
Validation loss: 166785824.00 correlation: 0.2477
|
611 |
+
Elapse: 546.76s
|
612 |
+
|
613 |
+
Loaded checkpoint from epoch 90 (correlation: 0.2490).
|
614 |
+
|
615 |
+
Reduce learning rate of core to 4.3200e-04 (num. reduce: 1).
|
616 |
+
Reduce learning rate of readouts to 3.2400e-04 (num. reduce: 1).
|
617 |
+
Reduce learning rate of shifters to 3.2400e-04 (num. reduce: 1).
|
618 |
+
|
619 |
+
Epoch 096/400
|
620 |
+
Train loss: 71820392.00 correlation: 0.2914
|
621 |
+
Validation loss: 166357664.00 correlation: 0.2510
|
622 |
+
Elapse: 546.29s
|
623 |
+
|
624 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
625 |
+
|
626 |
+
Epoch 097/400
|
627 |
+
Train loss: 71646128.00 correlation: 0.2926
|
628 |
+
Validation loss: 166358480.00 correlation: 0.2512
|
629 |
+
Elapse: 546.63s
|
630 |
+
|
631 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
632 |
+
|
633 |
+
Epoch 098/400
|
634 |
+
Train loss: 71469944.00 correlation: 0.2943
|
635 |
+
Validation loss: 166261168.00 correlation: 0.2520
|
636 |
+
Elapse: 547.33s
|
637 |
+
|
638 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
639 |
+
|
640 |
+
Epoch 099/400
|
641 |
+
Train loss: 71457032.00 correlation: 0.2945
|
642 |
+
Validation loss: 166242256.00 correlation: 0.2517
|
643 |
+
Elapse: 547.22s
|
644 |
+
|
645 |
+
Epoch 100/400
|
646 |
+
Train loss: 71381520.00 correlation: 0.2953
|
647 |
+
Validation loss: 166269072.00 correlation: 0.2516
|
648 |
+
Elapse: 546.93s
|
649 |
+
|
650 |
+
Epoch 101/400
|
651 |
+
Train loss: 71365904.00 correlation: 0.2954
|
652 |
+
Validation loss: 166306016.00 correlation: 0.2512
|
653 |
+
Elapse: 547.14s
|
654 |
+
|
655 |
+
Epoch 102/400
|
656 |
+
Train loss: 71313408.00 correlation: 0.2956
|
657 |
+
Validation loss: 166202720.00 correlation: 0.2520
|
658 |
+
Elapse: 547.18s
|
659 |
+
|
660 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
661 |
+
|
662 |
+
Epoch 103/400
|
663 |
+
Train loss: 71246520.00 correlation: 0.2963
|
664 |
+
Validation loss: 166201664.00 correlation: 0.2519
|
665 |
+
Elapse: 546.59s
|
666 |
+
|
667 |
+
Epoch 104/400
|
668 |
+
Train loss: 71237544.00 correlation: 0.2967
|
669 |
+
Validation loss: 166225280.00 correlation: 0.2516
|
670 |
+
Elapse: 546.47s
|
671 |
+
|
672 |
+
Epoch 105/400
|
673 |
+
Train loss: 71175248.00 correlation: 0.2973
|
674 |
+
Validation loss: 166234304.00 correlation: 0.2515
|
675 |
+
Elapse: 546.73s
|
676 |
+
|
677 |
+
Epoch 106/400
|
678 |
+
Train loss: 71139096.00 correlation: 0.2976
|
679 |
+
Validation loss: 166179840.00 correlation: 0.2518
|
680 |
+
Elapse: 547.27s
|
681 |
+
|
682 |
+
Epoch 107/400
|
683 |
+
Train loss: 71152664.00 correlation: 0.2972
|
684 |
+
Validation loss: 166277328.00 correlation: 0.2509
|
685 |
+
Elapse: 547.28s
|
686 |
+
|
687 |
+
Loaded checkpoint from epoch 102 (correlation: 0.2520).
|
688 |
+
|
689 |
+
Reduce learning rate of core to 1.2960e-04 (num. reduce: 1).
|
690 |
+
Reduce learning rate of readouts to 9.7200e-05 (num. reduce: 1).
|
691 |
+
Reduce learning rate of shifters to 9.7200e-05 (num. reduce: 1).
|
692 |
+
|
693 |
+
Epoch 108/400
|
694 |
+
Train loss: 70975272.00 correlation: 0.2990
|
695 |
+
Validation loss: 166102416.00 correlation: 0.2526
|
696 |
+
Elapse: 547.38s
|
697 |
+
|
698 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
699 |
+
|
700 |
+
Epoch 109/400
|
701 |
+
Train loss: 70927400.00 correlation: 0.2990
|
702 |
+
Validation loss: 166090848.00 correlation: 0.2526
|
703 |
+
Elapse: 547.10s
|
704 |
+
|
705 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
706 |
+
|
707 |
+
Epoch 110/400
|
708 |
+
Train loss: 70928176.00 correlation: 0.2993
|
709 |
+
Validation loss: 166087520.00 correlation: 0.2526
|
710 |
+
Elapse: 547.24s
|
711 |
+
|
712 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
713 |
+
|
714 |
+
Epoch 111/400
|
715 |
+
Train loss: 70948912.00 correlation: 0.2989
|
716 |
+
Validation loss: 166067424.00 correlation: 0.2526
|
717 |
+
Elapse: 547.30s
|
718 |
+
|
719 |
+
Epoch 112/400
|
720 |
+
Train loss: 70843856.00 correlation: 0.2999
|
721 |
+
Validation loss: 166089904.00 correlation: 0.2527
|
722 |
+
Elapse: 547.44s
|
723 |
+
|
724 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
725 |
+
|
726 |
+
Epoch 113/400
|
727 |
+
Train loss: 70930864.00 correlation: 0.2991
|
728 |
+
Validation loss: 166048192.00 correlation: 0.2527
|
729 |
+
Elapse: 547.22s
|
730 |
+
|
731 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
732 |
+
|
733 |
+
Epoch 114/400
|
734 |
+
Train loss: 70888224.00 correlation: 0.2998
|
735 |
+
Validation loss: 166076336.00 correlation: 0.2525
|
736 |
+
Elapse: 547.07s
|
737 |
+
|
738 |
+
Epoch 115/400
|
739 |
+
Train loss: 70807400.00 correlation: 0.3003
|
740 |
+
Validation loss: 166078992.00 correlation: 0.2524
|
741 |
+
Elapse: 547.34s
|
742 |
+
|
743 |
+
Epoch 116/400
|
744 |
+
Train loss: 70784824.00 correlation: 0.3006
|
745 |
+
Validation loss: 166036512.00 correlation: 0.2528
|
746 |
+
Elapse: 547.33s
|
747 |
+
|
748 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
749 |
+
|
750 |
+
Epoch 117/400
|
751 |
+
Train loss: 70760888.00 correlation: 0.3007
|
752 |
+
Validation loss: 166109792.00 correlation: 0.2523
|
753 |
+
Elapse: 547.36s
|
754 |
+
|
755 |
+
Epoch 118/400
|
756 |
+
Train loss: 70793224.00 correlation: 0.3003
|
757 |
+
Validation loss: 166033088.00 correlation: 0.2527
|
758 |
+
Elapse: 547.66s
|
759 |
+
|
760 |
+
Epoch 119/400
|
761 |
+
Train loss: 70801416.00 correlation: 0.3002
|
762 |
+
Validation loss: 166062960.00 correlation: 0.2529
|
763 |
+
Elapse: 547.68s
|
764 |
+
|
765 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
766 |
+
|
767 |
+
Epoch 120/400
|
768 |
+
Train loss: 70748944.00 correlation: 0.3009
|
769 |
+
Validation loss: 166063152.00 correlation: 0.2524
|
770 |
+
Elapse: 547.18s
|
771 |
+
|
772 |
+
Epoch 121/400
|
773 |
+
Train loss: 70736464.00 correlation: 0.3010
|
774 |
+
Validation loss: 166058976.00 correlation: 0.2528
|
775 |
+
Elapse: 547.53s
|
776 |
+
|
777 |
+
Epoch 122/400
|
778 |
+
Train loss: 70653008.00 correlation: 0.3019
|
779 |
+
Validation loss: 166041920.00 correlation: 0.2527
|
780 |
+
Elapse: 547.68s
|
781 |
+
|
782 |
+
Epoch 123/400
|
783 |
+
Train loss: 70723656.00 correlation: 0.3011
|
784 |
+
Validation loss: 166053344.00 correlation: 0.2525
|
785 |
+
Elapse: 547.37s
|
786 |
+
|
787 |
+
Epoch 124/400
|
788 |
+
Train loss: 70689936.00 correlation: 0.3016
|
789 |
+
Validation loss: 166053472.00 correlation: 0.2526
|
790 |
+
Elapse: 547.93s
|
791 |
+
|
792 |
+
Loaded checkpoint from epoch 119 (correlation: 0.2529).
|
793 |
+
|
794 |
+
Reduce learning rate of core to 3.8880e-05 (num. reduce: 1).
|
795 |
+
Reduce learning rate of readouts to 2.9160e-05 (num. reduce: 1).
|
796 |
+
Reduce learning rate of shifters to 2.9160e-05 (num. reduce: 1).
|
797 |
+
|
798 |
+
Epoch 125/400
|
799 |
+
Train loss: 70604440.00 correlation: 0.3023
|
800 |
+
Validation loss: 166025312.00 correlation: 0.2529
|
801 |
+
Elapse: 547.63s
|
802 |
+
|
803 |
+
Epoch 126/400
|
804 |
+
Train loss: 70608160.00 correlation: 0.3021
|
805 |
+
Validation loss: 166010512.00 correlation: 0.2530
|
806 |
+
Elapse: 547.36s
|
807 |
+
|
808 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
809 |
+
|
810 |
+
Epoch 127/400
|
811 |
+
Train loss: 70626448.00 correlation: 0.3020
|
812 |
+
Validation loss: 166023648.00 correlation: 0.2528
|
813 |
+
Elapse: 547.13s
|
814 |
+
|
815 |
+
Epoch 128/400
|
816 |
+
Train loss: 70612096.00 correlation: 0.3018
|
817 |
+
Validation loss: 166023216.00 correlation: 0.2529
|
818 |
+
Elapse: 546.99s
|
819 |
+
|
820 |
+
Epoch 129/400
|
821 |
+
Train loss: 70635640.00 correlation: 0.3020
|
822 |
+
Validation loss: 166036208.00 correlation: 0.2528
|
823 |
+
Elapse: 547.23s
|
824 |
+
|
825 |
+
Epoch 130/400
|
826 |
+
Train loss: 70666920.00 correlation: 0.3015
|
827 |
+
Validation loss: 166035808.00 correlation: 0.2527
|
828 |
+
Elapse: 546.99s
|
829 |
+
|
830 |
+
Epoch 131/400
|
831 |
+
Train loss: 70564592.00 correlation: 0.3028
|
832 |
+
Validation loss: 166005856.00 correlation: 0.2528
|
833 |
+
Elapse: 547.30s
|
834 |
+
|
835 |
+
Loaded checkpoint from epoch 126 (correlation: 0.2530).
|
836 |
+
|
837 |
+
Reduce learning rate of core to 1.1664e-05 (num. reduce: 1).
|
838 |
+
Reduce learning rate of readouts to 8.7480e-06 (num. reduce: 1).
|
839 |
+
Reduce learning rate of shifters to 8.7480e-06 (num. reduce: 1).
|
840 |
+
|
841 |
+
Epoch 132/400
|
842 |
+
Train loss: 70603848.00 correlation: 0.3022
|
843 |
+
Validation loss: 166004944.00 correlation: 0.2530
|
844 |
+
Elapse: 547.32s
|
845 |
+
|
846 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
|
847 |
+
|
848 |
+
Epoch 133/400
|
849 |
+
Train loss: 70533872.00 correlation: 0.3031
|
850 |
+
Validation loss: 166019360.00 correlation: 0.2529
|
851 |
+
Elapse: 547.50s
|
852 |
+
|
853 |
+
Epoch 134/400
|
854 |
+
Train loss: 70635248.00 correlation: 0.3019
|
855 |
+
Validation loss: 166021888.00 correlation: 0.2529
|
856 |
+
Elapse: 547.34s
|
857 |
+
|
858 |
+
Epoch 135/400
|
859 |
+
Train loss: 70620176.00 correlation: 0.3020
|
860 |
+
Validation loss: 166009888.00 correlation: 0.2529
|
861 |
+
Elapse: 546.38s
|
862 |
+
|
863 |
+
Epoch 136/400
|
864 |
+
Train loss: 70572368.00 correlation: 0.3023
|
865 |
+
Validation loss: 166012144.00 correlation: 0.2529
|
866 |
+
Elapse: 547.10s
|
867 |
+
|
868 |
+
Epoch 137/400
|
869 |
+
Train loss: 70658640.00 correlation: 0.3016
|
870 |
+
Validation loss: 166018080.00 correlation: 0.2529
|
871 |
+
Elapse: 546.90s
|
872 |
+
|
873 |
+
Loaded checkpoint from epoch 132 (correlation: 0.2530).
|
874 |
+
|
875 |
+
Reduce learning rate of core to 3.4992e-06 (num. reduce: 1).
|
876 |
+
Reduce learning rate of readouts to 2.6244e-06 (num. reduce: 1).
|
877 |
+
Reduce learning rate of shifters to 2.6244e-06 (num. reduce: 1).
|
878 |
+
|
879 |
+
Epoch 138/400
|
880 |
+
Train loss: 70545520.00 correlation: 0.3026
|
881 |
+
Validation loss: 166011936.00 correlation: 0.2530
|
882 |
+
Elapse: 546.72s
|
883 |
+
|
884 |
+
Epoch 139/400
|
885 |
+
Train loss: 70622800.00 correlation: 0.3018
|
886 |
+
Validation loss: 166013088.00 correlation: 0.2529
|
887 |
+
Elapse: 547.01s
|
888 |
+
|
889 |
+
Epoch 140/400
|
890 |
+
Train loss: 70572936.00 correlation: 0.3025
|
891 |
+
Validation loss: 166013696.00 correlation: 0.2529
|
892 |
+
Elapse: 547.38s
|
893 |
+
|
894 |
+
Epoch 141/400
|
895 |
+
Train loss: 70624016.00 correlation: 0.3020
|
896 |
+
Validation loss: 166012496.00 correlation: 0.2530
|
897 |
+
Elapse: 546.98s
|
898 |
+
|
899 |
+
Epoch 142/400
|
900 |
+
Train loss: 70651392.00 correlation: 0.3018
|
901 |
+
Validation loss: 166017120.00 correlation: 0.2529
|
902 |
+
Elapse: 547.57s
|
903 |
+
|
904 |
+
Loaded checkpoint from epoch 132 (correlation: 0.2530).
|
905 |
+
|
906 |
+
Reduce learning rate of core to 1.0498e-06 (num. reduce: 2).
|
907 |
+
Reduce learning rate of readouts to 7.8732e-07 (num. reduce: 2).
|
908 |
+
Reduce learning rate of shifters to 7.8732e-07 (num. reduce: 2).
|
909 |
+
|
910 |
+
Epoch 143/400
|
911 |
+
Train loss: 70616608.00 correlation: 0.3018
|
912 |
+
Validation loss: 166009488.00 correlation: 0.2530
|
913 |
+
Elapse: 547.46s
|
914 |
+
|
915 |
+
Epoch 144/400
|
916 |
+
Train loss: 70557224.00 correlation: 0.3027
|
917 |
+
Validation loss: 166010240.00 correlation: 0.2530
|
918 |
+
Elapse: 547.42s
|
919 |
+
|
920 |
+
Epoch 145/400
|
921 |
+
Train loss: 70617064.00 correlation: 0.3020
|
922 |
+
Validation loss: 166011824.00 correlation: 0.2530
|
923 |
+
Elapse: 547.48s
|
924 |
+
|
925 |
+
Epoch 146/400
|
926 |
+
Train loss: 70601720.00 correlation: 0.3022
|
927 |
+
Validation loss: 166010880.00 correlation: 0.2530
|
928 |
+
Elapse: 547.26s
|
929 |
+
|
930 |
+
Epoch 147/400
|
931 |
+
Train loss: 70616768.00 correlation: 0.3021
|
932 |
+
Validation loss: 166012944.00 correlation: 0.2530
|
933 |
+
Elapse: 547.43s
|
934 |
+
|
935 |
+
Model has not improved after 2 LR reductions.
|
936 |
+
|
937 |
+
Loaded checkpoint from epoch 132 (correlation: 0.2530).
|
938 |
+
|
939 |
+
|
940 |
+
ValidationA: 0.2508 B: 0.2804 C: 0.2750 D: 0.2393 E: 0.2390 F: 0.2346 G: 0.2573 H: 0.2379 I: 0.2555 J: 0.2599 average: 0.2530
|
941 |
+
|
942 |
+
Results saved to /home/storage/runs/vivit_ensemble/009.
|
003/args.yaml
ADDED
@@ -0,0 +1,87 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
adam_beta1: 0.9
|
2 |
+
adam_beta2: 0.999
|
3 |
+
adam_eps: 1e-08
|
4 |
+
batch_size: 6
|
5 |
+
cache_data: false
|
6 |
+
center_crop: 1.0
|
7 |
+
clear_output_dir: true
|
8 |
+
core: vivit
|
9 |
+
core_behavior_mode: 2
|
10 |
+
core_compile: false
|
11 |
+
core_drop_path: 0.0505
|
12 |
+
core_emb_dim: 112
|
13 |
+
core_ff_activation: gelu
|
14 |
+
core_ff_dropout: 0.0592
|
15 |
+
core_flash_attention: 1
|
16 |
+
core_head_dim: 48
|
17 |
+
core_lr: 0.0048
|
18 |
+
core_mha_dropout: 0.358
|
19 |
+
core_mlp_dim: 136
|
20 |
+
core_norm_qk: false
|
21 |
+
core_num_heads: 11
|
22 |
+
core_p_dropout: 0.1338
|
23 |
+
core_parallel_attention: true
|
24 |
+
core_patch_mode: 0
|
25 |
+
core_pos_encoding: 3
|
26 |
+
core_spatial_depth: 3
|
27 |
+
core_spatial_patch_size: 7
|
28 |
+
core_spatial_patch_stride: 2
|
29 |
+
core_temporal_depth: 5
|
30 |
+
core_temporal_patch_size: 25
|
31 |
+
core_temporal_patch_stride: 1
|
32 |
+
core_weight_decay: 0.1789
|
33 |
+
criterion: poisson_correlation
|
34 |
+
critic_mode: 0
|
35 |
+
crop_frame: 140
|
36 |
+
data: /home/sensorium2023
|
37 |
+
deterministic: false
|
38 |
+
device: cuda
|
39 |
+
dpi: 120
|
40 |
+
ds_mode: 3
|
41 |
+
ds_scale: 1
|
42 |
+
epochs: 400
|
43 |
+
format: svg
|
44 |
+
git_hash: 1033c29
|
45 |
+
grad_checkpointing: 0
|
46 |
+
grad_norm: null
|
47 |
+
input_shapes:
|
48 |
+
behavior: [2, 140]
|
49 |
+
pupil_center: [2, 140]
|
50 |
+
video: [1, 140, 36, 64]
|
51 |
+
limit_data: null
|
52 |
+
lr: 0.0036
|
53 |
+
max_frame: 300
|
54 |
+
micro_batch_size: 6
|
55 |
+
modulator_mode: 0
|
56 |
+
mouse_ids: [A, B, C, D, E, F, G, H, I, J]
|
57 |
+
num_workers: 2
|
58 |
+
output_dir: /home/storage/runs/003
|
59 |
+
output_mode: 1
|
60 |
+
output_shapes:
|
61 |
+
A: [7440, 140]
|
62 |
+
B: [7928, 140]
|
63 |
+
C: [8285, 140]
|
64 |
+
D: [7671, 140]
|
65 |
+
E: [7495, 140]
|
66 |
+
F: [7863, 140]
|
67 |
+
G: [7908, 140]
|
68 |
+
H: [8202, 140]
|
69 |
+
I: [7939, 140]
|
70 |
+
J: [8122, 140]
|
71 |
+
precision: "32"
|
72 |
+
pretrain_core: null
|
73 |
+
readout: gaussian2d
|
74 |
+
readout_bias_mode: 2
|
75 |
+
readout_dropout: 0.0
|
76 |
+
readout_grid_mode: 1
|
77 |
+
restore: null
|
78 |
+
save_plots: false
|
79 |
+
seed: 12
|
80 |
+
shifter_layers: 3
|
81 |
+
shifter_mode: 1
|
82 |
+
shifter_size: 5
|
83 |
+
stat_mode: 1
|
84 |
+
trainable_params: 12278365
|
85 |
+
transform_mode: 2
|
86 |
+
verbose: 1
|
87 |
+
weight_decay: 0.3939
|
003/ckpt/model_state.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09874ebf6e03ea617ccd08af30de997d9ca2d372fd68f9fe26696e58b675f025
|
3 |
+
size 148268583
|
003/evaluation.yaml
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
validation: {A: 0.24746963381767273, B: 0.27505889534950256, C: 0.27303239703178406,
|
2 |
+
D: 0.23642510175704956, E: 0.23546315729618073, F: 0.23425357043743134, G: 0.2543371021747589,
|
3 |
+
H: 0.23437707126140594, I: 0.2602153420448303, J: 0.2588430643081665, average: 0.25094753354787824}
|
003/model.txt
ADDED
@@ -0,0 +1,143 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
=======================================================================================================================================
|
2 |
+
Layer (type:depth-idx) Input Shape Output Shape Param #
|
3 |
+
=======================================================================================================================================
|
4 |
+
Model -- [1, 7440, 116] --
|
5 |
+
├─ViViTCore: 1-1 -- [1, 112, 116, 15, 29] --
|
6 |
+
│ └─ViViT: 2-1 [1, 5, 140, 36, 64] [1, 112, 116, 15, 29] --
|
7 |
+
│ │ └─Tokenizer: 3-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] 79,632
|
8 |
+
│ │ │ └─Sequential: 4-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] --
|
9 |
+
│ │ │ │ └─Unfold3d: 5-1 [1, 5, 140, 36, 64] [1, 116, 435, 6125] --
|
10 |
+
│ │ │ │ └─LayerNorm: 5-2 [1, 116, 435, 6125] [1, 116, 435, 6125] 12,250
|
11 |
+
│ │ │ │ └─Linear: 5-3 [1, 116, 435, 6125] [1, 116, 435, 112] 686,112
|
12 |
+
│ │ │ │ └─LayerNorm: 5-4 [1, 116, 435, 112] [1, 116, 435, 112] 224
|
13 |
+
│ │ │ │ └─Dropout: 5-5 [1, 116, 435, 112] [1, 116, 435, 112] --
|
14 |
+
│ │ └─Transformer: 3-2 [116, 435, 112] [116, 435, 112] --
|
15 |
+
│ │ │ └─ModuleList: 4-2 -- -- --
|
16 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-6 [116, 435, 112] [116, 435, 112] --
|
17 |
+
│ │ │ │ │ └─LayerNorm: 6-1 [116, 435, 112] [116, 435, 112] 224
|
18 |
+
│ │ │ │ │ └─Linear: 6-2 [116, 435, 112] [116, 435, 1720] 192,640
|
19 |
+
│ │ │ │ │ └─Linear: 6-3 [116, 435, 528] [116, 435, 112] 59,136
|
20 |
+
│ │ │ │ │ └─DropPath: 6-4 [116, 435, 112] [116, 435, 112] --
|
21 |
+
│ │ │ │ │ └─Sequential: 6-5 [116, 435, 136] [116, 435, 112] --
|
22 |
+
│ │ │ │ │ │ └─GELU: 7-1 [116, 435, 136] [116, 435, 136] --
|
23 |
+
│ │ │ │ │ │ └─Dropout: 7-2 [116, 435, 136] [116, 435, 136] --
|
24 |
+
│ │ │ │ │ │ └─Linear: 7-3 [116, 435, 136] [116, 435, 112] 15,232
|
25 |
+
│ │ │ │ │ └─DropPath: 6-6 [116, 435, 112] [116, 435, 112] --
|
26 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-7 [116, 435, 112] [116, 435, 112] --
|
27 |
+
│ │ │ │ │ └─LayerNorm: 6-7 [116, 435, 112] [116, 435, 112] 224
|
28 |
+
│ │ │ │ │ └─Linear: 6-8 [116, 435, 112] [116, 435, 1720] 192,640
|
29 |
+
│ │ │ │ │ └─Linear: 6-9 [116, 435, 528] [116, 435, 112] 59,136
|
30 |
+
│ │ │ │ │ └─DropPath: 6-10 [116, 435, 112] [116, 435, 112] --
|
31 |
+
│ │ │ │ │ └─Sequential: 6-11 [116, 435, 136] [116, 435, 112] --
|
32 |
+
│ │ │ │ │ │ └─GELU: 7-4 [116, 435, 136] [116, 435, 136] --
|
33 |
+
│ │ │ │ │ │ └─Dropout: 7-5 [116, 435, 136] [116, 435, 136] --
|
34 |
+
│ │ │ │ │ │ └─Linear: 7-6 [116, 435, 136] [116, 435, 112] 15,232
|
35 |
+
│ │ │ │ │ └─DropPath: 6-12 [116, 435, 112] [116, 435, 112] --
|
36 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-8 [116, 435, 112] [116, 435, 112] --
|
37 |
+
│ │ │ │ │ └─LayerNorm: 6-13 [116, 435, 112] [116, 435, 112] 224
|
38 |
+
│ │ │ │ │ └─Linear: 6-14 [116, 435, 112] [116, 435, 1720] 192,640
|
39 |
+
│ │ │ │ │ └─Linear: 6-15 [116, 435, 528] [116, 435, 112] 59,136
|
40 |
+
│ │ │ │ │ └─DropPath: 6-16 [116, 435, 112] [116, 435, 112] --
|
41 |
+
│ │ │ │ │ └─Sequential: 6-17 [116, 435, 136] [116, 435, 112] --
|
42 |
+
│ │ │ │ │ │ └─GELU: 7-7 [116, 435, 136] [116, 435, 136] --
|
43 |
+
│ │ │ │ │ │ └─Dropout: 7-8 [116, 435, 136] [116, 435, 136] --
|
44 |
+
│ │ │ │ │ │ └─Linear: 7-9 [116, 435, 136] [116, 435, 112] 15,232
|
45 |
+
│ │ │ │ │ └─DropPath: 6-18 [116, 435, 112] [116, 435, 112] --
|
46 |
+
│ │ └─Transformer: 3-3 [435, 116, 112] [435, 116, 112] --
|
47 |
+
│ │ │ └─ModuleList: 4-3 -- -- --
|
48 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-9 [435, 116, 112] [435, 116, 112] --
|
49 |
+
│ │ │ │ │ └─LayerNorm: 6-19 [435, 116, 112] [435, 116, 112] 224
|
50 |
+
│ │ │ │ │ └─Linear: 6-20 [435, 116, 112] [435, 116, 1720] 192,640
|
51 |
+
│ │ │ │ │ └─Linear: 6-21 [435, 116, 528] [435, 116, 112] 59,136
|
52 |
+
│ │ │ │ │ └─DropPath: 6-22 [435, 116, 112] [435, 116, 112] --
|
53 |
+
│ │ │ │ │ └─Sequential: 6-23 [435, 116, 136] [435, 116, 112] --
|
54 |
+
│ │ │ │ │ │ └─GELU: 7-10 [435, 116, 136] [435, 116, 136] --
|
55 |
+
│ │ │ │ │ │ └─Dropout: 7-11 [435, 116, 136] [435, 116, 136] --
|
56 |
+
│ │ │ │ │ │ └─Linear: 7-12 [435, 116, 136] [435, 116, 112] 15,232
|
57 |
+
│ │ │ │ │ └─DropPath: 6-24 [435, 116, 112] [435, 116, 112] --
|
58 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-10 [435, 116, 112] [435, 116, 112] --
|
59 |
+
│ │ │ │ │ └─LayerNorm: 6-25 [435, 116, 112] [435, 116, 112] 224
|
60 |
+
│ │ │ │ │ └─Linear: 6-26 [435, 116, 112] [435, 116, 1720] 192,640
|
61 |
+
│ │ │ │ │ └─Linear: 6-27 [435, 116, 528] [435, 116, 112] 59,136
|
62 |
+
│ │ │ │ │ └─DropPath: 6-28 [435, 116, 112] [435, 116, 112] --
|
63 |
+
│ │ │ │ │ └─Sequential: 6-29 [435, 116, 136] [435, 116, 112] --
|
64 |
+
│ │ │ │ │ │ └─GELU: 7-13 [435, 116, 136] [435, 116, 136] --
|
65 |
+
│ │ │ │ │ │ └─Dropout: 7-14 [435, 116, 136] [435, 116, 136] --
|
66 |
+
│ │ │ │ │ │ └─Linear: 7-15 [435, 116, 136] [435, 116, 112] 15,232
|
67 |
+
│ │ │ │ │ └─DropPath: 6-30 [435, 116, 112] [435, 116, 112] --
|
68 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-11 [435, 116, 112] [435, 116, 112] --
|
69 |
+
│ │ │ │ │ └─LayerNorm: 6-31 [435, 116, 112] [435, 116, 112] 224
|
70 |
+
│ │ │ │ │ └─Linear: 6-32 [435, 116, 112] [435, 116, 1720] 192,640
|
71 |
+
│ │ │ │ │ └─Linear: 6-33 [435, 116, 528] [435, 116, 112] 59,136
|
72 |
+
│ │ │ │ │ └─DropPath: 6-34 [435, 116, 112] [435, 116, 112] --
|
73 |
+
│ │ │ │ │ └─Sequential: 6-35 [435, 116, 136] [435, 116, 112] --
|
74 |
+
│ │ │ │ │ │ └─GELU: 7-16 [435, 116, 136] [435, 116, 136] --
|
75 |
+
│ │ │ │ │ │ └─Dropout: 7-17 [435, 116, 136] [435, 116, 136] --
|
76 |
+
│ │ │ │ │ │ └─Linear: 7-18 [435, 116, 136] [435, 116, 112] 15,232
|
77 |
+
│ │ │ │ │ └─DropPath: 6-36 [435, 116, 112] [435, 116, 112] --
|
78 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-12 [435, 116, 112] [435, 116, 112] --
|
79 |
+
│ │ │ │ │ └─LayerNorm: 6-37 [435, 116, 112] [435, 116, 112] 224
|
80 |
+
│ │ │ │ │ └─Linear: 6-38 [435, 116, 112] [435, 116, 1720] 192,640
|
81 |
+
│ │ │ │ │ └─Linear: 6-39 [435, 116, 528] [435, 116, 112] 59,136
|
82 |
+
│ │ │ │ │ └─DropPath: 6-40 [435, 116, 112] [435, 116, 112] --
|
83 |
+
│ │ │ │ │ └─Sequential: 6-41 [435, 116, 136] [435, 116, 112] --
|
84 |
+
│ │ │ │ │ │ └─GELU: 7-19 [435, 116, 136] [435, 116, 136] --
|
85 |
+
│ │ │ │ │ │ └─Dropout: 7-20 [435, 116, 136] [435, 116, 136] --
|
86 |
+
│ │ │ │ │ │ └─Linear: 7-21 [435, 116, 136] [435, 116, 112] 15,232
|
87 |
+
│ │ │ │ │ └─DropPath: 6-42 [435, 116, 112] [435, 116, 112] --
|
88 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-13 [435, 116, 112] [435, 116, 112] --
|
89 |
+
│ │ │ │ │ └─LayerNorm: 6-43 [435, 116, 112] [435, 116, 112] 224
|
90 |
+
│ │ │ │ │ └─Linear: 6-44 [435, 116, 112] [435, 116, 1720] 192,640
|
91 |
+
│ │ │ │ │ └─Linear: 6-45 [435, 116, 528] [435, 116, 112] 59,136
|
92 |
+
│ │ │ │ │ └─DropPath: 6-46 [435, 116, 112] [435, 116, 112] --
|
93 |
+
│ │ │ │ │ └─Sequential: 6-47 [435, 116, 136] [435, 116, 112] --
|
94 |
+
│ │ │ │ │ │ └─GELU: 7-22 [435, 116, 136] [435, 116, 136] --
|
95 |
+
│ │ │ │ │ │ └─Dropout: 7-23 [435, 116, 136] [435, 116, 136] --
|
96 |
+
│ │ │ │ │ │ └─Linear: 7-24 [435, 116, 136] [435, 116, 112] 15,232
|
97 |
+
│ │ │ │ │ └─DropPath: 6-48 [435, 116, 112] [435, 116, 112] --
|
98 |
+
│ │ └─Rearrange: 3-4 [1, 116, 435, 112] [1, 112, 116, 15, 29] --
|
99 |
+
├─MLPShifters: 1-2 -- [1, 2, 116] 513
|
100 |
+
│ └─MLPShifter: 2-2 [116, 2] [116, 2] --
|
101 |
+
│ │ └─Sequential: 3-5 [116, 2] [116, 2] --
|
102 |
+
│ │ │ └─Linear: 4-4 [116, 2] [116, 5] 15
|
103 |
+
│ │ │ └─Tanh: 4-5 [116, 5] [116, 5] --
|
104 |
+
│ │ │ └─Linear: 4-6 [116, 5] [116, 5] 30
|
105 |
+
│ │ │ └─Tanh: 4-7 [116, 5] [116, 5] --
|
106 |
+
│ │ │ └─Linear: 4-8 [116, 5] [116, 2] 12
|
107 |
+
│ │ │ └─Tanh: 4-9 [116, 2] [116, 2] --
|
108 |
+
├─Readouts: 1-3 [1, 112, 116, 15, 29] [1, 7440, 116] 8,477,649
|
109 |
+
│ └─Gaussian2DReadout2: 2-3 [1, 112, 116, 15, 29] [1, 7440, 116] 870,480
|
110 |
+
│ │ └─Sequential: 3-6 [7440, 2] [7440, 2] --
|
111 |
+
│ │ │ └─Linear: 4-10 [7440, 2] [7440, 30] 90
|
112 |
+
│ │ │ └─ELU: 4-11 [7440, 30] [7440, 30] --
|
113 |
+
│ │ │ └─Linear: 4-12 [7440, 30] [7440, 2] 62
|
114 |
+
│ │ │ └─Tanh: 4-13 [7440, 2] [7440, 2] --
|
115 |
+
│ │ └─Sequential: 3-7 [7440, 2] [7440, 2] (recursive)
|
116 |
+
│ │ │ └─Linear: 4-14 [7440, 2] [7440, 30] (recursive)
|
117 |
+
│ │ │ └─ELU: 4-15 [7440, 30] [7440, 30] --
|
118 |
+
│ │ │ └─Linear: 4-16 [7440, 30] [7440, 2] (recursive)
|
119 |
+
│ │ │ └─Tanh: 4-17 [7440, 2] [7440, 2] --
|
120 |
+
│ │ └─Sequential: 3-8 [7440, 2] [7440, 2] (recursive)
|
121 |
+
│ │ │ └─Linear: 4-18 [7440, 2] [7440, 30] (recursive)
|
122 |
+
│ │ │ └─ELU: 4-19 [7440, 30] [7440, 30] --
|
123 |
+
│ │ │ └─Linear: 4-20 [7440, 30] [7440, 2] (recursive)
|
124 |
+
│ │ │ └─Tanh: 4-21 [7440, 2] [7440, 2] --
|
125 |
+
│ │ └─Sequential: 3-9 [116, 4] [116, 112] --
|
126 |
+
│ │ │ └─Linear: 4-22 [116, 4] [116, 112] 560
|
127 |
+
│ │ │ └─LayerNorm: 4-23 [116, 112] [116, 112] 224
|
128 |
+
│ │ │ └─GELU: 4-24 [116, 112] [116, 112] --
|
129 |
+
│ │ │ └─Dropout: 4-25 [116, 112] [116, 112] --
|
130 |
+
│ │ │ └─Linear: 4-26 [116, 112] [116, 112] 12,656
|
131 |
+
│ │ │ └─Tanh: 4-27 [116, 112] [116, 112] --
|
132 |
+
├─Exponential: 1-4 [1, 7440, 116] [1, 7440, 116] --
|
133 |
+
=======================================================================================================================================
|
134 |
+
Total params: 12,278,365
|
135 |
+
Trainable params: 12,278,365
|
136 |
+
Non-trainable params: 0
|
137 |
+
Total mult-adds (Units.MEGABYTES): 679.88
|
138 |
+
=======================================================================================================================================
|
139 |
+
Input size (MB): 1.29
|
140 |
+
Forward/backward pass size (MB): 9208.73
|
141 |
+
Params size (MB): 11.40
|
142 |
+
Estimated Total Size (MB): 9221.42
|
143 |
+
=======================================================================================================================================
|
003/output.log
ADDED
@@ -0,0 +1,789 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Use bfloat16 for core module.
|
2 |
+
Use parallel attention and MLP in ViViT.
|
3 |
+
|
4 |
+
Epoch 001/400
|
5 |
+
Train loss: 112704208.00 correlation: 0.0126
|
6 |
+
Validation loss: 199545376.00 correlation: 0.0293
|
7 |
+
Elapse: 540.35s
|
8 |
+
|
9 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
10 |
+
|
11 |
+
Epoch 002/400
|
12 |
+
Train loss: 97414480.00 correlation: 0.0393
|
13 |
+
Validation loss: 198820640.00 correlation: 0.0410
|
14 |
+
Elapse: 549.83s
|
15 |
+
|
16 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
17 |
+
|
18 |
+
Epoch 003/400
|
19 |
+
Train loss: 95851936.00 correlation: 0.0545
|
20 |
+
Validation loss: 197542912.00 correlation: 0.0493
|
21 |
+
Elapse: 552.73s
|
22 |
+
|
23 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
24 |
+
|
25 |
+
Epoch 004/400
|
26 |
+
Train loss: 94762680.00 correlation: 0.0658
|
27 |
+
Validation loss: 195978896.00 correlation: 0.0592
|
28 |
+
Elapse: 553.22s
|
29 |
+
|
30 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
31 |
+
|
32 |
+
Epoch 005/400
|
33 |
+
Train loss: 93366904.00 correlation: 0.0807
|
34 |
+
Validation loss: 193138784.00 correlation: 0.0786
|
35 |
+
Elapse: 551.37s
|
36 |
+
|
37 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
38 |
+
|
39 |
+
Epoch 006/400
|
40 |
+
Train loss: 91530000.00 correlation: 0.0996
|
41 |
+
Validation loss: 190414640.00 correlation: 0.0957
|
42 |
+
Elapse: 548.87s
|
43 |
+
|
44 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
45 |
+
|
46 |
+
Epoch 007/400
|
47 |
+
Train loss: 90052112.00 correlation: 0.1151
|
48 |
+
Validation loss: 187958800.00 correlation: 0.1117
|
49 |
+
Elapse: 545.45s
|
50 |
+
|
51 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
52 |
+
|
53 |
+
Epoch 008/400
|
54 |
+
Train loss: 88550296.00 correlation: 0.1303
|
55 |
+
Validation loss: 185819104.00 correlation: 0.1231
|
56 |
+
Elapse: 542.13s
|
57 |
+
|
58 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
59 |
+
|
60 |
+
Epoch 009/400
|
61 |
+
Train loss: 87211088.00 correlation: 0.1444
|
62 |
+
Validation loss: 183781008.00 correlation: 0.1379
|
63 |
+
Elapse: 540.39s
|
64 |
+
|
65 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
66 |
+
|
67 |
+
Epoch 010/400
|
68 |
+
Train loss: 85912744.00 correlation: 0.1575
|
69 |
+
Validation loss: 182160864.00 correlation: 0.1483
|
70 |
+
Elapse: 539.93s
|
71 |
+
|
72 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
73 |
+
|
74 |
+
Epoch 011/400
|
75 |
+
Train loss: 84825776.00 correlation: 0.1681
|
76 |
+
Validation loss: 180796960.00 correlation: 0.1574
|
77 |
+
Elapse: 539.05s
|
78 |
+
|
79 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
80 |
+
|
81 |
+
Epoch 012/400
|
82 |
+
Train loss: 83932096.00 correlation: 0.1768
|
83 |
+
Validation loss: 179665872.00 correlation: 0.1651
|
84 |
+
Elapse: 539.83s
|
85 |
+
|
86 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
87 |
+
|
88 |
+
Epoch 013/400
|
89 |
+
Train loss: 83185960.00 correlation: 0.1841
|
90 |
+
Validation loss: 178867920.00 correlation: 0.1706
|
91 |
+
Elapse: 540.49s
|
92 |
+
|
93 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
94 |
+
|
95 |
+
Epoch 014/400
|
96 |
+
Train loss: 82619600.00 correlation: 0.1896
|
97 |
+
Validation loss: 178183616.00 correlation: 0.1749
|
98 |
+
Elapse: 540.25s
|
99 |
+
|
100 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
101 |
+
|
102 |
+
Epoch 015/400
|
103 |
+
Train loss: 82049104.00 correlation: 0.1953
|
104 |
+
Validation loss: 177195872.00 correlation: 0.1811
|
105 |
+
Elapse: 539.98s
|
106 |
+
|
107 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
108 |
+
|
109 |
+
Epoch 016/400
|
110 |
+
Train loss: 81438744.00 correlation: 0.2013
|
111 |
+
Validation loss: 176732480.00 correlation: 0.1848
|
112 |
+
Elapse: 539.92s
|
113 |
+
|
114 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
115 |
+
|
116 |
+
Epoch 017/400
|
117 |
+
Train loss: 80981184.00 correlation: 0.2058
|
118 |
+
Validation loss: 175869328.00 correlation: 0.1895
|
119 |
+
Elapse: 540.34s
|
120 |
+
|
121 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
122 |
+
|
123 |
+
Epoch 018/400
|
124 |
+
Train loss: 80463984.00 correlation: 0.2108
|
125 |
+
Validation loss: 175137504.00 correlation: 0.1941
|
126 |
+
Elapse: 540.52s
|
127 |
+
|
128 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
129 |
+
|
130 |
+
Epoch 019/400
|
131 |
+
Train loss: 80076456.00 correlation: 0.2145
|
132 |
+
Validation loss: 174743216.00 correlation: 0.1976
|
133 |
+
Elapse: 540.79s
|
134 |
+
|
135 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
136 |
+
|
137 |
+
Epoch 020/400
|
138 |
+
Train loss: 79770240.00 correlation: 0.2180
|
139 |
+
Validation loss: 174354656.00 correlation: 0.1999
|
140 |
+
Elapse: 541.02s
|
141 |
+
|
142 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
143 |
+
|
144 |
+
Epoch 021/400
|
145 |
+
Train loss: 79389680.00 correlation: 0.2210
|
146 |
+
Validation loss: 173737072.00 correlation: 0.2049
|
147 |
+
Elapse: 540.85s
|
148 |
+
|
149 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
150 |
+
|
151 |
+
Epoch 022/400
|
152 |
+
Train loss: 79099264.00 correlation: 0.2238
|
153 |
+
Validation loss: 173426080.00 correlation: 0.2057
|
154 |
+
Elapse: 542.08s
|
155 |
+
|
156 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
157 |
+
|
158 |
+
Epoch 023/400
|
159 |
+
Train loss: 78893584.00 correlation: 0.2259
|
160 |
+
Validation loss: 172965088.00 correlation: 0.2094
|
161 |
+
Elapse: 542.73s
|
162 |
+
|
163 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
164 |
+
|
165 |
+
Epoch 024/400
|
166 |
+
Train loss: 78610448.00 correlation: 0.2286
|
167 |
+
Validation loss: 172757408.00 correlation: 0.2102
|
168 |
+
Elapse: 543.17s
|
169 |
+
|
170 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
171 |
+
|
172 |
+
Epoch 025/400
|
173 |
+
Train loss: 78350984.00 correlation: 0.2311
|
174 |
+
Validation loss: 172301040.00 correlation: 0.2136
|
175 |
+
Elapse: 543.01s
|
176 |
+
|
177 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
178 |
+
|
179 |
+
Epoch 026/400
|
180 |
+
Train loss: 78082256.00 correlation: 0.2338
|
181 |
+
Validation loss: 172086432.00 correlation: 0.2145
|
182 |
+
Elapse: 543.35s
|
183 |
+
|
184 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
185 |
+
|
186 |
+
Epoch 027/400
|
187 |
+
Train loss: 77827456.00 correlation: 0.2363
|
188 |
+
Validation loss: 171786464.00 correlation: 0.2169
|
189 |
+
Elapse: 543.66s
|
190 |
+
|
191 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
192 |
+
|
193 |
+
Epoch 028/400
|
194 |
+
Train loss: 77638136.00 correlation: 0.2379
|
195 |
+
Validation loss: 171793264.00 correlation: 0.2171
|
196 |
+
Elapse: 543.62s
|
197 |
+
|
198 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
199 |
+
|
200 |
+
Epoch 029/400
|
201 |
+
Train loss: 77553520.00 correlation: 0.2390
|
202 |
+
Validation loss: 171183824.00 correlation: 0.2206
|
203 |
+
Elapse: 543.14s
|
204 |
+
|
205 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
206 |
+
|
207 |
+
Epoch 030/400
|
208 |
+
Train loss: 77293184.00 correlation: 0.2414
|
209 |
+
Validation loss: 171063472.00 correlation: 0.2218
|
210 |
+
Elapse: 542.93s
|
211 |
+
|
212 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
213 |
+
|
214 |
+
Epoch 031/400
|
215 |
+
Train loss: 77137136.00 correlation: 0.2425
|
216 |
+
Validation loss: 170927232.00 correlation: 0.2215
|
217 |
+
Elapse: 542.90s
|
218 |
+
|
219 |
+
Epoch 032/400
|
220 |
+
Train loss: 77036008.00 correlation: 0.2439
|
221 |
+
Validation loss: 170678112.00 correlation: 0.2241
|
222 |
+
Elapse: 544.22s
|
223 |
+
|
224 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
225 |
+
|
226 |
+
Epoch 033/400
|
227 |
+
Train loss: 76850512.00 correlation: 0.2458
|
228 |
+
Validation loss: 170585168.00 correlation: 0.2249
|
229 |
+
Elapse: 543.38s
|
230 |
+
|
231 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
232 |
+
|
233 |
+
Epoch 034/400
|
234 |
+
Train loss: 76745528.00 correlation: 0.2467
|
235 |
+
Validation loss: 170361008.00 correlation: 0.2261
|
236 |
+
Elapse: 543.46s
|
237 |
+
|
238 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
239 |
+
|
240 |
+
Epoch 035/400
|
241 |
+
Train loss: 76631640.00 correlation: 0.2479
|
242 |
+
Validation loss: 170159952.00 correlation: 0.2272
|
243 |
+
Elapse: 544.31s
|
244 |
+
|
245 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
246 |
+
|
247 |
+
Epoch 036/400
|
248 |
+
Train loss: 76572216.00 correlation: 0.2483
|
249 |
+
Validation loss: 170068624.00 correlation: 0.2280
|
250 |
+
Elapse: 544.03s
|
251 |
+
|
252 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
253 |
+
|
254 |
+
Epoch 037/400
|
255 |
+
Train loss: 76306000.00 correlation: 0.2511
|
256 |
+
Validation loss: 170078272.00 correlation: 0.2281
|
257 |
+
Elapse: 543.66s
|
258 |
+
|
259 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
260 |
+
|
261 |
+
Epoch 038/400
|
262 |
+
Train loss: 76521968.00 correlation: 0.2488
|
263 |
+
Validation loss: 170034304.00 correlation: 0.2284
|
264 |
+
Elapse: 543.78s
|
265 |
+
|
266 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
267 |
+
|
268 |
+
Epoch 039/400
|
269 |
+
Train loss: 76277552.00 correlation: 0.2512
|
270 |
+
Validation loss: 169955232.00 correlation: 0.2283
|
271 |
+
Elapse: 544.11s
|
272 |
+
|
273 |
+
Epoch 040/400
|
274 |
+
Train loss: 76083856.00 correlation: 0.2532
|
275 |
+
Validation loss: 169547568.00 correlation: 0.2316
|
276 |
+
Elapse: 544.27s
|
277 |
+
|
278 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
279 |
+
|
280 |
+
Epoch 041/400
|
281 |
+
Train loss: 76034800.00 correlation: 0.2536
|
282 |
+
Validation loss: 169778400.00 correlation: 0.2301
|
283 |
+
Elapse: 544.31s
|
284 |
+
|
285 |
+
Epoch 042/400
|
286 |
+
Train loss: 75948104.00 correlation: 0.2542
|
287 |
+
Validation loss: 169703472.00 correlation: 0.2304
|
288 |
+
Elapse: 543.89s
|
289 |
+
|
290 |
+
Epoch 043/400
|
291 |
+
Train loss: 75900336.00 correlation: 0.2549
|
292 |
+
Validation loss: 169460816.00 correlation: 0.2314
|
293 |
+
Elapse: 543.95s
|
294 |
+
|
295 |
+
Epoch 044/400
|
296 |
+
Train loss: 75856872.00 correlation: 0.2554
|
297 |
+
Validation loss: 169446544.00 correlation: 0.2314
|
298 |
+
Elapse: 543.85s
|
299 |
+
|
300 |
+
Epoch 045/400
|
301 |
+
Train loss: 75771024.00 correlation: 0.2563
|
302 |
+
Validation loss: 169373568.00 correlation: 0.2320
|
303 |
+
Elapse: 544.58s
|
304 |
+
|
305 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
306 |
+
|
307 |
+
Epoch 046/400
|
308 |
+
Train loss: 75747888.00 correlation: 0.2564
|
309 |
+
Validation loss: 169484960.00 correlation: 0.2316
|
310 |
+
Elapse: 544.29s
|
311 |
+
|
312 |
+
Epoch 047/400
|
313 |
+
Train loss: 75614488.00 correlation: 0.2578
|
314 |
+
Validation loss: 169374048.00 correlation: 0.2332
|
315 |
+
Elapse: 544.59s
|
316 |
+
|
317 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
318 |
+
|
319 |
+
Epoch 048/400
|
320 |
+
Train loss: 75621768.00 correlation: 0.2577
|
321 |
+
Validation loss: 169829152.00 correlation: 0.2292
|
322 |
+
Elapse: 544.60s
|
323 |
+
|
324 |
+
Epoch 049/400
|
325 |
+
Train loss: 75540576.00 correlation: 0.2584
|
326 |
+
Validation loss: 169151584.00 correlation: 0.2322
|
327 |
+
Elapse: 545.07s
|
328 |
+
|
329 |
+
Epoch 050/400
|
330 |
+
Train loss: 75552112.00 correlation: 0.2587
|
331 |
+
Validation loss: 169218528.00 correlation: 0.2327
|
332 |
+
Elapse: 544.47s
|
333 |
+
|
334 |
+
Epoch 051/400
|
335 |
+
Train loss: 75440728.00 correlation: 0.2597
|
336 |
+
Validation loss: 169177248.00 correlation: 0.2329
|
337 |
+
Elapse: 544.75s
|
338 |
+
|
339 |
+
Epoch 052/400
|
340 |
+
Train loss: 75499728.00 correlation: 0.2591
|
341 |
+
Validation loss: 169380720.00 correlation: 0.2327
|
342 |
+
Elapse: 544.77s
|
343 |
+
|
344 |
+
Loaded checkpoint from epoch 47 (correlation: 0.2332).
|
345 |
+
|
346 |
+
Reduce learning rate of core to 1.4400e-03 (num. reduce: 1).
|
347 |
+
Reduce learning rate of readouts to 1.0800e-03 (num. reduce: 1).
|
348 |
+
Reduce learning rate of shifters to 1.0800e-03 (num. reduce: 1).
|
349 |
+
|
350 |
+
Epoch 053/400
|
351 |
+
Train loss: 73633064.00 correlation: 0.2750
|
352 |
+
Validation loss: 167526240.00 correlation: 0.2446
|
353 |
+
Elapse: 545.49s
|
354 |
+
|
355 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
356 |
+
|
357 |
+
Epoch 054/400
|
358 |
+
Train loss: 72992880.00 correlation: 0.2809
|
359 |
+
Validation loss: 167505792.00 correlation: 0.2447
|
360 |
+
Elapse: 545.66s
|
361 |
+
|
362 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
363 |
+
|
364 |
+
Epoch 055/400
|
365 |
+
Train loss: 72791024.00 correlation: 0.2827
|
366 |
+
Validation loss: 167337248.00 correlation: 0.2451
|
367 |
+
Elapse: 545.82s
|
368 |
+
|
369 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
370 |
+
|
371 |
+
Epoch 056/400
|
372 |
+
Train loss: 72699672.00 correlation: 0.2837
|
373 |
+
Validation loss: 167396864.00 correlation: 0.2453
|
374 |
+
Elapse: 545.65s
|
375 |
+
|
376 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
377 |
+
|
378 |
+
Epoch 057/400
|
379 |
+
Train loss: 72666128.00 correlation: 0.2841
|
380 |
+
Validation loss: 167320224.00 correlation: 0.2457
|
381 |
+
Elapse: 546.33s
|
382 |
+
|
383 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
384 |
+
|
385 |
+
Epoch 058/400
|
386 |
+
Train loss: 72662680.00 correlation: 0.2840
|
387 |
+
Validation loss: 167358624.00 correlation: 0.2457
|
388 |
+
Elapse: 545.38s
|
389 |
+
|
390 |
+
Epoch 059/400
|
391 |
+
Train loss: 72528456.00 correlation: 0.2854
|
392 |
+
Validation loss: 167347344.00 correlation: 0.2456
|
393 |
+
Elapse: 546.44s
|
394 |
+
|
395 |
+
Epoch 060/400
|
396 |
+
Train loss: 72553424.00 correlation: 0.2854
|
397 |
+
Validation loss: 167294624.00 correlation: 0.2462
|
398 |
+
Elapse: 546.17s
|
399 |
+
|
400 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
401 |
+
|
402 |
+
Epoch 061/400
|
403 |
+
Train loss: 72496144.00 correlation: 0.2860
|
404 |
+
Validation loss: 167428896.00 correlation: 0.2444
|
405 |
+
Elapse: 545.96s
|
406 |
+
|
407 |
+
Epoch 062/400
|
408 |
+
Train loss: 72479344.00 correlation: 0.2859
|
409 |
+
Validation loss: 167235104.00 correlation: 0.2454
|
410 |
+
Elapse: 546.11s
|
411 |
+
|
412 |
+
Epoch 063/400
|
413 |
+
Train loss: 72437912.00 correlation: 0.2863
|
414 |
+
Validation loss: 167384528.00 correlation: 0.2447
|
415 |
+
Elapse: 546.05s
|
416 |
+
|
417 |
+
Epoch 064/400
|
418 |
+
Train loss: 72443952.00 correlation: 0.2864
|
419 |
+
Validation loss: 167276464.00 correlation: 0.2452
|
420 |
+
Elapse: 546.23s
|
421 |
+
|
422 |
+
Epoch 065/400
|
423 |
+
Train loss: 72421648.00 correlation: 0.2869
|
424 |
+
Validation loss: 167359664.00 correlation: 0.2448
|
425 |
+
Elapse: 546.55s
|
426 |
+
|
427 |
+
Loaded checkpoint from epoch 60 (correlation: 0.2462).
|
428 |
+
|
429 |
+
Reduce learning rate of core to 4.3200e-04 (num. reduce: 1).
|
430 |
+
Reduce learning rate of readouts to 3.2400e-04 (num. reduce: 1).
|
431 |
+
Reduce learning rate of shifters to 3.2400e-04 (num. reduce: 1).
|
432 |
+
|
433 |
+
Epoch 066/400
|
434 |
+
Train loss: 71631360.00 correlation: 0.2929
|
435 |
+
Validation loss: 166762592.00 correlation: 0.2488
|
436 |
+
Elapse: 546.04s
|
437 |
+
|
438 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
439 |
+
|
440 |
+
Epoch 067/400
|
441 |
+
Train loss: 71301752.00 correlation: 0.2963
|
442 |
+
Validation loss: 166766816.00 correlation: 0.2491
|
443 |
+
Elapse: 546.30s
|
444 |
+
|
445 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
446 |
+
|
447 |
+
Epoch 068/400
|
448 |
+
Train loss: 71239384.00 correlation: 0.2970
|
449 |
+
Validation loss: 166698608.00 correlation: 0.2493
|
450 |
+
Elapse: 546.54s
|
451 |
+
|
452 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
453 |
+
|
454 |
+
Epoch 069/400
|
455 |
+
Train loss: 71140904.00 correlation: 0.2977
|
456 |
+
Validation loss: 166688480.00 correlation: 0.2493
|
457 |
+
Elapse: 546.57s
|
458 |
+
|
459 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
460 |
+
|
461 |
+
Epoch 070/400
|
462 |
+
Train loss: 71157128.00 correlation: 0.2979
|
463 |
+
Validation loss: 166701680.00 correlation: 0.2493
|
464 |
+
Elapse: 546.93s
|
465 |
+
|
466 |
+
Epoch 071/400
|
467 |
+
Train loss: 71109936.00 correlation: 0.2983
|
468 |
+
Validation loss: 166666112.00 correlation: 0.2493
|
469 |
+
Elapse: 546.33s
|
470 |
+
|
471 |
+
Epoch 072/400
|
472 |
+
Train loss: 71014384.00 correlation: 0.2990
|
473 |
+
Validation loss: 166637680.00 correlation: 0.2493
|
474 |
+
Elapse: 546.25s
|
475 |
+
|
476 |
+
Epoch 073/400
|
477 |
+
Train loss: 71012144.00 correlation: 0.2989
|
478 |
+
Validation loss: 166633760.00 correlation: 0.2495
|
479 |
+
Elapse: 546.14s
|
480 |
+
|
481 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
482 |
+
|
483 |
+
Epoch 074/400
|
484 |
+
Train loss: 70962312.00 correlation: 0.2996
|
485 |
+
Validation loss: 166724848.00 correlation: 0.2491
|
486 |
+
Elapse: 546.66s
|
487 |
+
|
488 |
+
Epoch 075/400
|
489 |
+
Train loss: 70909096.00 correlation: 0.3002
|
490 |
+
Validation loss: 166680192.00 correlation: 0.2492
|
491 |
+
Elapse: 546.39s
|
492 |
+
|
493 |
+
Epoch 076/400
|
494 |
+
Train loss: 70859696.00 correlation: 0.3007
|
495 |
+
Validation loss: 166666160.00 correlation: 0.2493
|
496 |
+
Elapse: 546.76s
|
497 |
+
|
498 |
+
Epoch 077/400
|
499 |
+
Train loss: 70862616.00 correlation: 0.3006
|
500 |
+
Validation loss: 166644512.00 correlation: 0.2493
|
501 |
+
Elapse: 546.35s
|
502 |
+
|
503 |
+
Epoch 078/400
|
504 |
+
Train loss: 70866920.00 correlation: 0.3008
|
505 |
+
Validation loss: 166689088.00 correlation: 0.2489
|
506 |
+
Elapse: 546.43s
|
507 |
+
|
508 |
+
Loaded checkpoint from epoch 73 (correlation: 0.2495).
|
509 |
+
|
510 |
+
Reduce learning rate of core to 1.2960e-04 (num. reduce: 1).
|
511 |
+
Reduce learning rate of readouts to 9.7200e-05 (num. reduce: 1).
|
512 |
+
Reduce learning rate of shifters to 9.7200e-05 (num. reduce: 1).
|
513 |
+
|
514 |
+
Epoch 079/400
|
515 |
+
Train loss: 70659088.00 correlation: 0.3023
|
516 |
+
Validation loss: 166495968.00 correlation: 0.2504
|
517 |
+
Elapse: 546.32s
|
518 |
+
|
519 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
520 |
+
|
521 |
+
Epoch 080/400
|
522 |
+
Train loss: 70583640.00 correlation: 0.3029
|
523 |
+
Validation loss: 166499952.00 correlation: 0.2503
|
524 |
+
Elapse: 546.55s
|
525 |
+
|
526 |
+
Epoch 081/400
|
527 |
+
Train loss: 70541232.00 correlation: 0.3031
|
528 |
+
Validation loss: 166486608.00 correlation: 0.2504
|
529 |
+
Elapse: 546.44s
|
530 |
+
|
531 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
532 |
+
|
533 |
+
Epoch 082/400
|
534 |
+
Train loss: 70561208.00 correlation: 0.3030
|
535 |
+
Validation loss: 166498080.00 correlation: 0.2505
|
536 |
+
Elapse: 546.48s
|
537 |
+
|
538 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
539 |
+
|
540 |
+
Epoch 083/400
|
541 |
+
Train loss: 70504848.00 correlation: 0.3037
|
542 |
+
Validation loss: 166479744.00 correlation: 0.2504
|
543 |
+
Elapse: 545.91s
|
544 |
+
|
545 |
+
Epoch 084/400
|
546 |
+
Train loss: 70483280.00 correlation: 0.3037
|
547 |
+
Validation loss: 166527136.00 correlation: 0.2504
|
548 |
+
Elapse: 546.39s
|
549 |
+
|
550 |
+
Epoch 085/400
|
551 |
+
Train loss: 70486104.00 correlation: 0.3039
|
552 |
+
Validation loss: 166507024.00 correlation: 0.2504
|
553 |
+
Elapse: 546.66s
|
554 |
+
|
555 |
+
Epoch 086/400
|
556 |
+
Train loss: 70448464.00 correlation: 0.3042
|
557 |
+
Validation loss: 166480160.00 correlation: 0.2505
|
558 |
+
Elapse: 546.13s
|
559 |
+
|
560 |
+
Epoch 087/400
|
561 |
+
Train loss: 70433528.00 correlation: 0.3043
|
562 |
+
Validation loss: 166521664.00 correlation: 0.2504
|
563 |
+
Elapse: 546.51s
|
564 |
+
|
565 |
+
Loaded checkpoint from epoch 82 (correlation: 0.2505).
|
566 |
+
|
567 |
+
Reduce learning rate of core to 3.8880e-05 (num. reduce: 1).
|
568 |
+
Reduce learning rate of readouts to 2.9160e-05 (num. reduce: 1).
|
569 |
+
Reduce learning rate of shifters to 2.9160e-05 (num. reduce: 1).
|
570 |
+
|
571 |
+
Epoch 088/400
|
572 |
+
Train loss: 70419248.00 correlation: 0.3041
|
573 |
+
Validation loss: 166470848.00 correlation: 0.2507
|
574 |
+
Elapse: 546.72s
|
575 |
+
|
576 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
577 |
+
|
578 |
+
Epoch 089/400
|
579 |
+
Train loss: 70456936.00 correlation: 0.3039
|
580 |
+
Validation loss: 166478544.00 correlation: 0.2507
|
581 |
+
Elapse: 546.31s
|
582 |
+
|
583 |
+
Epoch 090/400
|
584 |
+
Train loss: 70377392.00 correlation: 0.3047
|
585 |
+
Validation loss: 166470880.00 correlation: 0.2508
|
586 |
+
Elapse: 546.64s
|
587 |
+
|
588 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
589 |
+
|
590 |
+
Epoch 091/400
|
591 |
+
Train loss: 70370720.00 correlation: 0.3048
|
592 |
+
Validation loss: 166471712.00 correlation: 0.2507
|
593 |
+
Elapse: 546.55s
|
594 |
+
|
595 |
+
Epoch 092/400
|
596 |
+
Train loss: 70332624.00 correlation: 0.3052
|
597 |
+
Validation loss: 166468176.00 correlation: 0.2506
|
598 |
+
Elapse: 546.51s
|
599 |
+
|
600 |
+
Epoch 093/400
|
601 |
+
Train loss: 70375248.00 correlation: 0.3046
|
602 |
+
Validation loss: 166466304.00 correlation: 0.2507
|
603 |
+
Elapse: 547.09s
|
604 |
+
|
605 |
+
Epoch 094/400
|
606 |
+
Train loss: 70312208.00 correlation: 0.3053
|
607 |
+
Validation loss: 166426080.00 correlation: 0.2509
|
608 |
+
Elapse: 546.36s
|
609 |
+
|
610 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
611 |
+
|
612 |
+
Epoch 095/400
|
613 |
+
Train loss: 70306024.00 correlation: 0.3054
|
614 |
+
Validation loss: 166448992.00 correlation: 0.2509
|
615 |
+
Elapse: 546.42s
|
616 |
+
|
617 |
+
Epoch 096/400
|
618 |
+
Train loss: 70301760.00 correlation: 0.3053
|
619 |
+
Validation loss: 166460400.00 correlation: 0.2508
|
620 |
+
Elapse: 545.99s
|
621 |
+
|
622 |
+
Epoch 097/400
|
623 |
+
Train loss: 70339392.00 correlation: 0.3050
|
624 |
+
Validation loss: 166448912.00 correlation: 0.2507
|
625 |
+
Elapse: 546.74s
|
626 |
+
|
627 |
+
Epoch 098/400
|
628 |
+
Train loss: 70365064.00 correlation: 0.3048
|
629 |
+
Validation loss: 166476400.00 correlation: 0.2506
|
630 |
+
Elapse: 546.17s
|
631 |
+
|
632 |
+
Epoch 099/400
|
633 |
+
Train loss: 70304792.00 correlation: 0.3053
|
634 |
+
Validation loss: 166451168.00 correlation: 0.2507
|
635 |
+
Elapse: 545.82s
|
636 |
+
|
637 |
+
Loaded checkpoint from epoch 94 (correlation: 0.2509).
|
638 |
+
|
639 |
+
Reduce learning rate of core to 1.1664e-05 (num. reduce: 1).
|
640 |
+
Reduce learning rate of readouts to 8.7480e-06 (num. reduce: 1).
|
641 |
+
Reduce learning rate of shifters to 8.7480e-06 (num. reduce: 1).
|
642 |
+
|
643 |
+
Epoch 100/400
|
644 |
+
Train loss: 70282520.00 correlation: 0.3055
|
645 |
+
Validation loss: 166444240.00 correlation: 0.2509
|
646 |
+
Elapse: 546.60s
|
647 |
+
|
648 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
649 |
+
|
650 |
+
Epoch 101/400
|
651 |
+
Train loss: 70321056.00 correlation: 0.3050
|
652 |
+
Validation loss: 166451424.00 correlation: 0.2509
|
653 |
+
Elapse: 546.61s
|
654 |
+
|
655 |
+
Epoch 102/400
|
656 |
+
Train loss: 70312536.00 correlation: 0.3052
|
657 |
+
Validation loss: 166450992.00 correlation: 0.2509
|
658 |
+
Elapse: 546.64s
|
659 |
+
|
660 |
+
Epoch 103/400
|
661 |
+
Train loss: 70294928.00 correlation: 0.3057
|
662 |
+
Validation loss: 166437664.00 correlation: 0.2509
|
663 |
+
Elapse: 546.47s
|
664 |
+
|
665 |
+
Epoch 104/400
|
666 |
+
Train loss: 70265648.00 correlation: 0.3058
|
667 |
+
Validation loss: 166443488.00 correlation: 0.2509
|
668 |
+
Elapse: 546.86s
|
669 |
+
|
670 |
+
Epoch 105/400
|
671 |
+
Train loss: 70228080.00 correlation: 0.3058
|
672 |
+
Validation loss: 166447312.00 correlation: 0.2508
|
673 |
+
Elapse: 546.77s
|
674 |
+
|
675 |
+
Loaded checkpoint from epoch 100 (correlation: 0.2509).
|
676 |
+
|
677 |
+
Reduce learning rate of core to 3.4992e-06 (num. reduce: 1).
|
678 |
+
Reduce learning rate of readouts to 2.6244e-06 (num. reduce: 1).
|
679 |
+
Reduce learning rate of shifters to 2.6244e-06 (num. reduce: 1).
|
680 |
+
|
681 |
+
Epoch 106/400
|
682 |
+
Train loss: 70303288.00 correlation: 0.3053
|
683 |
+
Validation loss: 166441600.00 correlation: 0.2509
|
684 |
+
Elapse: 546.61s
|
685 |
+
|
686 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
687 |
+
|
688 |
+
Epoch 107/400
|
689 |
+
Train loss: 70329360.00 correlation: 0.3052
|
690 |
+
Validation loss: 166438976.00 correlation: 0.2509
|
691 |
+
Elapse: 546.25s
|
692 |
+
|
693 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
|
694 |
+
|
695 |
+
Epoch 108/400
|
696 |
+
Train loss: 70249752.00 correlation: 0.3063
|
697 |
+
Validation loss: 166440032.00 correlation: 0.2509
|
698 |
+
Elapse: 546.40s
|
699 |
+
|
700 |
+
Epoch 109/400
|
701 |
+
Train loss: 70245592.00 correlation: 0.3059
|
702 |
+
Validation loss: 166436832.00 correlation: 0.2509
|
703 |
+
Elapse: 546.34s
|
704 |
+
|
705 |
+
Epoch 110/400
|
706 |
+
Train loss: 70323520.00 correlation: 0.3050
|
707 |
+
Validation loss: 166439552.00 correlation: 0.2509
|
708 |
+
Elapse: 546.33s
|
709 |
+
|
710 |
+
Epoch 111/400
|
711 |
+
Train loss: 70291648.00 correlation: 0.3053
|
712 |
+
Validation loss: 166438448.00 correlation: 0.2509
|
713 |
+
Elapse: 546.45s
|
714 |
+
|
715 |
+
Epoch 112/400
|
716 |
+
Train loss: 70337264.00 correlation: 0.3050
|
717 |
+
Validation loss: 166435040.00 correlation: 0.2509
|
718 |
+
Elapse: 546.37s
|
719 |
+
|
720 |
+
Loaded checkpoint from epoch 107 (correlation: 0.2509).
|
721 |
+
|
722 |
+
Reduce learning rate of core to 1.0498e-06 (num. reduce: 1).
|
723 |
+
Reduce learning rate of readouts to 7.8732e-07 (num. reduce: 1).
|
724 |
+
Reduce learning rate of shifters to 7.8732e-07 (num. reduce: 1).
|
725 |
+
|
726 |
+
Epoch 113/400
|
727 |
+
Train loss: 70326192.00 correlation: 0.3050
|
728 |
+
Validation loss: 166438976.00 correlation: 0.2509
|
729 |
+
Elapse: 546.86s
|
730 |
+
|
731 |
+
Epoch 114/400
|
732 |
+
Train loss: 70297808.00 correlation: 0.3056
|
733 |
+
Validation loss: 166439680.00 correlation: 0.2509
|
734 |
+
Elapse: 546.99s
|
735 |
+
|
736 |
+
Epoch 115/400
|
737 |
+
Train loss: 70375312.00 correlation: 0.3045
|
738 |
+
Validation loss: 166439312.00 correlation: 0.2509
|
739 |
+
Elapse: 547.26s
|
740 |
+
|
741 |
+
Epoch 116/400
|
742 |
+
Train loss: 70331832.00 correlation: 0.3050
|
743 |
+
Validation loss: 166439392.00 correlation: 0.2509
|
744 |
+
Elapse: 546.75s
|
745 |
+
|
746 |
+
Epoch 117/400
|
747 |
+
Train loss: 70241608.00 correlation: 0.3060
|
748 |
+
Validation loss: 166441104.00 correlation: 0.2509
|
749 |
+
Elapse: 546.43s
|
750 |
+
|
751 |
+
Loaded checkpoint from epoch 107 (correlation: 0.2509).
|
752 |
+
|
753 |
+
Reduce learning rate of core to 3.1493e-07 (num. reduce: 2).
|
754 |
+
Reduce learning rate of readouts to 2.3620e-07 (num. reduce: 2).
|
755 |
+
Reduce learning rate of shifters to 2.3620e-07 (num. reduce: 2).
|
756 |
+
|
757 |
+
Epoch 118/400
|
758 |
+
Train loss: 70344976.00 correlation: 0.3049
|
759 |
+
Validation loss: 166439680.00 correlation: 0.2509
|
760 |
+
Elapse: 546.75s
|
761 |
+
|
762 |
+
Epoch 119/400
|
763 |
+
Train loss: 70278184.00 correlation: 0.3054
|
764 |
+
Validation loss: 166439840.00 correlation: 0.2509
|
765 |
+
Elapse: 547.33s
|
766 |
+
|
767 |
+
Epoch 120/400
|
768 |
+
Train loss: 70224856.00 correlation: 0.3062
|
769 |
+
Validation loss: 166439440.00 correlation: 0.2509
|
770 |
+
Elapse: 546.94s
|
771 |
+
|
772 |
+
Epoch 121/400
|
773 |
+
Train loss: 70317744.00 correlation: 0.3049
|
774 |
+
Validation loss: 166439280.00 correlation: 0.2509
|
775 |
+
Elapse: 547.22s
|
776 |
+
|
777 |
+
Epoch 122/400
|
778 |
+
Train loss: 70322624.00 correlation: 0.3052
|
779 |
+
Validation loss: 166438784.00 correlation: 0.2509
|
780 |
+
Elapse: 546.83s
|
781 |
+
|
782 |
+
Model has not improved after 2 LR reductions.
|
783 |
+
|
784 |
+
Loaded checkpoint from epoch 107 (correlation: 0.2509).
|
785 |
+
|
786 |
+
|
787 |
+
ValidationA: 0.2475 B: 0.2751 C: 0.2730 D: 0.2364 E: 0.2355 F: 0.2343 G: 0.2543 H: 0.2344 I: 0.2602 J: 0.2588 average: 0.2509
|
788 |
+
|
789 |
+
Results saved to /home/storage/runs/vivit_ensemble/012.
|
004/args.yaml
ADDED
@@ -0,0 +1,87 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
adam_beta1: 0.9
|
2 |
+
adam_beta2: 0.999
|
3 |
+
adam_eps: 1e-08
|
4 |
+
batch_size: 6
|
5 |
+
cache_data: false
|
6 |
+
center_crop: 1.0
|
7 |
+
clear_output_dir: true
|
8 |
+
core: vivit
|
9 |
+
core_behavior_mode: 2
|
10 |
+
core_compile: false
|
11 |
+
core_drop_path: 0.0505
|
12 |
+
core_emb_dim: 112
|
13 |
+
core_ff_activation: gelu
|
14 |
+
core_ff_dropout: 0.0592
|
15 |
+
core_flash_attention: 1
|
16 |
+
core_head_dim: 48
|
17 |
+
core_lr: 0.0048
|
18 |
+
core_mha_dropout: 0.358
|
19 |
+
core_mlp_dim: 136
|
20 |
+
core_norm_qk: false
|
21 |
+
core_num_heads: 11
|
22 |
+
core_p_dropout: 0.1338
|
23 |
+
core_parallel_attention: true
|
24 |
+
core_patch_mode: 0
|
25 |
+
core_pos_encoding: 3
|
26 |
+
core_spatial_depth: 3
|
27 |
+
core_spatial_patch_size: 7
|
28 |
+
core_spatial_patch_stride: 2
|
29 |
+
core_temporal_depth: 5
|
30 |
+
core_temporal_patch_size: 25
|
31 |
+
core_temporal_patch_stride: 1
|
32 |
+
core_weight_decay: 0.1789
|
33 |
+
criterion: poisson_correlation
|
34 |
+
critic_mode: 0
|
35 |
+
crop_frame: 140
|
36 |
+
data: /home/sensorium2023
|
37 |
+
deterministic: false
|
38 |
+
device: cuda
|
39 |
+
dpi: 120
|
40 |
+
ds_mode: 3
|
41 |
+
ds_scale: 1
|
42 |
+
epochs: 400
|
43 |
+
format: svg
|
44 |
+
git_hash: 1033c29
|
45 |
+
grad_checkpointing: 0
|
46 |
+
grad_norm: null
|
47 |
+
input_shapes:
|
48 |
+
behavior: [2, 140]
|
49 |
+
pupil_center: [2, 140]
|
50 |
+
video: [1, 140, 36, 64]
|
51 |
+
limit_data: null
|
52 |
+
lr: 0.0036
|
53 |
+
max_frame: 300
|
54 |
+
micro_batch_size: 6
|
55 |
+
modulator_mode: 0
|
56 |
+
mouse_ids: [A, B, C, D, E, F, G, H, I, J]
|
57 |
+
num_workers: 2
|
58 |
+
output_dir: /home/storage/runs/004
|
59 |
+
output_mode: 1
|
60 |
+
output_shapes:
|
61 |
+
A: [7440, 140]
|
62 |
+
B: [7928, 140]
|
63 |
+
C: [8285, 140]
|
64 |
+
D: [7671, 140]
|
65 |
+
E: [7495, 140]
|
66 |
+
F: [7863, 140]
|
67 |
+
G: [7908, 140]
|
68 |
+
H: [8202, 140]
|
69 |
+
I: [7939, 140]
|
70 |
+
J: [8122, 140]
|
71 |
+
precision: "32"
|
72 |
+
pretrain_core: null
|
73 |
+
readout: gaussian2d
|
74 |
+
readout_bias_mode: 2
|
75 |
+
readout_dropout: 0.0
|
76 |
+
readout_grid_mode: 1
|
77 |
+
restore: null
|
78 |
+
save_plots: false
|
79 |
+
seed: 15
|
80 |
+
shifter_layers: 3
|
81 |
+
shifter_mode: 1
|
82 |
+
shifter_size: 5
|
83 |
+
stat_mode: 1
|
84 |
+
trainable_params: 12278365
|
85 |
+
transform_mode: 2
|
86 |
+
verbose: 1
|
87 |
+
weight_decay: 0.3939
|
004/ckpt/model_state.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8538df1cffe25f014e11f5db7e89d7b4e8167dd9545be98a14aa7f78e7bc6b42
|
3 |
+
size 148268583
|
004/evaluation.yaml
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
validation: {A: 0.24283820390701294, B: 0.2745824456214905, C: 0.2716088593006134,
|
2 |
+
D: 0.2359682023525238, E: 0.2350907325744629, F: 0.2335391342639923, G: 0.25313541293144226,
|
3 |
+
H: 0.23314021527767181, I: 0.25676068663597107, J: 0.2575773298740387, average: 0.24942412227392197}
|
004/model.txt
ADDED
@@ -0,0 +1,143 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
=======================================================================================================================================
|
2 |
+
Layer (type:depth-idx) Input Shape Output Shape Param #
|
3 |
+
=======================================================================================================================================
|
4 |
+
Model -- [1, 7440, 116] --
|
5 |
+
├─ViViTCore: 1-1 -- [1, 112, 116, 15, 29] --
|
6 |
+
│ └─ViViT: 2-1 [1, 5, 140, 36, 64] [1, 112, 116, 15, 29] --
|
7 |
+
│ │ └─Tokenizer: 3-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] 79,632
|
8 |
+
│ │ │ └─Sequential: 4-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] --
|
9 |
+
│ │ │ │ └─Unfold3d: 5-1 [1, 5, 140, 36, 64] [1, 116, 435, 6125] --
|
10 |
+
│ │ │ │ └─LayerNorm: 5-2 [1, 116, 435, 6125] [1, 116, 435, 6125] 12,250
|
11 |
+
│ │ │ │ └─Linear: 5-3 [1, 116, 435, 6125] [1, 116, 435, 112] 686,112
|
12 |
+
│ │ │ │ └─LayerNorm: 5-4 [1, 116, 435, 112] [1, 116, 435, 112] 224
|
13 |
+
│ │ │ │ └─Dropout: 5-5 [1, 116, 435, 112] [1, 116, 435, 112] --
|
14 |
+
│ │ └─Transformer: 3-2 [116, 435, 112] [116, 435, 112] --
|
15 |
+
│ │ │ └─ModuleList: 4-2 -- -- --
|
16 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-6 [116, 435, 112] [116, 435, 112] --
|
17 |
+
│ │ │ │ │ └─LayerNorm: 6-1 [116, 435, 112] [116, 435, 112] 224
|
18 |
+
│ │ │ │ │ └─Linear: 6-2 [116, 435, 112] [116, 435, 1720] 192,640
|
19 |
+
│ │ │ │ │ └─Linear: 6-3 [116, 435, 528] [116, 435, 112] 59,136
|
20 |
+
│ │ │ │ │ └─DropPath: 6-4 [116, 435, 112] [116, 435, 112] --
|
21 |
+
│ │ │ │ │ └─Sequential: 6-5 [116, 435, 136] [116, 435, 112] --
|
22 |
+
│ │ │ │ │ │ └─GELU: 7-1 [116, 435, 136] [116, 435, 136] --
|
23 |
+
│ │ │ │ │ │ └─Dropout: 7-2 [116, 435, 136] [116, 435, 136] --
|
24 |
+
│ │ │ │ │ │ └─Linear: 7-3 [116, 435, 136] [116, 435, 112] 15,232
|
25 |
+
│ │ │ │ │ └─DropPath: 6-6 [116, 435, 112] [116, 435, 112] --
|
26 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-7 [116, 435, 112] [116, 435, 112] --
|
27 |
+
│ │ │ │ │ └─LayerNorm: 6-7 [116, 435, 112] [116, 435, 112] 224
|
28 |
+
│ │ │ │ │ └─Linear: 6-8 [116, 435, 112] [116, 435, 1720] 192,640
|
29 |
+
│ │ │ │ │ └─Linear: 6-9 [116, 435, 528] [116, 435, 112] 59,136
|
30 |
+
│ │ │ │ │ └─DropPath: 6-10 [116, 435, 112] [116, 435, 112] --
|
31 |
+
│ │ │ │ │ └─Sequential: 6-11 [116, 435, 136] [116, 435, 112] --
|
32 |
+
│ │ │ │ │ │ └─GELU: 7-4 [116, 435, 136] [116, 435, 136] --
|
33 |
+
│ │ │ │ │ │ └─Dropout: 7-5 [116, 435, 136] [116, 435, 136] --
|
34 |
+
│ │ │ │ │ │ └─Linear: 7-6 [116, 435, 136] [116, 435, 112] 15,232
|
35 |
+
│ │ │ │ │ └─DropPath: 6-12 [116, 435, 112] [116, 435, 112] --
|
36 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-8 [116, 435, 112] [116, 435, 112] --
|
37 |
+
│ │ │ │ │ └─LayerNorm: 6-13 [116, 435, 112] [116, 435, 112] 224
|
38 |
+
│ │ │ │ │ └─Linear: 6-14 [116, 435, 112] [116, 435, 1720] 192,640
|
39 |
+
│ │ │ │ │ └─Linear: 6-15 [116, 435, 528] [116, 435, 112] 59,136
|
40 |
+
│ │ │ │ │ └─DropPath: 6-16 [116, 435, 112] [116, 435, 112] --
|
41 |
+
│ │ │ │ │ └─Sequential: 6-17 [116, 435, 136] [116, 435, 112] --
|
42 |
+
│ │ │ │ │ │ └─GELU: 7-7 [116, 435, 136] [116, 435, 136] --
|
43 |
+
│ │ │ │ │ │ └─Dropout: 7-8 [116, 435, 136] [116, 435, 136] --
|
44 |
+
│ │ │ │ │ │ └─Linear: 7-9 [116, 435, 136] [116, 435, 112] 15,232
|
45 |
+
│ │ │ │ │ └─DropPath: 6-18 [116, 435, 112] [116, 435, 112] --
|
46 |
+
│ │ └─Transformer: 3-3 [435, 116, 112] [435, 116, 112] --
|
47 |
+
│ │ │ └─ModuleList: 4-3 -- -- --
|
48 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-9 [435, 116, 112] [435, 116, 112] --
|
49 |
+
│ │ │ │ │ └─LayerNorm: 6-19 [435, 116, 112] [435, 116, 112] 224
|
50 |
+
│ │ │ │ │ └─Linear: 6-20 [435, 116, 112] [435, 116, 1720] 192,640
|
51 |
+
│ │ │ │ │ └─Linear: 6-21 [435, 116, 528] [435, 116, 112] 59,136
|
52 |
+
│ │ │ │ │ └─DropPath: 6-22 [435, 116, 112] [435, 116, 112] --
|
53 |
+
│ │ │ │ │ └─Sequential: 6-23 [435, 116, 136] [435, 116, 112] --
|
54 |
+
│ │ │ │ │ │ └─GELU: 7-10 [435, 116, 136] [435, 116, 136] --
|
55 |
+
│ │ │ │ │ │ └─Dropout: 7-11 [435, 116, 136] [435, 116, 136] --
|
56 |
+
│ │ │ │ │ │ └─Linear: 7-12 [435, 116, 136] [435, 116, 112] 15,232
|
57 |
+
│ │ │ │ │ └─DropPath: 6-24 [435, 116, 112] [435, 116, 112] --
|
58 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-10 [435, 116, 112] [435, 116, 112] --
|
59 |
+
│ │ │ │ │ └─LayerNorm: 6-25 [435, 116, 112] [435, 116, 112] 224
|
60 |
+
│ │ │ │ │ └─Linear: 6-26 [435, 116, 112] [435, 116, 1720] 192,640
|
61 |
+
│ │ │ │ │ └─Linear: 6-27 [435, 116, 528] [435, 116, 112] 59,136
|
62 |
+
│ │ │ │ │ └─DropPath: 6-28 [435, 116, 112] [435, 116, 112] --
|
63 |
+
│ │ │ │ │ └─Sequential: 6-29 [435, 116, 136] [435, 116, 112] --
|
64 |
+
│ │ │ │ │ │ └─GELU: 7-13 [435, 116, 136] [435, 116, 136] --
|
65 |
+
│ │ │ │ │ │ └─Dropout: 7-14 [435, 116, 136] [435, 116, 136] --
|
66 |
+
│ │ │ │ │ │ └─Linear: 7-15 [435, 116, 136] [435, 116, 112] 15,232
|
67 |
+
│ │ │ │ │ └─DropPath: 6-30 [435, 116, 112] [435, 116, 112] --
|
68 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-11 [435, 116, 112] [435, 116, 112] --
|
69 |
+
│ │ │ │ │ └─LayerNorm: 6-31 [435, 116, 112] [435, 116, 112] 224
|
70 |
+
│ │ │ │ │ └─Linear: 6-32 [435, 116, 112] [435, 116, 1720] 192,640
|
71 |
+
│ │ │ │ │ └─Linear: 6-33 [435, 116, 528] [435, 116, 112] 59,136
|
72 |
+
│ │ │ │ │ └─DropPath: 6-34 [435, 116, 112] [435, 116, 112] --
|
73 |
+
│ │ │ │ │ └─Sequential: 6-35 [435, 116, 136] [435, 116, 112] --
|
74 |
+
│ │ │ │ │ │ └─GELU: 7-16 [435, 116, 136] [435, 116, 136] --
|
75 |
+
│ │ │ │ │ │ └─Dropout: 7-17 [435, 116, 136] [435, 116, 136] --
|
76 |
+
│ │ │ │ │ │ └─Linear: 7-18 [435, 116, 136] [435, 116, 112] 15,232
|
77 |
+
│ │ │ │ │ └─DropPath: 6-36 [435, 116, 112] [435, 116, 112] --
|
78 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-12 [435, 116, 112] [435, 116, 112] --
|
79 |
+
│ │ │ │ │ └─LayerNorm: 6-37 [435, 116, 112] [435, 116, 112] 224
|
80 |
+
│ │ │ │ │ └─Linear: 6-38 [435, 116, 112] [435, 116, 1720] 192,640
|
81 |
+
│ │ │ │ │ └─Linear: 6-39 [435, 116, 528] [435, 116, 112] 59,136
|
82 |
+
│ │ │ │ │ └─DropPath: 6-40 [435, 116, 112] [435, 116, 112] --
|
83 |
+
│ │ │ │ │ └─Sequential: 6-41 [435, 116, 136] [435, 116, 112] --
|
84 |
+
│ │ │ │ │ │ └─GELU: 7-19 [435, 116, 136] [435, 116, 136] --
|
85 |
+
│ │ │ │ │ │ └─Dropout: 7-20 [435, 116, 136] [435, 116, 136] --
|
86 |
+
│ │ │ │ │ │ └─Linear: 7-21 [435, 116, 136] [435, 116, 112] 15,232
|
87 |
+
│ │ │ │ │ └─DropPath: 6-42 [435, 116, 112] [435, 116, 112] --
|
88 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-13 [435, 116, 112] [435, 116, 112] --
|
89 |
+
│ │ │ │ │ └─LayerNorm: 6-43 [435, 116, 112] [435, 116, 112] 224
|
90 |
+
│ │ │ │ │ └─Linear: 6-44 [435, 116, 112] [435, 116, 1720] 192,640
|
91 |
+
│ │ │ │ │ └─Linear: 6-45 [435, 116, 528] [435, 116, 112] 59,136
|
92 |
+
│ │ │ │ │ └─DropPath: 6-46 [435, 116, 112] [435, 116, 112] --
|
93 |
+
│ │ │ │ │ └─Sequential: 6-47 [435, 116, 136] [435, 116, 112] --
|
94 |
+
│ │ │ │ │ │ └─GELU: 7-22 [435, 116, 136] [435, 116, 136] --
|
95 |
+
│ │ │ │ │ │ └─Dropout: 7-23 [435, 116, 136] [435, 116, 136] --
|
96 |
+
│ │ │ │ │ │ └─Linear: 7-24 [435, 116, 136] [435, 116, 112] 15,232
|
97 |
+
│ │ │ │ │ └─DropPath: 6-48 [435, 116, 112] [435, 116, 112] --
|
98 |
+
│ │ └─Rearrange: 3-4 [1, 116, 435, 112] [1, 112, 116, 15, 29] --
|
99 |
+
├─MLPShifters: 1-2 -- [1, 2, 116] 513
|
100 |
+
│ └─MLPShifter: 2-2 [116, 2] [116, 2] --
|
101 |
+
│ │ └─Sequential: 3-5 [116, 2] [116, 2] --
|
102 |
+
│ │ │ └─Linear: 4-4 [116, 2] [116, 5] 15
|
103 |
+
│ │ │ └─Tanh: 4-5 [116, 5] [116, 5] --
|
104 |
+
│ │ │ └─Linear: 4-6 [116, 5] [116, 5] 30
|
105 |
+
│ │ │ └─Tanh: 4-7 [116, 5] [116, 5] --
|
106 |
+
│ │ │ └─Linear: 4-8 [116, 5] [116, 2] 12
|
107 |
+
│ │ │ └─Tanh: 4-9 [116, 2] [116, 2] --
|
108 |
+
├─Readouts: 1-3 [1, 112, 116, 15, 29] [1, 7440, 116] 8,477,649
|
109 |
+
│ └─Gaussian2DReadout2: 2-3 [1, 112, 116, 15, 29] [1, 7440, 116] 870,480
|
110 |
+
│ │ └─Sequential: 3-6 [7440, 2] [7440, 2] --
|
111 |
+
│ │ │ └─Linear: 4-10 [7440, 2] [7440, 30] 90
|
112 |
+
│ │ │ └─ELU: 4-11 [7440, 30] [7440, 30] --
|
113 |
+
│ │ │ └─Linear: 4-12 [7440, 30] [7440, 2] 62
|
114 |
+
│ │ │ └─Tanh: 4-13 [7440, 2] [7440, 2] --
|
115 |
+
│ │ └─Sequential: 3-7 [7440, 2] [7440, 2] (recursive)
|
116 |
+
│ │ │ └─Linear: 4-14 [7440, 2] [7440, 30] (recursive)
|
117 |
+
│ │ │ └─ELU: 4-15 [7440, 30] [7440, 30] --
|
118 |
+
│ │ │ └─Linear: 4-16 [7440, 30] [7440, 2] (recursive)
|
119 |
+
│ │ │ └─Tanh: 4-17 [7440, 2] [7440, 2] --
|
120 |
+
│ │ └─Sequential: 3-8 [7440, 2] [7440, 2] (recursive)
|
121 |
+
│ │ │ └─Linear: 4-18 [7440, 2] [7440, 30] (recursive)
|
122 |
+
│ │ │ └─ELU: 4-19 [7440, 30] [7440, 30] --
|
123 |
+
│ │ │ └─Linear: 4-20 [7440, 30] [7440, 2] (recursive)
|
124 |
+
│ │ │ └─Tanh: 4-21 [7440, 2] [7440, 2] --
|
125 |
+
│ │ └─Sequential: 3-9 [116, 4] [116, 112] --
|
126 |
+
│ │ │ └─Linear: 4-22 [116, 4] [116, 112] 560
|
127 |
+
│ │ │ └─LayerNorm: 4-23 [116, 112] [116, 112] 224
|
128 |
+
│ │ │ └─GELU: 4-24 [116, 112] [116, 112] --
|
129 |
+
│ │ │ └─Dropout: 4-25 [116, 112] [116, 112] --
|
130 |
+
│ │ │ └─Linear: 4-26 [116, 112] [116, 112] 12,656
|
131 |
+
│ │ │ └─Tanh: 4-27 [116, 112] [116, 112] --
|
132 |
+
├─Exponential: 1-4 [1, 7440, 116] [1, 7440, 116] --
|
133 |
+
=======================================================================================================================================
|
134 |
+
Total params: 12,278,365
|
135 |
+
Trainable params: 12,278,365
|
136 |
+
Non-trainable params: 0
|
137 |
+
Total mult-adds (Units.MEGABYTES): 679.88
|
138 |
+
=======================================================================================================================================
|
139 |
+
Input size (MB): 1.29
|
140 |
+
Forward/backward pass size (MB): 9208.73
|
141 |
+
Params size (MB): 11.40
|
142 |
+
Estimated Total Size (MB): 9221.42
|
143 |
+
=======================================================================================================================================
|
004/output.log
ADDED
@@ -0,0 +1,770 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Use bfloat16 for core module.
|
2 |
+
Use parallel attention and MLP in ViViT.
|
3 |
+
|
4 |
+
Epoch 001/400
|
5 |
+
Train loss: 108875712.00 correlation: 0.0142
|
6 |
+
Validation loss: 200009632.00 correlation: 0.0280
|
7 |
+
Elapse: 536.31s
|
8 |
+
|
9 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
10 |
+
|
11 |
+
Epoch 002/400
|
12 |
+
Train loss: 97286888.00 correlation: 0.0397
|
13 |
+
Validation loss: 199179056.00 correlation: 0.0389
|
14 |
+
Elapse: 540.45s
|
15 |
+
|
16 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
17 |
+
|
18 |
+
Epoch 003/400
|
19 |
+
Train loss: 96065840.00 correlation: 0.0525
|
20 |
+
Validation loss: 198705632.00 correlation: 0.0414
|
21 |
+
Elapse: 548.06s
|
22 |
+
|
23 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
24 |
+
|
25 |
+
Epoch 004/400
|
26 |
+
Train loss: 95196720.00 correlation: 0.0616
|
27 |
+
Validation loss: 197267888.00 correlation: 0.0520
|
28 |
+
Elapse: 550.50s
|
29 |
+
|
30 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
31 |
+
|
32 |
+
Epoch 005/400
|
33 |
+
Train loss: 94175976.00 correlation: 0.0728
|
34 |
+
Validation loss: 195531712.00 correlation: 0.0637
|
35 |
+
Elapse: 549.52s
|
36 |
+
|
37 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
38 |
+
|
39 |
+
Epoch 006/400
|
40 |
+
Train loss: 92696320.00 correlation: 0.0883
|
41 |
+
Validation loss: 193088208.00 correlation: 0.0800
|
42 |
+
Elapse: 547.83s
|
43 |
+
|
44 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
45 |
+
|
46 |
+
Epoch 007/400
|
47 |
+
Train loss: 91328912.00 correlation: 0.1027
|
48 |
+
Validation loss: 190954368.00 correlation: 0.0931
|
49 |
+
Elapse: 546.41s
|
50 |
+
|
51 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
52 |
+
|
53 |
+
Epoch 008/400
|
54 |
+
Train loss: 90154608.00 correlation: 0.1149
|
55 |
+
Validation loss: 189186224.00 correlation: 0.1027
|
56 |
+
Elapse: 544.21s
|
57 |
+
|
58 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
59 |
+
|
60 |
+
Epoch 009/400
|
61 |
+
Train loss: 88984904.00 correlation: 0.1267
|
62 |
+
Validation loss: 187096768.00 correlation: 0.1152
|
63 |
+
Elapse: 542.67s
|
64 |
+
|
65 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
66 |
+
|
67 |
+
Epoch 010/400
|
68 |
+
Train loss: 87719928.00 correlation: 0.1389
|
69 |
+
Validation loss: 185224656.00 correlation: 0.1287
|
70 |
+
Elapse: 541.24s
|
71 |
+
|
72 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
73 |
+
|
74 |
+
Epoch 011/400
|
75 |
+
Train loss: 86455896.00 correlation: 0.1522
|
76 |
+
Validation loss: 183495936.00 correlation: 0.1386
|
77 |
+
Elapse: 540.40s
|
78 |
+
|
79 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
80 |
+
|
81 |
+
Epoch 012/400
|
82 |
+
Train loss: 85286208.00 correlation: 0.1638
|
83 |
+
Validation loss: 181750576.00 correlation: 0.1502
|
84 |
+
Elapse: 539.78s
|
85 |
+
|
86 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
87 |
+
|
88 |
+
Epoch 013/400
|
89 |
+
Train loss: 84359632.00 correlation: 0.1728
|
90 |
+
Validation loss: 180806192.00 correlation: 0.1570
|
91 |
+
Elapse: 540.59s
|
92 |
+
|
93 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
94 |
+
|
95 |
+
Epoch 014/400
|
96 |
+
Train loss: 83654496.00 correlation: 0.1800
|
97 |
+
Validation loss: 179662112.00 correlation: 0.1648
|
98 |
+
Elapse: 539.99s
|
99 |
+
|
100 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
101 |
+
|
102 |
+
Epoch 015/400
|
103 |
+
Train loss: 82936160.00 correlation: 0.1870
|
104 |
+
Validation loss: 178832416.00 correlation: 0.1697
|
105 |
+
Elapse: 540.96s
|
106 |
+
|
107 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
108 |
+
|
109 |
+
Epoch 016/400
|
110 |
+
Train loss: 82256432.00 correlation: 0.1933
|
111 |
+
Validation loss: 177940560.00 correlation: 0.1755
|
112 |
+
Elapse: 541.08s
|
113 |
+
|
114 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
115 |
+
|
116 |
+
Epoch 017/400
|
117 |
+
Train loss: 81816704.00 correlation: 0.1974
|
118 |
+
Validation loss: 177331792.00 correlation: 0.1789
|
119 |
+
Elapse: 541.24s
|
120 |
+
|
121 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
122 |
+
|
123 |
+
Epoch 018/400
|
124 |
+
Train loss: 81317624.00 correlation: 0.2024
|
125 |
+
Validation loss: 176620096.00 correlation: 0.1839
|
126 |
+
Elapse: 541.38s
|
127 |
+
|
128 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
129 |
+
|
130 |
+
Epoch 019/400
|
131 |
+
Train loss: 80761904.00 correlation: 0.2073
|
132 |
+
Validation loss: 175956080.00 correlation: 0.1882
|
133 |
+
Elapse: 540.85s
|
134 |
+
|
135 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
136 |
+
|
137 |
+
Epoch 020/400
|
138 |
+
Train loss: 80425104.00 correlation: 0.2111
|
139 |
+
Validation loss: 175399376.00 correlation: 0.1923
|
140 |
+
Elapse: 541.23s
|
141 |
+
|
142 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
143 |
+
|
144 |
+
Epoch 021/400
|
145 |
+
Train loss: 80006704.00 correlation: 0.2149
|
146 |
+
Validation loss: 174810944.00 correlation: 0.1963
|
147 |
+
Elapse: 540.64s
|
148 |
+
|
149 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
150 |
+
|
151 |
+
Epoch 022/400
|
152 |
+
Train loss: 79605576.00 correlation: 0.2188
|
153 |
+
Validation loss: 174441312.00 correlation: 0.1990
|
154 |
+
Elapse: 541.29s
|
155 |
+
|
156 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
157 |
+
|
158 |
+
Epoch 023/400
|
159 |
+
Train loss: 79238384.00 correlation: 0.2225
|
160 |
+
Validation loss: 173628144.00 correlation: 0.2041
|
161 |
+
Elapse: 541.23s
|
162 |
+
|
163 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
164 |
+
|
165 |
+
Epoch 024/400
|
166 |
+
Train loss: 78942312.00 correlation: 0.2253
|
167 |
+
Validation loss: 173239408.00 correlation: 0.2069
|
168 |
+
Elapse: 541.38s
|
169 |
+
|
170 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
171 |
+
|
172 |
+
Epoch 025/400
|
173 |
+
Train loss: 78635512.00 correlation: 0.2284
|
174 |
+
Validation loss: 172979872.00 correlation: 0.2084
|
175 |
+
Elapse: 541.43s
|
176 |
+
|
177 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
178 |
+
|
179 |
+
Epoch 026/400
|
180 |
+
Train loss: 78411792.00 correlation: 0.2303
|
181 |
+
Validation loss: 172513792.00 correlation: 0.2110
|
182 |
+
Elapse: 541.42s
|
183 |
+
|
184 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
185 |
+
|
186 |
+
Epoch 027/400
|
187 |
+
Train loss: 78185872.00 correlation: 0.2329
|
188 |
+
Validation loss: 172230208.00 correlation: 0.2128
|
189 |
+
Elapse: 540.87s
|
190 |
+
|
191 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
192 |
+
|
193 |
+
Epoch 028/400
|
194 |
+
Train loss: 77904656.00 correlation: 0.2353
|
195 |
+
Validation loss: 172162992.00 correlation: 0.2139
|
196 |
+
Elapse: 541.44s
|
197 |
+
|
198 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
199 |
+
|
200 |
+
Epoch 029/400
|
201 |
+
Train loss: 77741728.00 correlation: 0.2368
|
202 |
+
Validation loss: 171699152.00 correlation: 0.2166
|
203 |
+
Elapse: 542.05s
|
204 |
+
|
205 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
206 |
+
|
207 |
+
Epoch 030/400
|
208 |
+
Train loss: 77624216.00 correlation: 0.2381
|
209 |
+
Validation loss: 171523792.00 correlation: 0.2179
|
210 |
+
Elapse: 541.70s
|
211 |
+
|
212 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
213 |
+
|
214 |
+
Epoch 031/400
|
215 |
+
Train loss: 77405640.00 correlation: 0.2398
|
216 |
+
Validation loss: 171512912.00 correlation: 0.2182
|
217 |
+
Elapse: 541.80s
|
218 |
+
|
219 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
220 |
+
|
221 |
+
Epoch 032/400
|
222 |
+
Train loss: 77315544.00 correlation: 0.2411
|
223 |
+
Validation loss: 171059296.00 correlation: 0.2209
|
224 |
+
Elapse: 541.92s
|
225 |
+
|
226 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
227 |
+
|
228 |
+
Epoch 033/400
|
229 |
+
Train loss: 77214704.00 correlation: 0.2420
|
230 |
+
Validation loss: 171228784.00 correlation: 0.2201
|
231 |
+
Elapse: 541.77s
|
232 |
+
|
233 |
+
Epoch 034/400
|
234 |
+
Train loss: 77108704.00 correlation: 0.2433
|
235 |
+
Validation loss: 170971952.00 correlation: 0.2219
|
236 |
+
Elapse: 541.81s
|
237 |
+
|
238 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
239 |
+
|
240 |
+
Epoch 035/400
|
241 |
+
Train loss: 76970384.00 correlation: 0.2445
|
242 |
+
Validation loss: 170653312.00 correlation: 0.2236
|
243 |
+
Elapse: 542.50s
|
244 |
+
|
245 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
246 |
+
|
247 |
+
Epoch 036/400
|
248 |
+
Train loss: 76829184.00 correlation: 0.2459
|
249 |
+
Validation loss: 170723072.00 correlation: 0.2228
|
250 |
+
Elapse: 542.11s
|
251 |
+
|
252 |
+
Epoch 037/400
|
253 |
+
Train loss: 76814728.00 correlation: 0.2461
|
254 |
+
Validation loss: 170317536.00 correlation: 0.2260
|
255 |
+
Elapse: 542.26s
|
256 |
+
|
257 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
258 |
+
|
259 |
+
Epoch 038/400
|
260 |
+
Train loss: 76648232.00 correlation: 0.2476
|
261 |
+
Validation loss: 170352096.00 correlation: 0.2263
|
262 |
+
Elapse: 542.30s
|
263 |
+
|
264 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
265 |
+
|
266 |
+
Epoch 039/400
|
267 |
+
Train loss: 76570480.00 correlation: 0.2485
|
268 |
+
Validation loss: 170048544.00 correlation: 0.2276
|
269 |
+
Elapse: 542.30s
|
270 |
+
|
271 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
272 |
+
|
273 |
+
Epoch 040/400
|
274 |
+
Train loss: 76481936.00 correlation: 0.2492
|
275 |
+
Validation loss: 170178064.00 correlation: 0.2271
|
276 |
+
Elapse: 542.72s
|
277 |
+
|
278 |
+
Epoch 041/400
|
279 |
+
Train loss: 76392648.00 correlation: 0.2501
|
280 |
+
Validation loss: 169916672.00 correlation: 0.2292
|
281 |
+
Elapse: 542.22s
|
282 |
+
|
283 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
284 |
+
|
285 |
+
Epoch 042/400
|
286 |
+
Train loss: 76277856.00 correlation: 0.2512
|
287 |
+
Validation loss: 169939984.00 correlation: 0.2288
|
288 |
+
Elapse: 542.30s
|
289 |
+
|
290 |
+
Epoch 043/400
|
291 |
+
Train loss: 76200912.00 correlation: 0.2518
|
292 |
+
Validation loss: 169966848.00 correlation: 0.2293
|
293 |
+
Elapse: 543.01s
|
294 |
+
|
295 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
296 |
+
|
297 |
+
Epoch 044/400
|
298 |
+
Train loss: 76180752.00 correlation: 0.2520
|
299 |
+
Validation loss: 169804672.00 correlation: 0.2301
|
300 |
+
Elapse: 541.51s
|
301 |
+
|
302 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
303 |
+
|
304 |
+
Epoch 045/400
|
305 |
+
Train loss: 76124944.00 correlation: 0.2529
|
306 |
+
Validation loss: 169699056.00 correlation: 0.2297
|
307 |
+
Elapse: 541.18s
|
308 |
+
|
309 |
+
Epoch 046/400
|
310 |
+
Train loss: 75982544.00 correlation: 0.2542
|
311 |
+
Validation loss: 169554976.00 correlation: 0.2308
|
312 |
+
Elapse: 541.59s
|
313 |
+
|
314 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
315 |
+
|
316 |
+
Epoch 047/400
|
317 |
+
Train loss: 75966320.00 correlation: 0.2542
|
318 |
+
Validation loss: 169422160.00 correlation: 0.2317
|
319 |
+
Elapse: 540.36s
|
320 |
+
|
321 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
322 |
+
|
323 |
+
Epoch 048/400
|
324 |
+
Train loss: 75923248.00 correlation: 0.2547
|
325 |
+
Validation loss: 169780352.00 correlation: 0.2287
|
326 |
+
Elapse: 540.75s
|
327 |
+
|
328 |
+
Epoch 049/400
|
329 |
+
Train loss: 75947968.00 correlation: 0.2547
|
330 |
+
Validation loss: 169837856.00 correlation: 0.2298
|
331 |
+
Elapse: 541.57s
|
332 |
+
|
333 |
+
Epoch 050/400
|
334 |
+
Train loss: 75809040.00 correlation: 0.2556
|
335 |
+
Validation loss: 169605200.00 correlation: 0.2306
|
336 |
+
Elapse: 541.98s
|
337 |
+
|
338 |
+
Epoch 051/400
|
339 |
+
Train loss: 75789808.00 correlation: 0.2558
|
340 |
+
Validation loss: 169401440.00 correlation: 0.2307
|
341 |
+
Elapse: 542.15s
|
342 |
+
|
343 |
+
Epoch 052/400
|
344 |
+
Train loss: 75764560.00 correlation: 0.2561
|
345 |
+
Validation loss: 169899840.00 correlation: 0.2291
|
346 |
+
Elapse: 541.98s
|
347 |
+
|
348 |
+
Loaded checkpoint from epoch 47 (correlation: 0.2317).
|
349 |
+
|
350 |
+
Reduce learning rate of core to 1.4400e-03 (num. reduce: 1).
|
351 |
+
Reduce learning rate of readouts to 1.0800e-03 (num. reduce: 1).
|
352 |
+
Reduce learning rate of shifters to 1.0800e-03 (num. reduce: 1).
|
353 |
+
|
354 |
+
Epoch 053/400
|
355 |
+
Train loss: 73947496.00 correlation: 0.2716
|
356 |
+
Validation loss: 167854176.00 correlation: 0.2423
|
357 |
+
Elapse: 542.40s
|
358 |
+
|
359 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
360 |
+
|
361 |
+
Epoch 054/400
|
362 |
+
Train loss: 73334280.00 correlation: 0.2771
|
363 |
+
Validation loss: 167810464.00 correlation: 0.2430
|
364 |
+
Elapse: 543.06s
|
365 |
+
|
366 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
367 |
+
|
368 |
+
Epoch 055/400
|
369 |
+
Train loss: 73178416.00 correlation: 0.2788
|
370 |
+
Validation loss: 167610272.00 correlation: 0.2431
|
371 |
+
Elapse: 543.11s
|
372 |
+
|
373 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
374 |
+
|
375 |
+
Epoch 056/400
|
376 |
+
Train loss: 73106944.00 correlation: 0.2793
|
377 |
+
Validation loss: 167676960.00 correlation: 0.2432
|
378 |
+
Elapse: 543.44s
|
379 |
+
|
380 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
381 |
+
|
382 |
+
Epoch 057/400
|
383 |
+
Train loss: 73098200.00 correlation: 0.2798
|
384 |
+
Validation loss: 167731616.00 correlation: 0.2427
|
385 |
+
Elapse: 543.05s
|
386 |
+
|
387 |
+
Epoch 058/400
|
388 |
+
Train loss: 73030688.00 correlation: 0.2803
|
389 |
+
Validation loss: 167715872.00 correlation: 0.2427
|
390 |
+
Elapse: 543.72s
|
391 |
+
|
392 |
+
Epoch 059/400
|
393 |
+
Train loss: 72944768.00 correlation: 0.2814
|
394 |
+
Validation loss: 167514192.00 correlation: 0.2440
|
395 |
+
Elapse: 543.63s
|
396 |
+
|
397 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
398 |
+
|
399 |
+
Epoch 060/400
|
400 |
+
Train loss: 72929872.00 correlation: 0.2815
|
401 |
+
Validation loss: 167771024.00 correlation: 0.2423
|
402 |
+
Elapse: 543.29s
|
403 |
+
|
404 |
+
Epoch 061/400
|
405 |
+
Train loss: 72848184.00 correlation: 0.2822
|
406 |
+
Validation loss: 167556976.00 correlation: 0.2437
|
407 |
+
Elapse: 543.81s
|
408 |
+
|
409 |
+
Epoch 062/400
|
410 |
+
Train loss: 72894440.00 correlation: 0.2819
|
411 |
+
Validation loss: 167687056.00 correlation: 0.2429
|
412 |
+
Elapse: 543.05s
|
413 |
+
|
414 |
+
Epoch 063/400
|
415 |
+
Train loss: 72843624.00 correlation: 0.2824
|
416 |
+
Validation loss: 167582688.00 correlation: 0.2431
|
417 |
+
Elapse: 544.00s
|
418 |
+
|
419 |
+
Epoch 064/400
|
420 |
+
Train loss: 72864712.00 correlation: 0.2818
|
421 |
+
Validation loss: 167485088.00 correlation: 0.2435
|
422 |
+
Elapse: 543.20s
|
423 |
+
|
424 |
+
Loaded checkpoint from epoch 59 (correlation: 0.2440).
|
425 |
+
|
426 |
+
Reduce learning rate of core to 4.3200e-04 (num. reduce: 1).
|
427 |
+
Reduce learning rate of readouts to 3.2400e-04 (num. reduce: 1).
|
428 |
+
Reduce learning rate of shifters to 3.2400e-04 (num. reduce: 1).
|
429 |
+
|
430 |
+
Epoch 065/400
|
431 |
+
Train loss: 72100880.00 correlation: 0.2884
|
432 |
+
Validation loss: 167043168.00 correlation: 0.2470
|
433 |
+
Elapse: 543.83s
|
434 |
+
|
435 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
436 |
+
|
437 |
+
Epoch 066/400
|
438 |
+
Train loss: 71817264.00 correlation: 0.2907
|
439 |
+
Validation loss: 166928480.00 correlation: 0.2480
|
440 |
+
Elapse: 543.10s
|
441 |
+
|
442 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
443 |
+
|
444 |
+
Epoch 067/400
|
445 |
+
Train loss: 71765488.00 correlation: 0.2914
|
446 |
+
Validation loss: 166935472.00 correlation: 0.2473
|
447 |
+
Elapse: 543.05s
|
448 |
+
|
449 |
+
Epoch 068/400
|
450 |
+
Train loss: 71709384.00 correlation: 0.2919
|
451 |
+
Validation loss: 166836192.00 correlation: 0.2479
|
452 |
+
Elapse: 544.05s
|
453 |
+
|
454 |
+
Epoch 069/400
|
455 |
+
Train loss: 71609624.00 correlation: 0.2931
|
456 |
+
Validation loss: 166932704.00 correlation: 0.2478
|
457 |
+
Elapse: 544.51s
|
458 |
+
|
459 |
+
Epoch 070/400
|
460 |
+
Train loss: 71532048.00 correlation: 0.2937
|
461 |
+
Validation loss: 166911168.00 correlation: 0.2475
|
462 |
+
Elapse: 543.81s
|
463 |
+
|
464 |
+
Epoch 071/400
|
465 |
+
Train loss: 71531912.00 correlation: 0.2938
|
466 |
+
Validation loss: 166931488.00 correlation: 0.2474
|
467 |
+
Elapse: 543.44s
|
468 |
+
|
469 |
+
Loaded checkpoint from epoch 66 (correlation: 0.2480).
|
470 |
+
|
471 |
+
Reduce learning rate of core to 1.2960e-04 (num. reduce: 1).
|
472 |
+
Reduce learning rate of readouts to 9.7200e-05 (num. reduce: 1).
|
473 |
+
Reduce learning rate of shifters to 9.7200e-05 (num. reduce: 1).
|
474 |
+
|
475 |
+
Epoch 072/400
|
476 |
+
Train loss: 71521936.00 correlation: 0.2938
|
477 |
+
Validation loss: 166835152.00 correlation: 0.2481
|
478 |
+
Elapse: 544.28s
|
479 |
+
|
480 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
481 |
+
|
482 |
+
Epoch 073/400
|
483 |
+
Train loss: 71422952.00 correlation: 0.2945
|
484 |
+
Validation loss: 166809568.00 correlation: 0.2486
|
485 |
+
Elapse: 542.98s
|
486 |
+
|
487 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
488 |
+
|
489 |
+
Epoch 074/400
|
490 |
+
Train loss: 71402352.00 correlation: 0.2945
|
491 |
+
Validation loss: 166765920.00 correlation: 0.2487
|
492 |
+
Elapse: 544.22s
|
493 |
+
|
494 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
495 |
+
|
496 |
+
Epoch 075/400
|
497 |
+
Train loss: 71357648.00 correlation: 0.2949
|
498 |
+
Validation loss: 166766240.00 correlation: 0.2487
|
499 |
+
Elapse: 544.05s
|
500 |
+
|
501 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
502 |
+
|
503 |
+
Epoch 076/400
|
504 |
+
Train loss: 71315664.00 correlation: 0.2955
|
505 |
+
Validation loss: 166761216.00 correlation: 0.2489
|
506 |
+
Elapse: 544.69s
|
507 |
+
|
508 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
509 |
+
|
510 |
+
Epoch 077/400
|
511 |
+
Train loss: 71363472.00 correlation: 0.2948
|
512 |
+
Validation loss: 166736352.00 correlation: 0.2489
|
513 |
+
Elapse: 544.27s
|
514 |
+
|
515 |
+
Epoch 078/400
|
516 |
+
Train loss: 71227736.00 correlation: 0.2964
|
517 |
+
Validation loss: 166733360.00 correlation: 0.2489
|
518 |
+
Elapse: 544.22s
|
519 |
+
|
520 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
521 |
+
|
522 |
+
Epoch 079/400
|
523 |
+
Train loss: 71277464.00 correlation: 0.2955
|
524 |
+
Validation loss: 166735664.00 correlation: 0.2488
|
525 |
+
Elapse: 543.94s
|
526 |
+
|
527 |
+
Epoch 080/400
|
528 |
+
Train loss: 71206488.00 correlation: 0.2965
|
529 |
+
Validation loss: 166742432.00 correlation: 0.2489
|
530 |
+
Elapse: 544.10s
|
531 |
+
|
532 |
+
Epoch 081/400
|
533 |
+
Train loss: 71163264.00 correlation: 0.2968
|
534 |
+
Validation loss: 166738592.00 correlation: 0.2489
|
535 |
+
Elapse: 544.08s
|
536 |
+
|
537 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
538 |
+
|
539 |
+
Epoch 082/400
|
540 |
+
Train loss: 71186960.00 correlation: 0.2968
|
541 |
+
Validation loss: 166722656.00 correlation: 0.2489
|
542 |
+
Elapse: 544.32s
|
543 |
+
|
544 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
545 |
+
|
546 |
+
Epoch 083/400
|
547 |
+
Train loss: 71185200.00 correlation: 0.2968
|
548 |
+
Validation loss: 166706704.00 correlation: 0.2489
|
549 |
+
Elapse: 543.20s
|
550 |
+
|
551 |
+
Epoch 084/400
|
552 |
+
Train loss: 71172336.00 correlation: 0.2970
|
553 |
+
Validation loss: 166667952.00 correlation: 0.2490
|
554 |
+
Elapse: 544.33s
|
555 |
+
|
556 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
557 |
+
|
558 |
+
Epoch 085/400
|
559 |
+
Train loss: 71094784.00 correlation: 0.2977
|
560 |
+
Validation loss: 166736224.00 correlation: 0.2490
|
561 |
+
Elapse: 544.02s
|
562 |
+
|
563 |
+
Epoch 086/400
|
564 |
+
Train loss: 71121680.00 correlation: 0.2972
|
565 |
+
Validation loss: 166702080.00 correlation: 0.2491
|
566 |
+
Elapse: 544.15s
|
567 |
+
|
568 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
569 |
+
|
570 |
+
Epoch 087/400
|
571 |
+
Train loss: 71068680.00 correlation: 0.2980
|
572 |
+
Validation loss: 166759776.00 correlation: 0.2488
|
573 |
+
Elapse: 544.35s
|
574 |
+
|
575 |
+
Epoch 088/400
|
576 |
+
Train loss: 71037376.00 correlation: 0.2982
|
577 |
+
Validation loss: 166717840.00 correlation: 0.2488
|
578 |
+
Elapse: 544.48s
|
579 |
+
|
580 |
+
Epoch 089/400
|
581 |
+
Train loss: 71044336.00 correlation: 0.2979
|
582 |
+
Validation loss: 166688608.00 correlation: 0.2491
|
583 |
+
Elapse: 543.63s
|
584 |
+
|
585 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
586 |
+
|
587 |
+
Epoch 090/400
|
588 |
+
Train loss: 71028720.00 correlation: 0.2984
|
589 |
+
Validation loss: 166697808.00 correlation: 0.2488
|
590 |
+
Elapse: 544.01s
|
591 |
+
|
592 |
+
Epoch 091/400
|
593 |
+
Train loss: 70956424.00 correlation: 0.2991
|
594 |
+
Validation loss: 166683104.00 correlation: 0.2491
|
595 |
+
Elapse: 544.36s
|
596 |
+
|
597 |
+
Epoch 092/400
|
598 |
+
Train loss: 71034488.00 correlation: 0.2982
|
599 |
+
Validation loss: 166691024.00 correlation: 0.2491
|
600 |
+
Elapse: 544.53s
|
601 |
+
|
602 |
+
Epoch 093/400
|
603 |
+
Train loss: 71008336.00 correlation: 0.2981
|
604 |
+
Validation loss: 166667472.00 correlation: 0.2493
|
605 |
+
Elapse: 544.24s
|
606 |
+
|
607 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
608 |
+
|
609 |
+
Epoch 094/400
|
610 |
+
Train loss: 70955584.00 correlation: 0.2990
|
611 |
+
Validation loss: 166707392.00 correlation: 0.2487
|
612 |
+
Elapse: 543.78s
|
613 |
+
|
614 |
+
Epoch 095/400
|
615 |
+
Train loss: 70927976.00 correlation: 0.2993
|
616 |
+
Validation loss: 166647504.00 correlation: 0.2491
|
617 |
+
Elapse: 543.94s
|
618 |
+
|
619 |
+
Epoch 096/400
|
620 |
+
Train loss: 70877440.00 correlation: 0.2996
|
621 |
+
Validation loss: 166701728.00 correlation: 0.2486
|
622 |
+
Elapse: 543.45s
|
623 |
+
|
624 |
+
Epoch 097/400
|
625 |
+
Train loss: 70917616.00 correlation: 0.2991
|
626 |
+
Validation loss: 166641920.00 correlation: 0.2492
|
627 |
+
Elapse: 544.10s
|
628 |
+
|
629 |
+
Epoch 098/400
|
630 |
+
Train loss: 70867216.00 correlation: 0.2999
|
631 |
+
Validation loss: 166664160.00 correlation: 0.2492
|
632 |
+
Elapse: 544.30s
|
633 |
+
|
634 |
+
Loaded checkpoint from epoch 93 (correlation: 0.2493).
|
635 |
+
|
636 |
+
Reduce learning rate of core to 3.8880e-05 (num. reduce: 1).
|
637 |
+
Reduce learning rate of readouts to 2.9160e-05 (num. reduce: 1).
|
638 |
+
Reduce learning rate of shifters to 2.9160e-05 (num. reduce: 1).
|
639 |
+
|
640 |
+
Epoch 099/400
|
641 |
+
Train loss: 70901904.00 correlation: 0.2993
|
642 |
+
Validation loss: 166624560.00 correlation: 0.2493
|
643 |
+
Elapse: 544.44s
|
644 |
+
|
645 |
+
Epoch 100/400
|
646 |
+
Train loss: 70815976.00 correlation: 0.3000
|
647 |
+
Validation loss: 166631168.00 correlation: 0.2494
|
648 |
+
Elapse: 544.02s
|
649 |
+
|
650 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
651 |
+
|
652 |
+
Epoch 101/400
|
653 |
+
Train loss: 70876152.00 correlation: 0.2993
|
654 |
+
Validation loss: 166642400.00 correlation: 0.2492
|
655 |
+
Elapse: 544.50s
|
656 |
+
|
657 |
+
Epoch 102/400
|
658 |
+
Train loss: 70783744.00 correlation: 0.3006
|
659 |
+
Validation loss: 166643056.00 correlation: 0.2492
|
660 |
+
Elapse: 544.34s
|
661 |
+
|
662 |
+
Epoch 103/400
|
663 |
+
Train loss: 70822832.00 correlation: 0.3002
|
664 |
+
Validation loss: 166621408.00 correlation: 0.2494
|
665 |
+
Elapse: 544.59s
|
666 |
+
|
667 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
668 |
+
|
669 |
+
Epoch 104/400
|
670 |
+
Train loss: 70795760.00 correlation: 0.3005
|
671 |
+
Validation loss: 166626384.00 correlation: 0.2494
|
672 |
+
Elapse: 544.65s
|
673 |
+
|
674 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
|
675 |
+
|
676 |
+
Epoch 105/400
|
677 |
+
Train loss: 70758416.00 correlation: 0.3004
|
678 |
+
Validation loss: 166603600.00 correlation: 0.2494
|
679 |
+
Elapse: 544.30s
|
680 |
+
|
681 |
+
Epoch 106/400
|
682 |
+
Train loss: 70836856.00 correlation: 0.2999
|
683 |
+
Validation loss: 166631360.00 correlation: 0.2493
|
684 |
+
Elapse: 544.28s
|
685 |
+
|
686 |
+
Epoch 107/400
|
687 |
+
Train loss: 70783560.00 correlation: 0.3006
|
688 |
+
Validation loss: 166638304.00 correlation: 0.2493
|
689 |
+
Elapse: 544.44s
|
690 |
+
|
691 |
+
Epoch 108/400
|
692 |
+
Train loss: 70793304.00 correlation: 0.3004
|
693 |
+
Validation loss: 166632480.00 correlation: 0.2492
|
694 |
+
Elapse: 544.19s
|
695 |
+
|
696 |
+
Epoch 109/400
|
697 |
+
Train loss: 70730064.00 correlation: 0.3012
|
698 |
+
Validation loss: 166617632.00 correlation: 0.2493
|
699 |
+
Elapse: 543.89s
|
700 |
+
|
701 |
+
Loaded checkpoint from epoch 104 (correlation: 0.2494).
|
702 |
+
|
703 |
+
Reduce learning rate of core to 1.1664e-05 (num. reduce: 1).
|
704 |
+
Reduce learning rate of readouts to 8.7480e-06 (num. reduce: 1).
|
705 |
+
Reduce learning rate of shifters to 8.7480e-06 (num. reduce: 1).
|
706 |
+
|
707 |
+
Epoch 110/400
|
708 |
+
Train loss: 70741584.00 correlation: 0.3007
|
709 |
+
Validation loss: 166614400.00 correlation: 0.2493
|
710 |
+
Elapse: 544.26s
|
711 |
+
|
712 |
+
Epoch 111/400
|
713 |
+
Train loss: 70763320.00 correlation: 0.3005
|
714 |
+
Validation loss: 166633072.00 correlation: 0.2493
|
715 |
+
Elapse: 544.57s
|
716 |
+
|
717 |
+
Epoch 112/400
|
718 |
+
Train loss: 70721984.00 correlation: 0.3011
|
719 |
+
Validation loss: 166633552.00 correlation: 0.2493
|
720 |
+
Elapse: 544.64s
|
721 |
+
|
722 |
+
Epoch 113/400
|
723 |
+
Train loss: 70737856.00 correlation: 0.3009
|
724 |
+
Validation loss: 166608208.00 correlation: 0.2494
|
725 |
+
Elapse: 544.39s
|
726 |
+
|
727 |
+
Epoch 114/400
|
728 |
+
Train loss: 70798224.00 correlation: 0.3000
|
729 |
+
Validation loss: 166619792.00 correlation: 0.2494
|
730 |
+
Elapse: 543.95s
|
731 |
+
|
732 |
+
Loaded checkpoint from epoch 104 (correlation: 0.2494).
|
733 |
+
|
734 |
+
Reduce learning rate of core to 3.4992e-06 (num. reduce: 2).
|
735 |
+
Reduce learning rate of readouts to 2.6244e-06 (num. reduce: 2).
|
736 |
+
Reduce learning rate of shifters to 2.6244e-06 (num. reduce: 2).
|
737 |
+
|
738 |
+
Epoch 115/400
|
739 |
+
Train loss: 70736776.00 correlation: 0.3008
|
740 |
+
Validation loss: 166615600.00 correlation: 0.2494
|
741 |
+
Elapse: 544.31s
|
742 |
+
|
743 |
+
Epoch 116/400
|
744 |
+
Train loss: 70760608.00 correlation: 0.3006
|
745 |
+
Validation loss: 166622592.00 correlation: 0.2493
|
746 |
+
Elapse: 544.61s
|
747 |
+
|
748 |
+
Epoch 117/400
|
749 |
+
Train loss: 70707912.00 correlation: 0.3011
|
750 |
+
Validation loss: 166622416.00 correlation: 0.2494
|
751 |
+
Elapse: 544.73s
|
752 |
+
|
753 |
+
Epoch 118/400
|
754 |
+
Train loss: 70797264.00 correlation: 0.3002
|
755 |
+
Validation loss: 166620240.00 correlation: 0.2493
|
756 |
+
Elapse: 545.29s
|
757 |
+
|
758 |
+
Epoch 119/400
|
759 |
+
Train loss: 70782240.00 correlation: 0.3003
|
760 |
+
Validation loss: 166620000.00 correlation: 0.2493
|
761 |
+
Elapse: 544.33s
|
762 |
+
|
763 |
+
Model has not improved after 2 LR reductions.
|
764 |
+
|
765 |
+
Loaded checkpoint from epoch 104 (correlation: 0.2494).
|
766 |
+
|
767 |
+
|
768 |
+
ValidationA: 0.2428 B: 0.2746 C: 0.2716 D: 0.2360 E: 0.2351 F: 0.2335 G: 0.2531 H: 0.2331 I: 0.2568 J: 0.2576 average: 0.2494
|
769 |
+
|
770 |
+
Results saved to /home/storage/runs/vivit_ensemble/015.
|
005/args.yaml
ADDED
@@ -0,0 +1,87 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
adam_beta1: 0.9
|
2 |
+
adam_beta2: 0.999
|
3 |
+
adam_eps: 1e-08
|
4 |
+
batch_size: 6
|
5 |
+
cache_data: false
|
6 |
+
center_crop: 1.0
|
7 |
+
clear_output_dir: true
|
8 |
+
core: vivit
|
9 |
+
core_behavior_mode: 2
|
10 |
+
core_compile: false
|
11 |
+
core_drop_path: 0.0505
|
12 |
+
core_emb_dim: 112
|
13 |
+
core_ff_activation: gelu
|
14 |
+
core_ff_dropout: 0.0592
|
15 |
+
core_flash_attention: 1
|
16 |
+
core_head_dim: 48
|
17 |
+
core_lr: 0.0048
|
18 |
+
core_mha_dropout: 0.358
|
19 |
+
core_mlp_dim: 136
|
20 |
+
core_norm_qk: false
|
21 |
+
core_num_heads: 11
|
22 |
+
core_p_dropout: 0.1338
|
23 |
+
core_parallel_attention: true
|
24 |
+
core_patch_mode: 0
|
25 |
+
core_pos_encoding: 3
|
26 |
+
core_spatial_depth: 3
|
27 |
+
core_spatial_patch_size: 7
|
28 |
+
core_spatial_patch_stride: 2
|
29 |
+
core_temporal_depth: 5
|
30 |
+
core_temporal_patch_size: 25
|
31 |
+
core_temporal_patch_stride: 1
|
32 |
+
core_weight_decay: 0.1789
|
33 |
+
criterion: poisson_correlation
|
34 |
+
critic_mode: 0
|
35 |
+
crop_frame: 140
|
36 |
+
data: /home/sensorium2023
|
37 |
+
deterministic: false
|
38 |
+
device: cuda
|
39 |
+
dpi: 120
|
40 |
+
ds_mode: 3
|
41 |
+
ds_scale: 1
|
42 |
+
epochs: 400
|
43 |
+
format: svg
|
44 |
+
git_hash: 3cd580b
|
45 |
+
grad_checkpointing: 0
|
46 |
+
grad_norm: null
|
47 |
+
input_shapes:
|
48 |
+
behavior: [2, 140]
|
49 |
+
pupil_center: [2, 140]
|
50 |
+
video: [1, 140, 36, 64]
|
51 |
+
limit_data: null
|
52 |
+
lr: 0.0036
|
53 |
+
max_frame: 300
|
54 |
+
micro_batch_size: 6
|
55 |
+
modulator_mode: 0
|
56 |
+
mouse_ids: [A, B, C, D, E, F, G, H, I, J]
|
57 |
+
num_workers: 2
|
58 |
+
output_dir: /home/storage/runs/005
|
59 |
+
output_mode: 1
|
60 |
+
output_shapes:
|
61 |
+
A: [7440, 140]
|
62 |
+
B: [7928, 140]
|
63 |
+
C: [8285, 140]
|
64 |
+
D: [7671, 140]
|
65 |
+
E: [7495, 140]
|
66 |
+
F: [7863, 140]
|
67 |
+
G: [7908, 140]
|
68 |
+
H: [8202, 140]
|
69 |
+
I: [7939, 140]
|
70 |
+
J: [8122, 140]
|
71 |
+
precision: "32"
|
72 |
+
pretrain_core: null
|
73 |
+
readout: gaussian2d
|
74 |
+
readout_bias_mode: 2
|
75 |
+
readout_dropout: 0.0
|
76 |
+
readout_grid_mode: 1
|
77 |
+
restore: null
|
78 |
+
save_plots: false
|
79 |
+
seed: 28
|
80 |
+
shifter_layers: 3
|
81 |
+
shifter_mode: 1
|
82 |
+
shifter_size: 5
|
83 |
+
stat_mode: 1
|
84 |
+
trainable_params: 12278365
|
85 |
+
transform_mode: 2
|
86 |
+
verbose: 1
|
87 |
+
weight_decay: 0.3939
|
005/ckpt/model_state.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f8586d53aa03f24b6b533d7a172c6c33aefaf02e346d810dbb171fcf6202e2b
|
3 |
+
size 148268583
|
005/evaluation.yaml
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
validation: {A: 0.2465260773897171, B: 0.27831149101257324, C: 0.2688469886779785,
|
2 |
+
D: 0.22918999195098877, E: 0.23662497103214264, F: 0.2340845912694931, G: 0.254902184009552,
|
3 |
+
H: 0.23301741480827332, I: 0.25673478841781616, J: 0.2570823132991791, average: 0.2495320811867714}
|
005/model.txt
ADDED
@@ -0,0 +1,143 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
=======================================================================================================================================
|
2 |
+
Layer (type:depth-idx) Input Shape Output Shape Param #
|
3 |
+
=======================================================================================================================================
|
4 |
+
Model -- [1, 7440, 116] --
|
5 |
+
├─ViViTCore: 1-1 -- [1, 112, 116, 15, 29] --
|
6 |
+
│ └─ViViT: 2-1 [1, 5, 140, 36, 64] [1, 112, 116, 15, 29] --
|
7 |
+
│ │ └─Tokenizer: 3-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] 79,632
|
8 |
+
│ │ │ └─Sequential: 4-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] --
|
9 |
+
│ │ │ │ └─Unfold3d: 5-1 [1, 5, 140, 36, 64] [1, 116, 435, 6125] --
|
10 |
+
│ │ │ │ └─LayerNorm: 5-2 [1, 116, 435, 6125] [1, 116, 435, 6125] 12,250
|
11 |
+
│ │ │ │ └─Linear: 5-3 [1, 116, 435, 6125] [1, 116, 435, 112] 686,112
|
12 |
+
│ │ │ │ └─LayerNorm: 5-4 [1, 116, 435, 112] [1, 116, 435, 112] 224
|
13 |
+
│ │ │ │ └─Dropout: 5-5 [1, 116, 435, 112] [1, 116, 435, 112] --
|
14 |
+
│ │ └─Transformer: 3-2 [116, 435, 112] [116, 435, 112] --
|
15 |
+
│ │ │ └─ModuleList: 4-2 -- -- --
|
16 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-6 [116, 435, 112] [116, 435, 112] --
|
17 |
+
│ │ │ │ │ └─LayerNorm: 6-1 [116, 435, 112] [116, 435, 112] 224
|
18 |
+
│ │ │ │ │ └─Linear: 6-2 [116, 435, 112] [116, 435, 1720] 192,640
|
19 |
+
│ │ │ │ │ └─Linear: 6-3 [116, 435, 528] [116, 435, 112] 59,136
|
20 |
+
│ │ │ │ │ └─DropPath: 6-4 [116, 435, 112] [116, 435, 112] --
|
21 |
+
│ │ │ │ │ └─Sequential: 6-5 [116, 435, 136] [116, 435, 112] --
|
22 |
+
│ │ │ │ │ │ └─GELU: 7-1 [116, 435, 136] [116, 435, 136] --
|
23 |
+
│ │ │ │ │ │ └─Dropout: 7-2 [116, 435, 136] [116, 435, 136] --
|
24 |
+
│ │ │ │ │ │ └─Linear: 7-3 [116, 435, 136] [116, 435, 112] 15,232
|
25 |
+
│ │ │ │ │ └─DropPath: 6-6 [116, 435, 112] [116, 435, 112] --
|
26 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-7 [116, 435, 112] [116, 435, 112] --
|
27 |
+
│ │ │ │ │ └─LayerNorm: 6-7 [116, 435, 112] [116, 435, 112] 224
|
28 |
+
│ │ │ │ │ └─Linear: 6-8 [116, 435, 112] [116, 435, 1720] 192,640
|
29 |
+
│ │ │ │ │ └─Linear: 6-9 [116, 435, 528] [116, 435, 112] 59,136
|
30 |
+
│ │ │ │ │ └─DropPath: 6-10 [116, 435, 112] [116, 435, 112] --
|
31 |
+
│ │ │ │ │ └─Sequential: 6-11 [116, 435, 136] [116, 435, 112] --
|
32 |
+
│ │ │ │ │ │ └─GELU: 7-4 [116, 435, 136] [116, 435, 136] --
|
33 |
+
│ │ │ │ │ │ └─Dropout: 7-5 [116, 435, 136] [116, 435, 136] --
|
34 |
+
│ │ │ │ │ │ └─Linear: 7-6 [116, 435, 136] [116, 435, 112] 15,232
|
35 |
+
│ │ │ │ │ └─DropPath: 6-12 [116, 435, 112] [116, 435, 112] --
|
36 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-8 [116, 435, 112] [116, 435, 112] --
|
37 |
+
│ │ │ │ │ └─LayerNorm: 6-13 [116, 435, 112] [116, 435, 112] 224
|
38 |
+
│ │ │ │ │ └─Linear: 6-14 [116, 435, 112] [116, 435, 1720] 192,640
|
39 |
+
│ │ │ │ │ └─Linear: 6-15 [116, 435, 528] [116, 435, 112] 59,136
|
40 |
+
│ │ │ │ │ └─DropPath: 6-16 [116, 435, 112] [116, 435, 112] --
|
41 |
+
│ │ │ │ │ └─Sequential: 6-17 [116, 435, 136] [116, 435, 112] --
|
42 |
+
│ │ │ │ │ │ └─GELU: 7-7 [116, 435, 136] [116, 435, 136] --
|
43 |
+
│ │ │ │ │ │ └─Dropout: 7-8 [116, 435, 136] [116, 435, 136] --
|
44 |
+
│ │ │ │ │ │ └─Linear: 7-9 [116, 435, 136] [116, 435, 112] 15,232
|
45 |
+
│ │ │ │ │ └─DropPath: 6-18 [116, 435, 112] [116, 435, 112] --
|
46 |
+
│ │ └─Transformer: 3-3 [435, 116, 112] [435, 116, 112] --
|
47 |
+
│ │ │ └─ModuleList: 4-3 -- -- --
|
48 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-9 [435, 116, 112] [435, 116, 112] --
|
49 |
+
│ │ │ │ │ └─LayerNorm: 6-19 [435, 116, 112] [435, 116, 112] 224
|
50 |
+
│ │ │ │ │ └─Linear: 6-20 [435, 116, 112] [435, 116, 1720] 192,640
|
51 |
+
│ │ │ │ │ └─Linear: 6-21 [435, 116, 528] [435, 116, 112] 59,136
|
52 |
+
│ │ │ │ │ └─DropPath: 6-22 [435, 116, 112] [435, 116, 112] --
|
53 |
+
│ │ │ │ │ └─Sequential: 6-23 [435, 116, 136] [435, 116, 112] --
|
54 |
+
│ │ │ │ │ │ └─GELU: 7-10 [435, 116, 136] [435, 116, 136] --
|
55 |
+
│ │ │ │ │ │ └─Dropout: 7-11 [435, 116, 136] [435, 116, 136] --
|
56 |
+
│ │ │ │ │ │ └─Linear: 7-12 [435, 116, 136] [435, 116, 112] 15,232
|
57 |
+
│ │ │ │ │ └─DropPath: 6-24 [435, 116, 112] [435, 116, 112] --
|
58 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-10 [435, 116, 112] [435, 116, 112] --
|
59 |
+
│ │ │ │ │ └─LayerNorm: 6-25 [435, 116, 112] [435, 116, 112] 224
|
60 |
+
│ │ │ │ │ └─Linear: 6-26 [435, 116, 112] [435, 116, 1720] 192,640
|
61 |
+
│ │ │ │ │ └─Linear: 6-27 [435, 116, 528] [435, 116, 112] 59,136
|
62 |
+
│ │ │ │ │ └─DropPath: 6-28 [435, 116, 112] [435, 116, 112] --
|
63 |
+
│ │ │ │ │ └─Sequential: 6-29 [435, 116, 136] [435, 116, 112] --
|
64 |
+
│ │ │ │ │ │ └─GELU: 7-13 [435, 116, 136] [435, 116, 136] --
|
65 |
+
│ │ │ │ │ │ └─Dropout: 7-14 [435, 116, 136] [435, 116, 136] --
|
66 |
+
│ │ │ │ │ │ └─Linear: 7-15 [435, 116, 136] [435, 116, 112] 15,232
|
67 |
+
│ │ │ │ │ └─DropPath: 6-30 [435, 116, 112] [435, 116, 112] --
|
68 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-11 [435, 116, 112] [435, 116, 112] --
|
69 |
+
│ │ │ │ │ └─LayerNorm: 6-31 [435, 116, 112] [435, 116, 112] 224
|
70 |
+
│ │ │ │ │ └─Linear: 6-32 [435, 116, 112] [435, 116, 1720] 192,640
|
71 |
+
│ │ │ │ │ └─Linear: 6-33 [435, 116, 528] [435, 116, 112] 59,136
|
72 |
+
│ │ │ │ │ └─DropPath: 6-34 [435, 116, 112] [435, 116, 112] --
|
73 |
+
│ │ │ │ │ └─Sequential: 6-35 [435, 116, 136] [435, 116, 112] --
|
74 |
+
│ │ │ │ │ │ └─GELU: 7-16 [435, 116, 136] [435, 116, 136] --
|
75 |
+
│ │ │ │ │ │ └─Dropout: 7-17 [435, 116, 136] [435, 116, 136] --
|
76 |
+
│ │ │ │ │ │ └─Linear: 7-18 [435, 116, 136] [435, 116, 112] 15,232
|
77 |
+
│ │ │ │ │ └─DropPath: 6-36 [435, 116, 112] [435, 116, 112] --
|
78 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-12 [435, 116, 112] [435, 116, 112] --
|
79 |
+
│ │ │ │ │ └─LayerNorm: 6-37 [435, 116, 112] [435, 116, 112] 224
|
80 |
+
│ │ │ │ │ └─Linear: 6-38 [435, 116, 112] [435, 116, 1720] 192,640
|
81 |
+
│ │ │ │ │ └─Linear: 6-39 [435, 116, 528] [435, 116, 112] 59,136
|
82 |
+
│ │ │ │ │ └─DropPath: 6-40 [435, 116, 112] [435, 116, 112] --
|
83 |
+
│ │ │ │ │ └─Sequential: 6-41 [435, 116, 136] [435, 116, 112] --
|
84 |
+
│ │ │ │ │ │ └─GELU: 7-19 [435, 116, 136] [435, 116, 136] --
|
85 |
+
│ │ │ │ │ │ └─Dropout: 7-20 [435, 116, 136] [435, 116, 136] --
|
86 |
+
│ │ │ │ │ │ └─Linear: 7-21 [435, 116, 136] [435, 116, 112] 15,232
|
87 |
+
│ │ │ │ │ └─DropPath: 6-42 [435, 116, 112] [435, 116, 112] --
|
88 |
+
│ │ │ │ └─ParallelTransformerBlock: 5-13 [435, 116, 112] [435, 116, 112] --
|
89 |
+
│ │ │ │ │ └─LayerNorm: 6-43 [435, 116, 112] [435, 116, 112] 224
|
90 |
+
│ │ │ │ │ └─Linear: 6-44 [435, 116, 112] [435, 116, 1720] 192,640
|
91 |
+
│ │ │ │ │ └─Linear: 6-45 [435, 116, 528] [435, 116, 112] 59,136
|
92 |
+
│ │ │ │ │ └─DropPath: 6-46 [435, 116, 112] [435, 116, 112] --
|
93 |
+
│ │ │ │ │ └─Sequential: 6-47 [435, 116, 136] [435, 116, 112] --
|
94 |
+
│ │ │ │ │ │ └─GELU: 7-22 [435, 116, 136] [435, 116, 136] --
|
95 |
+
│ │ │ │ │ │ └─Dropout: 7-23 [435, 116, 136] [435, 116, 136] --
|
96 |
+
│ │ │ │ │ │ └─Linear: 7-24 [435, 116, 136] [435, 116, 112] 15,232
|
97 |
+
│ │ │ │ │ └─DropPath: 6-48 [435, 116, 112] [435, 116, 112] --
|
98 |
+
│ │ └─Rearrange: 3-4 [1, 116, 435, 112] [1, 112, 116, 15, 29] --
|
99 |
+
├─MLPShifters: 1-2 -- [1, 2, 116] 513
|
100 |
+
│ └─MLPShifter: 2-2 [116, 2] [116, 2] --
|
101 |
+
│ │ └─Sequential: 3-5 [116, 2] [116, 2] --
|
102 |
+
│ │ │ └─Linear: 4-4 [116, 2] [116, 5] 15
|
103 |
+
│ │ │ └─Tanh: 4-5 [116, 5] [116, 5] --
|
104 |
+
│ │ │ └─Linear: 4-6 [116, 5] [116, 5] 30
|
105 |
+
│ │ │ └─Tanh: 4-7 [116, 5] [116, 5] --
|
106 |
+
│ │ │ └─Linear: 4-8 [116, 5] [116, 2] 12
|
107 |
+
│ │ │ └─Tanh: 4-9 [116, 2] [116, 2] --
|
108 |
+
├─Readouts: 1-3 [1, 112, 116, 15, 29] [1, 7440, 116] 8,477,649
|
109 |
+
│ └─Gaussian2DReadout2: 2-3 [1, 112, 116, 15, 29] [1, 7440, 116] 870,480
|
110 |
+
│ │ └─Sequential: 3-6 [7440, 2] [7440, 2] --
|
111 |
+
│ │ │ └─Linear: 4-10 [7440, 2] [7440, 30] 90
|
112 |
+
│ │ │ └─ELU: 4-11 [7440, 30] [7440, 30] --
|
113 |
+
│ │ │ └─Linear: 4-12 [7440, 30] [7440, 2] 62
|
114 |
+
│ │ │ └─Tanh: 4-13 [7440, 2] [7440, 2] --
|
115 |
+
│ │ └─Sequential: 3-7 [7440, 2] [7440, 2] (recursive)
|
116 |
+
│ │ │ └─Linear: 4-14 [7440, 2] [7440, 30] (recursive)
|
117 |
+
│ │ │ └─ELU: 4-15 [7440, 30] [7440, 30] --
|
118 |
+
│ │ │ └─Linear: 4-16 [7440, 30] [7440, 2] (recursive)
|
119 |
+
│ │ │ └─Tanh: 4-17 [7440, 2] [7440, 2] --
|
120 |
+
│ │ └─Sequential: 3-8 [7440, 2] [7440, 2] (recursive)
|
121 |
+
│ │ │ └─Linear: 4-18 [7440, 2] [7440, 30] (recursive)
|
122 |
+
│ │ │ └─ELU: 4-19 [7440, 30] [7440, 30] --
|
123 |
+
│ │ │ └─Linear: 4-20 [7440, 30] [7440, 2] (recursive)
|
124 |
+
│ │ │ └─Tanh: 4-21 [7440, 2] [7440, 2] --
|
125 |
+
│ │ └─Sequential: 3-9 [116, 4] [116, 112] --
|
126 |
+
│ │ │ └─Linear: 4-22 [116, 4] [116, 112] 560
|
127 |
+
│ │ │ └─LayerNorm: 4-23 [116, 112] [116, 112] 224
|
128 |
+
│ │ │ └─GELU: 4-24 [116, 112] [116, 112] --
|
129 |
+
│ │ │ └─Dropout: 4-25 [116, 112] [116, 112] --
|
130 |
+
│ │ │ └─Linear: 4-26 [116, 112] [116, 112] 12,656
|
131 |
+
│ │ │ └─Tanh: 4-27 [116, 112] [116, 112] --
|
132 |
+
├─Exponential: 1-4 [1, 7440, 116] [1, 7440, 116] --
|
133 |
+
=======================================================================================================================================
|
134 |
+
Total params: 12,278,365
|
135 |
+
Trainable params: 12,278,365
|
136 |
+
Non-trainable params: 0
|
137 |
+
Total mult-adds (Units.MEGABYTES): 679.88
|
138 |
+
=======================================================================================================================================
|
139 |
+
Input size (MB): 1.29
|
140 |
+
Forward/backward pass size (MB): 9208.73
|
141 |
+
Params size (MB): 11.40
|
142 |
+
Estimated Total Size (MB): 9221.42
|
143 |
+
=======================================================================================================================================
|
005/output.log
ADDED
@@ -0,0 +1,822 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Use bfloat16 for core module.
|
2 |
+
Use parallel attention and MLP in ViViT.
|
3 |
+
|
4 |
+
Epoch 001/400
|
5 |
+
Train loss: 111647336.00 correlation: 0.0122
|
6 |
+
Validation loss: 200300080.00 correlation: 0.0267
|
7 |
+
Elapse: 537.13s
|
8 |
+
|
9 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
10 |
+
|
11 |
+
Epoch 002/400
|
12 |
+
Train loss: 97648256.00 correlation: 0.0367
|
13 |
+
Validation loss: 199289632.00 correlation: 0.0355
|
14 |
+
Elapse: 539.72s
|
15 |
+
|
16 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
17 |
+
|
18 |
+
Epoch 003/400
|
19 |
+
Train loss: 96321792.00 correlation: 0.0500
|
20 |
+
Validation loss: 198299696.00 correlation: 0.0446
|
21 |
+
Elapse: 548.37s
|
22 |
+
|
23 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
24 |
+
|
25 |
+
Epoch 004/400
|
26 |
+
Train loss: 95213544.00 correlation: 0.0617
|
27 |
+
Validation loss: 196983504.00 correlation: 0.0527
|
28 |
+
Elapse: 552.04s
|
29 |
+
|
30 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
31 |
+
|
32 |
+
Epoch 005/400
|
33 |
+
Train loss: 93915056.00 correlation: 0.0756
|
34 |
+
Validation loss: 195022704.00 correlation: 0.0660
|
35 |
+
Elapse: 551.29s
|
36 |
+
|
37 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
38 |
+
|
39 |
+
Epoch 006/400
|
40 |
+
Train loss: 92500376.00 correlation: 0.0909
|
41 |
+
Validation loss: 193045536.00 correlation: 0.0815
|
42 |
+
Elapse: 549.45s
|
43 |
+
|
44 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
45 |
+
|
46 |
+
Epoch 007/400
|
47 |
+
Train loss: 91511136.00 correlation: 0.1012
|
48 |
+
Validation loss: 191545056.00 correlation: 0.0905
|
49 |
+
Elapse: 547.11s
|
50 |
+
|
51 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
52 |
+
|
53 |
+
Epoch 008/400
|
54 |
+
Train loss: 90428944.00 correlation: 0.1113
|
55 |
+
Validation loss: 189976016.00 correlation: 0.0998
|
56 |
+
Elapse: 544.76s
|
57 |
+
|
58 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
59 |
+
|
60 |
+
Epoch 009/400
|
61 |
+
Train loss: 89301664.00 correlation: 0.1228
|
62 |
+
Validation loss: 188514336.00 correlation: 0.1074
|
63 |
+
Elapse: 541.79s
|
64 |
+
|
65 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
66 |
+
|
67 |
+
Epoch 010/400
|
68 |
+
Train loss: 88238616.00 correlation: 0.1335
|
69 |
+
Validation loss: 186730592.00 correlation: 0.1194
|
70 |
+
Elapse: 540.44s
|
71 |
+
|
72 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
73 |
+
|
74 |
+
Epoch 011/400
|
75 |
+
Train loss: 87239336.00 correlation: 0.1436
|
76 |
+
Validation loss: 185287104.00 correlation: 0.1296
|
77 |
+
Elapse: 539.71s
|
78 |
+
|
79 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
80 |
+
|
81 |
+
Epoch 012/400
|
82 |
+
Train loss: 86205256.00 correlation: 0.1540
|
83 |
+
Validation loss: 183237792.00 correlation: 0.1419
|
84 |
+
Elapse: 540.02s
|
85 |
+
|
86 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
87 |
+
|
88 |
+
Epoch 013/400
|
89 |
+
Train loss: 85068472.00 correlation: 0.1655
|
90 |
+
Validation loss: 181721296.00 correlation: 0.1515
|
91 |
+
Elapse: 539.81s
|
92 |
+
|
93 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
94 |
+
|
95 |
+
Epoch 014/400
|
96 |
+
Train loss: 84160560.00 correlation: 0.1745
|
97 |
+
Validation loss: 180469664.00 correlation: 0.1595
|
98 |
+
Elapse: 540.34s
|
99 |
+
|
100 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
101 |
+
|
102 |
+
Epoch 015/400
|
103 |
+
Train loss: 83386128.00 correlation: 0.1821
|
104 |
+
Validation loss: 179517792.00 correlation: 0.1658
|
105 |
+
Elapse: 540.81s
|
106 |
+
|
107 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
108 |
+
|
109 |
+
Epoch 016/400
|
110 |
+
Train loss: 82805200.00 correlation: 0.1877
|
111 |
+
Validation loss: 178801584.00 correlation: 0.1698
|
112 |
+
Elapse: 540.70s
|
113 |
+
|
114 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
115 |
+
|
116 |
+
Epoch 017/400
|
117 |
+
Train loss: 82275736.00 correlation: 0.1926
|
118 |
+
Validation loss: 177842080.00 correlation: 0.1761
|
119 |
+
Elapse: 540.76s
|
120 |
+
|
121 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
122 |
+
|
123 |
+
Epoch 018/400
|
124 |
+
Train loss: 81662840.00 correlation: 0.1987
|
125 |
+
Validation loss: 176971248.00 correlation: 0.1820
|
126 |
+
Elapse: 541.07s
|
127 |
+
|
128 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
129 |
+
|
130 |
+
Epoch 019/400
|
131 |
+
Train loss: 81147088.00 correlation: 0.2038
|
132 |
+
Validation loss: 176423600.00 correlation: 0.1858
|
133 |
+
Elapse: 541.20s
|
134 |
+
|
135 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
136 |
+
|
137 |
+
Epoch 020/400
|
138 |
+
Train loss: 80748784.00 correlation: 0.2079
|
139 |
+
Validation loss: 175690976.00 correlation: 0.1908
|
140 |
+
Elapse: 541.22s
|
141 |
+
|
142 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
143 |
+
|
144 |
+
Epoch 021/400
|
145 |
+
Train loss: 80313880.00 correlation: 0.2122
|
146 |
+
Validation loss: 175389216.00 correlation: 0.1929
|
147 |
+
Elapse: 540.65s
|
148 |
+
|
149 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
150 |
+
|
151 |
+
Epoch 022/400
|
152 |
+
Train loss: 79957744.00 correlation: 0.2153
|
153 |
+
Validation loss: 174862864.00 correlation: 0.1968
|
154 |
+
Elapse: 540.96s
|
155 |
+
|
156 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
157 |
+
|
158 |
+
Epoch 023/400
|
159 |
+
Train loss: 79621360.00 correlation: 0.2186
|
160 |
+
Validation loss: 174437632.00 correlation: 0.1996
|
161 |
+
Elapse: 541.11s
|
162 |
+
|
163 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
164 |
+
|
165 |
+
Epoch 024/400
|
166 |
+
Train loss: 79374368.00 correlation: 0.2211
|
167 |
+
Validation loss: 173783968.00 correlation: 0.2031
|
168 |
+
Elapse: 542.03s
|
169 |
+
|
170 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
171 |
+
|
172 |
+
Epoch 025/400
|
173 |
+
Train loss: 79085072.00 correlation: 0.2240
|
174 |
+
Validation loss: 173357520.00 correlation: 0.2059
|
175 |
+
Elapse: 541.66s
|
176 |
+
|
177 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
178 |
+
|
179 |
+
Epoch 026/400
|
180 |
+
Train loss: 78723728.00 correlation: 0.2273
|
181 |
+
Validation loss: 173125120.00 correlation: 0.2087
|
182 |
+
Elapse: 542.13s
|
183 |
+
|
184 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
185 |
+
|
186 |
+
Epoch 027/400
|
187 |
+
Train loss: 78456624.00 correlation: 0.2299
|
188 |
+
Validation loss: 172740432.00 correlation: 0.2102
|
189 |
+
Elapse: 541.72s
|
190 |
+
|
191 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
192 |
+
|
193 |
+
Epoch 028/400
|
194 |
+
Train loss: 78264240.00 correlation: 0.2316
|
195 |
+
Validation loss: 172426416.00 correlation: 0.2125
|
196 |
+
Elapse: 541.90s
|
197 |
+
|
198 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
199 |
+
|
200 |
+
Epoch 029/400
|
201 |
+
Train loss: 78095968.00 correlation: 0.2335
|
202 |
+
Validation loss: 172338688.00 correlation: 0.2139
|
203 |
+
Elapse: 542.04s
|
204 |
+
|
205 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
206 |
+
|
207 |
+
Epoch 030/400
|
208 |
+
Train loss: 77880056.00 correlation: 0.2357
|
209 |
+
Validation loss: 171972944.00 correlation: 0.2151
|
210 |
+
Elapse: 541.96s
|
211 |
+
|
212 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
213 |
+
|
214 |
+
Epoch 031/400
|
215 |
+
Train loss: 77782920.00 correlation: 0.2367
|
216 |
+
Validation loss: 171662176.00 correlation: 0.2171
|
217 |
+
Elapse: 542.59s
|
218 |
+
|
219 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
220 |
+
|
221 |
+
Epoch 032/400
|
222 |
+
Train loss: 77596272.00 correlation: 0.2382
|
223 |
+
Validation loss: 171484624.00 correlation: 0.2187
|
224 |
+
Elapse: 543.51s
|
225 |
+
|
226 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
227 |
+
|
228 |
+
Epoch 033/400
|
229 |
+
Train loss: 77378984.00 correlation: 0.2403
|
230 |
+
Validation loss: 171180896.00 correlation: 0.2208
|
231 |
+
Elapse: 542.09s
|
232 |
+
|
233 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
234 |
+
|
235 |
+
Epoch 034/400
|
236 |
+
Train loss: 77329272.00 correlation: 0.2411
|
237 |
+
Validation loss: 171382000.00 correlation: 0.2191
|
238 |
+
Elapse: 541.49s
|
239 |
+
|
240 |
+
Epoch 035/400
|
241 |
+
Train loss: 77173400.00 correlation: 0.2426
|
242 |
+
Validation loss: 170990288.00 correlation: 0.2215
|
243 |
+
Elapse: 542.22s
|
244 |
+
|
245 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
246 |
+
|
247 |
+
Epoch 036/400
|
248 |
+
Train loss: 77103352.00 correlation: 0.2430
|
249 |
+
Validation loss: 171064224.00 correlation: 0.2212
|
250 |
+
Elapse: 542.85s
|
251 |
+
|
252 |
+
Epoch 037/400
|
253 |
+
Train loss: 76961264.00 correlation: 0.2447
|
254 |
+
Validation loss: 170693952.00 correlation: 0.2239
|
255 |
+
Elapse: 542.80s
|
256 |
+
|
257 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
258 |
+
|
259 |
+
Epoch 038/400
|
260 |
+
Train loss: 76838424.00 correlation: 0.2456
|
261 |
+
Validation loss: 170481408.00 correlation: 0.2246
|
262 |
+
Elapse: 542.40s
|
263 |
+
|
264 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
265 |
+
|
266 |
+
Epoch 039/400
|
267 |
+
Train loss: 76726736.00 correlation: 0.2469
|
268 |
+
Validation loss: 170405888.00 correlation: 0.2257
|
269 |
+
Elapse: 541.86s
|
270 |
+
|
271 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
272 |
+
|
273 |
+
Epoch 040/400
|
274 |
+
Train loss: 76625736.00 correlation: 0.2481
|
275 |
+
Validation loss: 170183216.00 correlation: 0.2271
|
276 |
+
Elapse: 542.67s
|
277 |
+
|
278 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
279 |
+
|
280 |
+
Epoch 041/400
|
281 |
+
Train loss: 76633712.00 correlation: 0.2477
|
282 |
+
Validation loss: 170194400.00 correlation: 0.2270
|
283 |
+
Elapse: 542.30s
|
284 |
+
|
285 |
+
Epoch 042/400
|
286 |
+
Train loss: 76442136.00 correlation: 0.2493
|
287 |
+
Validation loss: 170452384.00 correlation: 0.2263
|
288 |
+
Elapse: 542.26s
|
289 |
+
|
290 |
+
Epoch 043/400
|
291 |
+
Train loss: 76492200.00 correlation: 0.2491
|
292 |
+
Validation loss: 170249952.00 correlation: 0.2260
|
293 |
+
Elapse: 542.10s
|
294 |
+
|
295 |
+
Epoch 044/400
|
296 |
+
Train loss: 76279480.00 correlation: 0.2510
|
297 |
+
Validation loss: 169784496.00 correlation: 0.2295
|
298 |
+
Elapse: 541.77s
|
299 |
+
|
300 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
301 |
+
|
302 |
+
Epoch 045/400
|
303 |
+
Train loss: 76193080.00 correlation: 0.2520
|
304 |
+
Validation loss: 169944928.00 correlation: 0.2278
|
305 |
+
Elapse: 542.23s
|
306 |
+
|
307 |
+
Epoch 046/400
|
308 |
+
Train loss: 76107936.00 correlation: 0.2526
|
309 |
+
Validation loss: 169860016.00 correlation: 0.2283
|
310 |
+
Elapse: 542.90s
|
311 |
+
|
312 |
+
Epoch 047/400
|
313 |
+
Train loss: 76111024.00 correlation: 0.2527
|
314 |
+
Validation loss: 169548304.00 correlation: 0.2308
|
315 |
+
Elapse: 541.89s
|
316 |
+
|
317 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
318 |
+
|
319 |
+
Epoch 048/400
|
320 |
+
Train loss: 76049672.00 correlation: 0.2534
|
321 |
+
Validation loss: 169801264.00 correlation: 0.2296
|
322 |
+
Elapse: 543.95s
|
323 |
+
|
324 |
+
Epoch 049/400
|
325 |
+
Train loss: 75997232.00 correlation: 0.2537
|
326 |
+
Validation loss: 169721248.00 correlation: 0.2301
|
327 |
+
Elapse: 543.00s
|
328 |
+
|
329 |
+
Epoch 050/400
|
330 |
+
Train loss: 75961488.00 correlation: 0.2545
|
331 |
+
Validation loss: 169722912.00 correlation: 0.2293
|
332 |
+
Elapse: 542.91s
|
333 |
+
|
334 |
+
Epoch 051/400
|
335 |
+
Train loss: 75908376.00 correlation: 0.2548
|
336 |
+
Validation loss: 169474704.00 correlation: 0.2310
|
337 |
+
Elapse: 542.56s
|
338 |
+
|
339 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
340 |
+
|
341 |
+
Epoch 052/400
|
342 |
+
Train loss: 75771856.00 correlation: 0.2561
|
343 |
+
Validation loss: 170132720.00 correlation: 0.2272
|
344 |
+
Elapse: 542.05s
|
345 |
+
|
346 |
+
Epoch 053/400
|
347 |
+
Train loss: 75913696.00 correlation: 0.2547
|
348 |
+
Validation loss: 169491888.00 correlation: 0.2309
|
349 |
+
Elapse: 542.57s
|
350 |
+
|
351 |
+
Epoch 054/400
|
352 |
+
Train loss: 75764272.00 correlation: 0.2560
|
353 |
+
Validation loss: 169266704.00 correlation: 0.2330
|
354 |
+
Elapse: 542.91s
|
355 |
+
|
356 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
357 |
+
|
358 |
+
Epoch 055/400
|
359 |
+
Train loss: 75670816.00 correlation: 0.2569
|
360 |
+
Validation loss: 169200320.00 correlation: 0.2327
|
361 |
+
Elapse: 542.21s
|
362 |
+
|
363 |
+
Epoch 056/400
|
364 |
+
Train loss: 75680240.00 correlation: 0.2570
|
365 |
+
Validation loss: 169253344.00 correlation: 0.2322
|
366 |
+
Elapse: 542.73s
|
367 |
+
|
368 |
+
Epoch 057/400
|
369 |
+
Train loss: 75623792.00 correlation: 0.2573
|
370 |
+
Validation loss: 169158704.00 correlation: 0.2336
|
371 |
+
Elapse: 544.29s
|
372 |
+
|
373 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
374 |
+
|
375 |
+
Epoch 058/400
|
376 |
+
Train loss: 75518968.00 correlation: 0.2584
|
377 |
+
Validation loss: 169124832.00 correlation: 0.2339
|
378 |
+
Elapse: 542.64s
|
379 |
+
|
380 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
381 |
+
|
382 |
+
Epoch 059/400
|
383 |
+
Train loss: 75452928.00 correlation: 0.2591
|
384 |
+
Validation loss: 169483008.00 correlation: 0.2320
|
385 |
+
Elapse: 542.34s
|
386 |
+
|
387 |
+
Epoch 060/400
|
388 |
+
Train loss: 75478992.00 correlation: 0.2590
|
389 |
+
Validation loss: 169223728.00 correlation: 0.2337
|
390 |
+
Elapse: 543.01s
|
391 |
+
|
392 |
+
Epoch 061/400
|
393 |
+
Train loss: 75414704.00 correlation: 0.2597
|
394 |
+
Validation loss: 169588672.00 correlation: 0.2307
|
395 |
+
Elapse: 542.79s
|
396 |
+
|
397 |
+
Epoch 062/400
|
398 |
+
Train loss: 75631880.00 correlation: 0.2578
|
399 |
+
Validation loss: 169325440.00 correlation: 0.2326
|
400 |
+
Elapse: 543.75s
|
401 |
+
|
402 |
+
Epoch 063/400
|
403 |
+
Train loss: 75359640.00 correlation: 0.2602
|
404 |
+
Validation loss: 169091040.00 correlation: 0.2339
|
405 |
+
Elapse: 543.16s
|
406 |
+
|
407 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
408 |
+
|
409 |
+
Epoch 064/400
|
410 |
+
Train loss: 75319080.00 correlation: 0.2605
|
411 |
+
Validation loss: 169416560.00 correlation: 0.2321
|
412 |
+
Elapse: 543.52s
|
413 |
+
|
414 |
+
Epoch 065/400
|
415 |
+
Train loss: 75306104.00 correlation: 0.2609
|
416 |
+
Validation loss: 169176224.00 correlation: 0.2331
|
417 |
+
Elapse: 542.80s
|
418 |
+
|
419 |
+
Epoch 066/400
|
420 |
+
Train loss: 75301592.00 correlation: 0.2609
|
421 |
+
Validation loss: 169371616.00 correlation: 0.2327
|
422 |
+
Elapse: 543.10s
|
423 |
+
|
424 |
+
Epoch 067/400
|
425 |
+
Train loss: 75389672.00 correlation: 0.2601
|
426 |
+
Validation loss: 169169312.00 correlation: 0.2332
|
427 |
+
Elapse: 544.11s
|
428 |
+
|
429 |
+
Epoch 068/400
|
430 |
+
Train loss: 75361008.00 correlation: 0.2604
|
431 |
+
Validation loss: 169366960.00 correlation: 0.2315
|
432 |
+
Elapse: 543.42s
|
433 |
+
|
434 |
+
Loaded checkpoint from epoch 63 (correlation: 0.2339).
|
435 |
+
|
436 |
+
Reduce learning rate of core to 1.4400e-03 (num. reduce: 1).
|
437 |
+
Reduce learning rate of readouts to 1.0800e-03 (num. reduce: 1).
|
438 |
+
Reduce learning rate of shifters to 1.0800e-03 (num. reduce: 1).
|
439 |
+
|
440 |
+
Epoch 069/400
|
441 |
+
Train loss: 73278464.00 correlation: 0.2784
|
442 |
+
Validation loss: 167482848.00 correlation: 0.2447
|
443 |
+
Elapse: 544.59s
|
444 |
+
|
445 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
446 |
+
|
447 |
+
Epoch 070/400
|
448 |
+
Train loss: 72562424.00 correlation: 0.2849
|
449 |
+
Validation loss: 167277872.00 correlation: 0.2456
|
450 |
+
Elapse: 544.90s
|
451 |
+
|
452 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
453 |
+
|
454 |
+
Epoch 071/400
|
455 |
+
Train loss: 72429480.00 correlation: 0.2862
|
456 |
+
Validation loss: 167337568.00 correlation: 0.2452
|
457 |
+
Elapse: 544.84s
|
458 |
+
|
459 |
+
Epoch 072/400
|
460 |
+
Train loss: 72339856.00 correlation: 0.2872
|
461 |
+
Validation loss: 167472656.00 correlation: 0.2442
|
462 |
+
Elapse: 544.89s
|
463 |
+
|
464 |
+
Epoch 073/400
|
465 |
+
Train loss: 72270912.00 correlation: 0.2877
|
466 |
+
Validation loss: 167356592.00 correlation: 0.2443
|
467 |
+
Elapse: 545.34s
|
468 |
+
|
469 |
+
Epoch 074/400
|
470 |
+
Train loss: 72207960.00 correlation: 0.2884
|
471 |
+
Validation loss: 167467040.00 correlation: 0.2434
|
472 |
+
Elapse: 545.38s
|
473 |
+
|
474 |
+
Epoch 075/400
|
475 |
+
Train loss: 72186752.00 correlation: 0.2885
|
476 |
+
Validation loss: 167473600.00 correlation: 0.2434
|
477 |
+
Elapse: 545.13s
|
478 |
+
|
479 |
+
Loaded checkpoint from epoch 70 (correlation: 0.2456).
|
480 |
+
|
481 |
+
Reduce learning rate of core to 4.3200e-04 (num. reduce: 1).
|
482 |
+
Reduce learning rate of readouts to 3.2400e-04 (num. reduce: 1).
|
483 |
+
Reduce learning rate of shifters to 3.2400e-04 (num. reduce: 1).
|
484 |
+
|
485 |
+
Epoch 076/400
|
486 |
+
Train loss: 71743648.00 correlation: 0.2919
|
487 |
+
Validation loss: 166945040.00 correlation: 0.2479
|
488 |
+
Elapse: 544.86s
|
489 |
+
|
490 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
491 |
+
|
492 |
+
Epoch 077/400
|
493 |
+
Train loss: 71453328.00 correlation: 0.2949
|
494 |
+
Validation loss: 166933984.00 correlation: 0.2480
|
495 |
+
Elapse: 545.20s
|
496 |
+
|
497 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
498 |
+
|
499 |
+
Epoch 078/400
|
500 |
+
Train loss: 71407184.00 correlation: 0.2951
|
501 |
+
Validation loss: 166839616.00 correlation: 0.2480
|
502 |
+
Elapse: 545.38s
|
503 |
+
|
504 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
505 |
+
|
506 |
+
Epoch 079/400
|
507 |
+
Train loss: 71308560.00 correlation: 0.2960
|
508 |
+
Validation loss: 166820688.00 correlation: 0.2484
|
509 |
+
Elapse: 545.26s
|
510 |
+
|
511 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
512 |
+
|
513 |
+
Epoch 080/400
|
514 |
+
Train loss: 71223520.00 correlation: 0.2968
|
515 |
+
Validation loss: 166801616.00 correlation: 0.2487
|
516 |
+
Elapse: 545.81s
|
517 |
+
|
518 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
519 |
+
|
520 |
+
Epoch 081/400
|
521 |
+
Train loss: 71151600.00 correlation: 0.2975
|
522 |
+
Validation loss: 166777584.00 correlation: 0.2485
|
523 |
+
Elapse: 545.15s
|
524 |
+
|
525 |
+
Epoch 082/400
|
526 |
+
Train loss: 71166128.00 correlation: 0.2973
|
527 |
+
Validation loss: 166806736.00 correlation: 0.2484
|
528 |
+
Elapse: 545.51s
|
529 |
+
|
530 |
+
Epoch 083/400
|
531 |
+
Train loss: 71003768.00 correlation: 0.2991
|
532 |
+
Validation loss: 166794000.00 correlation: 0.2487
|
533 |
+
Elapse: 545.39s
|
534 |
+
|
535 |
+
Epoch 084/400
|
536 |
+
Train loss: 71028680.00 correlation: 0.2987
|
537 |
+
Validation loss: 166740976.00 correlation: 0.2486
|
538 |
+
Elapse: 545.50s
|
539 |
+
|
540 |
+
Epoch 085/400
|
541 |
+
Train loss: 70987920.00 correlation: 0.2989
|
542 |
+
Validation loss: 166771344.00 correlation: 0.2483
|
543 |
+
Elapse: 545.38s
|
544 |
+
|
545 |
+
Loaded checkpoint from epoch 80 (correlation: 0.2487).
|
546 |
+
|
547 |
+
Reduce learning rate of core to 1.2960e-04 (num. reduce: 1).
|
548 |
+
Reduce learning rate of readouts to 9.7200e-05 (num. reduce: 1).
|
549 |
+
Reduce learning rate of shifters to 9.7200e-05 (num. reduce: 1).
|
550 |
+
|
551 |
+
Epoch 086/400
|
552 |
+
Train loss: 70886192.00 correlation: 0.2998
|
553 |
+
Validation loss: 166696544.00 correlation: 0.2492
|
554 |
+
Elapse: 545.68s
|
555 |
+
|
556 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
557 |
+
|
558 |
+
Epoch 087/400
|
559 |
+
Train loss: 70891072.00 correlation: 0.2998
|
560 |
+
Validation loss: 166700640.00 correlation: 0.2493
|
561 |
+
Elapse: 545.36s
|
562 |
+
|
563 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
564 |
+
|
565 |
+
Epoch 088/400
|
566 |
+
Train loss: 70786208.00 correlation: 0.3009
|
567 |
+
Validation loss: 166720928.00 correlation: 0.2490
|
568 |
+
Elapse: 545.75s
|
569 |
+
|
570 |
+
Epoch 089/400
|
571 |
+
Train loss: 70840864.00 correlation: 0.3002
|
572 |
+
Validation loss: 166705888.00 correlation: 0.2491
|
573 |
+
Elapse: 546.01s
|
574 |
+
|
575 |
+
Epoch 090/400
|
576 |
+
Train loss: 70781008.00 correlation: 0.3008
|
577 |
+
Validation loss: 166757248.00 correlation: 0.2489
|
578 |
+
Elapse: 545.02s
|
579 |
+
|
580 |
+
Epoch 091/400
|
581 |
+
Train loss: 70768960.00 correlation: 0.3009
|
582 |
+
Validation loss: 166698640.00 correlation: 0.2489
|
583 |
+
Elapse: 545.07s
|
584 |
+
|
585 |
+
Epoch 092/400
|
586 |
+
Train loss: 70700664.00 correlation: 0.3016
|
587 |
+
Validation loss: 166705392.00 correlation: 0.2491
|
588 |
+
Elapse: 545.85s
|
589 |
+
|
590 |
+
Loaded checkpoint from epoch 87 (correlation: 0.2493).
|
591 |
+
|
592 |
+
Reduce learning rate of core to 3.8880e-05 (num. reduce: 1).
|
593 |
+
Reduce learning rate of readouts to 2.9160e-05 (num. reduce: 1).
|
594 |
+
Reduce learning rate of shifters to 2.9160e-05 (num. reduce: 1).
|
595 |
+
|
596 |
+
Epoch 093/400
|
597 |
+
Train loss: 70743624.00 correlation: 0.3012
|
598 |
+
Validation loss: 166685456.00 correlation: 0.2494
|
599 |
+
Elapse: 545.69s
|
600 |
+
|
601 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
602 |
+
|
603 |
+
Epoch 094/400
|
604 |
+
Train loss: 70752552.00 correlation: 0.3012
|
605 |
+
Validation loss: 166676048.00 correlation: 0.2493
|
606 |
+
Elapse: 545.53s
|
607 |
+
|
608 |
+
Epoch 095/400
|
609 |
+
Train loss: 70729328.00 correlation: 0.3013
|
610 |
+
Validation loss: 166677072.00 correlation: 0.2494
|
611 |
+
Elapse: 545.12s
|
612 |
+
|
613 |
+
Epoch 096/400
|
614 |
+
Train loss: 70661304.00 correlation: 0.3018
|
615 |
+
Validation loss: 166687824.00 correlation: 0.2493
|
616 |
+
Elapse: 545.30s
|
617 |
+
|
618 |
+
Epoch 097/400
|
619 |
+
Train loss: 70768896.00 correlation: 0.3006
|
620 |
+
Validation loss: 166658272.00 correlation: 0.2492
|
621 |
+
Elapse: 545.47s
|
622 |
+
|
623 |
+
Epoch 098/400
|
624 |
+
Train loss: 70673976.00 correlation: 0.3017
|
625 |
+
Validation loss: 166648288.00 correlation: 0.2495
|
626 |
+
Elapse: 545.22s
|
627 |
+
|
628 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
629 |
+
|
630 |
+
Epoch 099/400
|
631 |
+
Train loss: 70635672.00 correlation: 0.3022
|
632 |
+
Validation loss: 166648032.00 correlation: 0.2495
|
633 |
+
Elapse: 545.17s
|
634 |
+
|
635 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
636 |
+
|
637 |
+
Epoch 100/400
|
638 |
+
Train loss: 70748008.00 correlation: 0.3010
|
639 |
+
Validation loss: 166647312.00 correlation: 0.2495
|
640 |
+
Elapse: 545.61s
|
641 |
+
|
642 |
+
Epoch 101/400
|
643 |
+
Train loss: 70682408.00 correlation: 0.3016
|
644 |
+
Validation loss: 166662208.00 correlation: 0.2494
|
645 |
+
Elapse: 545.56s
|
646 |
+
|
647 |
+
Epoch 102/400
|
648 |
+
Train loss: 70642688.00 correlation: 0.3020
|
649 |
+
Validation loss: 166662624.00 correlation: 0.2495
|
650 |
+
Elapse: 545.17s
|
651 |
+
|
652 |
+
Epoch 103/400
|
653 |
+
Train loss: 70638368.00 correlation: 0.3019
|
654 |
+
Validation loss: 166645120.00 correlation: 0.2495
|
655 |
+
Elapse: 545.25s
|
656 |
+
|
657 |
+
Epoch 104/400
|
658 |
+
Train loss: 70563872.00 correlation: 0.3027
|
659 |
+
Validation loss: 166649696.00 correlation: 0.2495
|
660 |
+
Elapse: 545.70s
|
661 |
+
|
662 |
+
Loaded checkpoint from epoch 99 (correlation: 0.2495).
|
663 |
+
|
664 |
+
Reduce learning rate of core to 1.1664e-05 (num. reduce: 1).
|
665 |
+
Reduce learning rate of readouts to 8.7480e-06 (num. reduce: 1).
|
666 |
+
Reduce learning rate of shifters to 8.7480e-06 (num. reduce: 1).
|
667 |
+
|
668 |
+
Epoch 105/400
|
669 |
+
Train loss: 70679696.00 correlation: 0.3019
|
670 |
+
Validation loss: 166646944.00 correlation: 0.2495
|
671 |
+
Elapse: 545.44s
|
672 |
+
|
673 |
+
Epoch 106/400
|
674 |
+
Train loss: 70623656.00 correlation: 0.3021
|
675 |
+
Validation loss: 166651056.00 correlation: 0.2495
|
676 |
+
Elapse: 545.46s
|
677 |
+
|
678 |
+
Epoch 107/400
|
679 |
+
Train loss: 70689912.00 correlation: 0.3013
|
680 |
+
Validation loss: 166642080.00 correlation: 0.2495
|
681 |
+
Elapse: 545.17s
|
682 |
+
|
683 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
684 |
+
|
685 |
+
Epoch 108/400
|
686 |
+
Train loss: 70636352.00 correlation: 0.3019
|
687 |
+
Validation loss: 166643376.00 correlation: 0.2495
|
688 |
+
Elapse: 545.12s
|
689 |
+
|
690 |
+
Epoch 109/400
|
691 |
+
Train loss: 70622056.00 correlation: 0.3021
|
692 |
+
Validation loss: 166645664.00 correlation: 0.2495
|
693 |
+
Elapse: 545.91s
|
694 |
+
|
695 |
+
Epoch 110/400
|
696 |
+
Train loss: 70689848.00 correlation: 0.3013
|
697 |
+
Validation loss: 166646544.00 correlation: 0.2495
|
698 |
+
Elapse: 544.95s
|
699 |
+
|
700 |
+
Epoch 111/400
|
701 |
+
Train loss: 70594792.00 correlation: 0.3025
|
702 |
+
Validation loss: 166655344.00 correlation: 0.2494
|
703 |
+
Elapse: 545.66s
|
704 |
+
|
705 |
+
Epoch 112/400
|
706 |
+
Train loss: 70636904.00 correlation: 0.3020
|
707 |
+
Validation loss: 166638224.00 correlation: 0.2495
|
708 |
+
Elapse: 544.74s
|
709 |
+
|
710 |
+
Loaded checkpoint from epoch 107 (correlation: 0.2495).
|
711 |
+
|
712 |
+
Reduce learning rate of core to 3.4992e-06 (num. reduce: 1).
|
713 |
+
Reduce learning rate of readouts to 2.6244e-06 (num. reduce: 1).
|
714 |
+
Reduce learning rate of shifters to 2.6244e-06 (num. reduce: 1).
|
715 |
+
|
716 |
+
Epoch 113/400
|
717 |
+
Train loss: 70679760.00 correlation: 0.3016
|
718 |
+
Validation loss: 166645488.00 correlation: 0.2495
|
719 |
+
Elapse: 543.62s
|
720 |
+
|
721 |
+
Epoch 114/400
|
722 |
+
Train loss: 70609840.00 correlation: 0.3026
|
723 |
+
Validation loss: 166641568.00 correlation: 0.2495
|
724 |
+
Elapse: 543.57s
|
725 |
+
|
726 |
+
Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
|
727 |
+
|
728 |
+
Epoch 115/400
|
729 |
+
Train loss: 70676264.00 correlation: 0.3017
|
730 |
+
Validation loss: 166645824.00 correlation: 0.2495
|
731 |
+
Elapse: 545.22s
|
732 |
+
|
733 |
+
Epoch 116/400
|
734 |
+
Train loss: 70640760.00 correlation: 0.3023
|
735 |
+
Validation loss: 166649888.00 correlation: 0.2495
|
736 |
+
Elapse: 545.14s
|
737 |
+
|
738 |
+
Epoch 117/400
|
739 |
+
Train loss: 70651464.00 correlation: 0.3017
|
740 |
+
Validation loss: 166644896.00 correlation: 0.2495
|
741 |
+
Elapse: 545.75s
|
742 |
+
|
743 |
+
Epoch 118/400
|
744 |
+
Train loss: 70647664.00 correlation: 0.3020
|
745 |
+
Validation loss: 166642016.00 correlation: 0.2495
|
746 |
+
Elapse: 551.10s
|
747 |
+
|
748 |
+
Epoch 119/400
|
749 |
+
Train loss: 70647632.00 correlation: 0.3017
|
750 |
+
Validation loss: 166642992.00 correlation: 0.2495
|
751 |
+
Elapse: 545.02s
|
752 |
+
|
753 |
+
Loaded checkpoint from epoch 114 (correlation: 0.2495).
|
754 |
+
|
755 |
+
Reduce learning rate of core to 1.0498e-06 (num. reduce: 1).
|
756 |
+
Reduce learning rate of readouts to 7.8732e-07 (num. reduce: 1).
|
757 |
+
Reduce learning rate of shifters to 7.8732e-07 (num. reduce: 1).
|
758 |
+
|
759 |
+
Epoch 120/400
|
760 |
+
Train loss: 70673976.00 correlation: 0.3014
|
761 |
+
Validation loss: 166641376.00 correlation: 0.2495
|
762 |
+
Elapse: 544.88s
|
763 |
+
|
764 |
+
Epoch 121/400
|
765 |
+
Train loss: 70599064.00 correlation: 0.3023
|
766 |
+
Validation loss: 166642464.00 correlation: 0.2495
|
767 |
+
Elapse: 544.91s
|
768 |
+
|
769 |
+
Epoch 122/400
|
770 |
+
Train loss: 70592552.00 correlation: 0.3025
|
771 |
+
Validation loss: 166642720.00 correlation: 0.2495
|
772 |
+
Elapse: 544.80s
|
773 |
+
|
774 |
+
Epoch 123/400
|
775 |
+
Train loss: 70644184.00 correlation: 0.3019
|
776 |
+
Validation loss: 166643072.00 correlation: 0.2495
|
777 |
+
Elapse: 544.57s
|
778 |
+
|
779 |
+
Epoch 124/400
|
780 |
+
Train loss: 70629504.00 correlation: 0.3022
|
781 |
+
Validation loss: 166642208.00 correlation: 0.2495
|
782 |
+
Elapse: 545.38s
|
783 |
+
|
784 |
+
Loaded checkpoint from epoch 114 (correlation: 0.2495).
|
785 |
+
|
786 |
+
Reduce learning rate of core to 3.1493e-07 (num. reduce: 2).
|
787 |
+
Reduce learning rate of readouts to 2.3620e-07 (num. reduce: 2).
|
788 |
+
Reduce learning rate of shifters to 2.3620e-07 (num. reduce: 2).
|
789 |
+
|
790 |
+
Epoch 125/400
|
791 |
+
Train loss: 70617168.00 correlation: 0.3023
|
792 |
+
Validation loss: 166641952.00 correlation: 0.2495
|
793 |
+
Elapse: 544.97s
|
794 |
+
|
795 |
+
Epoch 126/400
|
796 |
+
Train loss: 70613328.00 correlation: 0.3026
|
797 |
+
Validation loss: 166642704.00 correlation: 0.2495
|
798 |
+
Elapse: 544.92s
|
799 |
+
|
800 |
+
Epoch 127/400
|
801 |
+
Train loss: 70681712.00 correlation: 0.3016
|
802 |
+
Validation loss: 166642848.00 correlation: 0.2495
|
803 |
+
Elapse: 544.98s
|
804 |
+
|
805 |
+
Epoch 128/400
|
806 |
+
Train loss: 70630672.00 correlation: 0.3021
|
807 |
+
Validation loss: 166642912.00 correlation: 0.2495
|
808 |
+
Elapse: 544.96s
|
809 |
+
|
810 |
+
Epoch 129/400
|
811 |
+
Train loss: 70600632.00 correlation: 0.3025
|
812 |
+
Validation loss: 166642848.00 correlation: 0.2495
|
813 |
+
Elapse: 545.27s
|
814 |
+
|
815 |
+
Model has not improved after 2 LR reductions.
|
816 |
+
|
817 |
+
Loaded checkpoint from epoch 114 (correlation: 0.2495).
|
818 |
+
|
819 |
+
|
820 |
+
ValidationA: 0.2465 B: 0.2783 C: 0.2688 D: 0.2292 E: 0.2366 F: 0.2341 G: 0.2549 H: 0.2330 I: 0.2567 J: 0.2571 average: 0.2495
|
821 |
+
|
822 |
+
Results saved to /home/storage/runs/vivit_ensemble/028.
|