bryanlimy committed on
Commit
26f9a55
·
verified ·
1 Parent(s): 30b6a9b

upload ViV1T model checkpoints, each trained with a different seed.

Browse files
001/args.yaml ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_eps: 1e-08
4
+ batch_size: 6
5
+ cache_data: false
6
+ center_crop: 1.0
7
+ clear_output_dir: true
8
+ core: vivit
9
+ core_behavior_mode: 2
10
+ core_compile: false
11
+ core_drop_path: 0.0505
12
+ core_emb_dim: 112
13
+ core_ff_activation: gelu
14
+ core_ff_dropout: 0.0592
15
+ core_flash_attention: 1
16
+ core_head_dim: 48
17
+ core_lr: 0.0048
18
+ core_mha_dropout: 0.358
19
+ core_mlp_dim: 136
20
+ core_norm_qk: false
21
+ core_num_heads: 11
22
+ core_p_dropout: 0.1338
23
+ core_parallel_attention: true
24
+ core_patch_mode: 0
25
+ core_pos_encoding: 3
26
+ core_spatial_depth: 3
27
+ core_spatial_patch_size: 7
28
+ core_spatial_patch_stride: 2
29
+ core_temporal_depth: 5
30
+ core_temporal_patch_size: 25
31
+ core_temporal_patch_stride: 1
32
+ core_weight_decay: 0.1789
33
+ criterion: poisson_correlation
34
+ critic_mode: 0
35
+ crop_frame: 140
36
+ data: /home/storage/sensorium
37
+ deterministic: false
38
+ device: cuda
39
+ dpi: 120
40
+ ds_mode: 3
41
+ ds_scale: 1
42
+ epochs: 400
43
+ format: svg
44
+ git_hash: 1033c29
45
+ grad_checkpointing: 0
46
+ grad_norm: null
47
+ input_shapes:
48
+ behavior: [2, 140]
49
+ pupil_center: [2, 140]
50
+ video: [1, 140, 36, 64]
51
+ limit_data: null
52
+ lr: 0.0036
53
+ max_frame: 300
54
+ micro_batch_size: 6
55
+ modulator_mode: 0
56
+ mouse_ids: [A, B, C, D, E, F, G, H, I, J]
57
+ num_workers: 2
58
+ output_dir: /home/storage/runs/001
59
+ output_mode: 1
60
+ output_shapes:
61
+ A: [7440, 140]
62
+ B: [7928, 140]
63
+ C: [8285, 140]
64
+ D: [7671, 140]
65
+ E: [7495, 140]
66
+ F: [7863, 140]
67
+ G: [7908, 140]
68
+ H: [8202, 140]
69
+ I: [7939, 140]
70
+ J: [8122, 140]
71
+ precision: "32"
72
+ pretrain_core: null
73
+ readout: gaussian2d
74
+ readout_bias_mode: 2
75
+ readout_dropout: 0.0
76
+ readout_grid_mode: 1
77
+ restore: null
78
+ save_plots: false
79
+ seed: 2
80
+ shifter_layers: 3
81
+ shifter_mode: 1
82
+ shifter_size: 5
83
+ stat_mode: 1
84
+ trainable_params: 12278365
85
+ transform_mode: 2
86
+ verbose: 1
87
+ weight_decay: 0.3939
001/ckpt/model_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86ee492503a0f995686aba27eb0db7f8d759dd2c4b491a692740b3be3241f14a
3
+ size 148268583
001/evaluation.yaml ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ validation: {A: 0.24868205189704895, B: 0.2788656949996948, C: 0.271991103887558,
2
+ D: 0.2340584099292755, E: 0.23670722544193268, F: 0.23395685851573944, G: 0.25554871559143066,
3
+ H: 0.23508135974407196, I: 0.25329142808914185, J: 0.2589012682437897, average: 0.25070841163396834}
001/model.txt ADDED
@@ -0,0 +1,143 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ =======================================================================================================================================
2
+ Layer (type:depth-idx) Input Shape Output Shape Param #
3
+ =======================================================================================================================================
4
+ Model -- [1, 7440, 116] --
5
+ ├─ViViTCore: 1-1 -- [1, 112, 116, 15, 29] --
6
+ │ └─ViViT: 2-1 [1, 5, 140, 36, 64] [1, 112, 116, 15, 29] --
7
+ │ │ └─Tokenizer: 3-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] 79,632
8
+ │ │ │ └─Sequential: 4-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] --
9
+ │ │ │ │ └─Unfold3d: 5-1 [1, 5, 140, 36, 64] [1, 116, 435, 6125] --
10
+ │ │ │ │ └─LayerNorm: 5-2 [1, 116, 435, 6125] [1, 116, 435, 6125] 12,250
11
+ │ │ │ │ └─Linear: 5-3 [1, 116, 435, 6125] [1, 116, 435, 112] 686,112
12
+ │ │ │ │ └─LayerNorm: 5-4 [1, 116, 435, 112] [1, 116, 435, 112] 224
13
+ │ │ │ │ └─Dropout: 5-5 [1, 116, 435, 112] [1, 116, 435, 112] --
14
+ │ │ └─Transformer: 3-2 [116, 435, 112] [116, 435, 112] --
15
+ │ │ │ └─ModuleList: 4-2 -- -- --
16
+ │ │ │ │ └─ParallelTransformerBlock: 5-6 [116, 435, 112] [116, 435, 112] --
17
+ │ │ │ │ │ └─LayerNorm: 6-1 [116, 435, 112] [116, 435, 112] 224
18
+ │ │ │ │ │ └─Linear: 6-2 [116, 435, 112] [116, 435, 1720] 192,640
19
+ │ │ │ │ │ └─Linear: 6-3 [116, 435, 528] [116, 435, 112] 59,136
20
+ │ │ │ │ │ └─DropPath: 6-4 [116, 435, 112] [116, 435, 112] --
21
+ │ │ │ │ │ └─Sequential: 6-5 [116, 435, 136] [116, 435, 112] --
22
+ │ │ │ │ │ │ └─GELU: 7-1 [116, 435, 136] [116, 435, 136] --
23
+ │ │ │ │ │ │ └─Dropout: 7-2 [116, 435, 136] [116, 435, 136] --
24
+ │ │ │ │ │ │ └─Linear: 7-3 [116, 435, 136] [116, 435, 112] 15,232
25
+ │ │ │ │ │ └─DropPath: 6-6 [116, 435, 112] [116, 435, 112] --
26
+ │ │ │ │ └─ParallelTransformerBlock: 5-7 [116, 435, 112] [116, 435, 112] --
27
+ │ │ │ │ │ └─LayerNorm: 6-7 [116, 435, 112] [116, 435, 112] 224
28
+ │ │ │ │ │ └─Linear: 6-8 [116, 435, 112] [116, 435, 1720] 192,640
29
+ │ │ │ │ │ └─Linear: 6-9 [116, 435, 528] [116, 435, 112] 59,136
30
+ │ │ │ │ │ └─DropPath: 6-10 [116, 435, 112] [116, 435, 112] --
31
+ │ │ │ │ │ └─Sequential: 6-11 [116, 435, 136] [116, 435, 112] --
32
+ │ │ │ │ │ │ └─GELU: 7-4 [116, 435, 136] [116, 435, 136] --
33
+ │ │ │ │ │ │ └─Dropout: 7-5 [116, 435, 136] [116, 435, 136] --
34
+ │ │ │ │ │ │ └─Linear: 7-6 [116, 435, 136] [116, 435, 112] 15,232
35
+ │ │ │ │ │ └─DropPath: 6-12 [116, 435, 112] [116, 435, 112] --
36
+ │ │ │ │ └─ParallelTransformerBlock: 5-8 [116, 435, 112] [116, 435, 112] --
37
+ │ │ │ │ │ └─LayerNorm: 6-13 [116, 435, 112] [116, 435, 112] 224
38
+ │ │ │ │ │ └─Linear: 6-14 [116, 435, 112] [116, 435, 1720] 192,640
39
+ │ │ │ │ │ └─Linear: 6-15 [116, 435, 528] [116, 435, 112] 59,136
40
+ │ │ │ │ │ └─DropPath: 6-16 [116, 435, 112] [116, 435, 112] --
41
+ │ │ │ │ │ └─Sequential: 6-17 [116, 435, 136] [116, 435, 112] --
42
+ │ │ │ │ │ │ └─GELU: 7-7 [116, 435, 136] [116, 435, 136] --
43
+ │ │ │ │ │ │ └─Dropout: 7-8 [116, 435, 136] [116, 435, 136] --
44
+ │ │ │ │ │ │ └─Linear: 7-9 [116, 435, 136] [116, 435, 112] 15,232
45
+ │ │ │ │ │ └─DropPath: 6-18 [116, 435, 112] [116, 435, 112] --
46
+ │ │ └─Transformer: 3-3 [435, 116, 112] [435, 116, 112] --
47
+ │ │ │ └─ModuleList: 4-3 -- -- --
48
+ │ │ │ │ └─ParallelTransformerBlock: 5-9 [435, 116, 112] [435, 116, 112] --
49
+ │ │ │ │ │ └─LayerNorm: 6-19 [435, 116, 112] [435, 116, 112] 224
50
+ │ │ │ │ │ └─Linear: 6-20 [435, 116, 112] [435, 116, 1720] 192,640
51
+ │ │ │ │ │ └─Linear: 6-21 [435, 116, 528] [435, 116, 112] 59,136
52
+ │ │ │ │ │ └─DropPath: 6-22 [435, 116, 112] [435, 116, 112] --
53
+ │ │ │ │ │ └─Sequential: 6-23 [435, 116, 136] [435, 116, 112] --
54
+ │ │ │ │ │ │ └─GELU: 7-10 [435, 116, 136] [435, 116, 136] --
55
+ │ │ │ │ │ │ └─Dropout: 7-11 [435, 116, 136] [435, 116, 136] --
56
+ │ │ │ │ │ │ └─Linear: 7-12 [435, 116, 136] [435, 116, 112] 15,232
57
+ │ │ │ │ │ └─DropPath: 6-24 [435, 116, 112] [435, 116, 112] --
58
+ │ │ │ │ └─ParallelTransformerBlock: 5-10 [435, 116, 112] [435, 116, 112] --
59
+ │ │ │ │ │ └─LayerNorm: 6-25 [435, 116, 112] [435, 116, 112] 224
60
+ │ │ │ │ │ └─Linear: 6-26 [435, 116, 112] [435, 116, 1720] 192,640
61
+ │ │ │ │ │ └─Linear: 6-27 [435, 116, 528] [435, 116, 112] 59,136
62
+ │ │ │ │ │ └─DropPath: 6-28 [435, 116, 112] [435, 116, 112] --
63
+ │ │ │ │ │ └─Sequential: 6-29 [435, 116, 136] [435, 116, 112] --
64
+ │ │ │ │ │ │ └─GELU: 7-13 [435, 116, 136] [435, 116, 136] --
65
+ │ │ │ │ │ │ └─Dropout: 7-14 [435, 116, 136] [435, 116, 136] --
66
+ │ │ │ │ │ │ └─Linear: 7-15 [435, 116, 136] [435, 116, 112] 15,232
67
+ │ │ │ │ │ └─DropPath: 6-30 [435, 116, 112] [435, 116, 112] --
68
+ │ │ │ │ └─ParallelTransformerBlock: 5-11 [435, 116, 112] [435, 116, 112] --
69
+ │ │ │ │ │ └─LayerNorm: 6-31 [435, 116, 112] [435, 116, 112] 224
70
+ │ │ │ │ │ └─Linear: 6-32 [435, 116, 112] [435, 116, 1720] 192,640
71
+ │ │ │ │ │ └─Linear: 6-33 [435, 116, 528] [435, 116, 112] 59,136
72
+ │ │ │ │ │ └─DropPath: 6-34 [435, 116, 112] [435, 116, 112] --
73
+ │ │ │ │ │ └─Sequential: 6-35 [435, 116, 136] [435, 116, 112] --
74
+ │ │ │ │ │ │ └─GELU: 7-16 [435, 116, 136] [435, 116, 136] --
75
+ │ │ │ │ │ │ └─Dropout: 7-17 [435, 116, 136] [435, 116, 136] --
76
+ │ │ │ │ │ │ └─Linear: 7-18 [435, 116, 136] [435, 116, 112] 15,232
77
+ │ │ │ │ │ └─DropPath: 6-36 [435, 116, 112] [435, 116, 112] --
78
+ │ │ │ │ └─ParallelTransformerBlock: 5-12 [435, 116, 112] [435, 116, 112] --
79
+ │ │ │ │ │ └─LayerNorm: 6-37 [435, 116, 112] [435, 116, 112] 224
80
+ │ │ │ │ │ └─Linear: 6-38 [435, 116, 112] [435, 116, 1720] 192,640
81
+ │ │ │ │ │ └─Linear: 6-39 [435, 116, 528] [435, 116, 112] 59,136
82
+ │ │ │ │ │ └─DropPath: 6-40 [435, 116, 112] [435, 116, 112] --
83
+ │ │ │ │ │ └─Sequential: 6-41 [435, 116, 136] [435, 116, 112] --
84
+ │ │ │ │ │ │ └─GELU: 7-19 [435, 116, 136] [435, 116, 136] --
85
+ │ │ │ │ │ │ └─Dropout: 7-20 [435, 116, 136] [435, 116, 136] --
86
+ │ │ │ │ │ │ └─Linear: 7-21 [435, 116, 136] [435, 116, 112] 15,232
87
+ │ │ │ │ │ └─DropPath: 6-42 [435, 116, 112] [435, 116, 112] --
88
+ │ │ │ │ └─ParallelTransformerBlock: 5-13 [435, 116, 112] [435, 116, 112] --
89
+ │ │ │ │ │ └─LayerNorm: 6-43 [435, 116, 112] [435, 116, 112] 224
90
+ │ │ │ │ │ └─Linear: 6-44 [435, 116, 112] [435, 116, 1720] 192,640
91
+ │ │ │ │ │ └─Linear: 6-45 [435, 116, 528] [435, 116, 112] 59,136
92
+ │ │ │ │ │ └─DropPath: 6-46 [435, 116, 112] [435, 116, 112] --
93
+ │ │ │ │ │ └─Sequential: 6-47 [435, 116, 136] [435, 116, 112] --
94
+ │ │ │ │ │ │ └─GELU: 7-22 [435, 116, 136] [435, 116, 136] --
95
+ │ │ │ │ │ │ └─Dropout: 7-23 [435, 116, 136] [435, 116, 136] --
96
+ │ │ │ │ │ │ └─Linear: 7-24 [435, 116, 136] [435, 116, 112] 15,232
97
+ │ │ │ │ │ └─DropPath: 6-48 [435, 116, 112] [435, 116, 112] --
98
+ │ │ └─Rearrange: 3-4 [1, 116, 435, 112] [1, 112, 116, 15, 29] --
99
+ ├─MLPShifters: 1-2 -- [1, 2, 116] 513
100
+ │ └─MLPShifter: 2-2 [116, 2] [116, 2] --
101
+ │ │ └─Sequential: 3-5 [116, 2] [116, 2] --
102
+ │ │ │ └─Linear: 4-4 [116, 2] [116, 5] 15
103
+ │ │ │ └─Tanh: 4-5 [116, 5] [116, 5] --
104
+ │ │ │ └─Linear: 4-6 [116, 5] [116, 5] 30
105
+ │ │ │ └─Tanh: 4-7 [116, 5] [116, 5] --
106
+ │ │ │ └─Linear: 4-8 [116, 5] [116, 2] 12
107
+ │ │ │ └─Tanh: 4-9 [116, 2] [116, 2] --
108
+ ├─Readouts: 1-3 [1, 112, 116, 15, 29] [1, 7440, 116] 8,477,649
109
+ │ └─Gaussian2DReadout2: 2-3 [1, 112, 116, 15, 29] [1, 7440, 116] 870,480
110
+ │ │ └─Sequential: 3-6 [7440, 2] [7440, 2] --
111
+ │ │ │ └─Linear: 4-10 [7440, 2] [7440, 30] 90
112
+ │ │ │ └─ELU: 4-11 [7440, 30] [7440, 30] --
113
+ │ │ │ └─Linear: 4-12 [7440, 30] [7440, 2] 62
114
+ │ │ │ └─Tanh: 4-13 [7440, 2] [7440, 2] --
115
+ │ │ └─Sequential: 3-7 [7440, 2] [7440, 2] (recursive)
116
+ │ │ │ └─Linear: 4-14 [7440, 2] [7440, 30] (recursive)
117
+ │ │ │ └─ELU: 4-15 [7440, 30] [7440, 30] --
118
+ │ │ │ └─Linear: 4-16 [7440, 30] [7440, 2] (recursive)
119
+ │ │ │ └─Tanh: 4-17 [7440, 2] [7440, 2] --
120
+ │ │ └─Sequential: 3-8 [7440, 2] [7440, 2] (recursive)
121
+ │ │ │ └─Linear: 4-18 [7440, 2] [7440, 30] (recursive)
122
+ │ │ │ └─ELU: 4-19 [7440, 30] [7440, 30] --
123
+ │ │ │ └─Linear: 4-20 [7440, 30] [7440, 2] (recursive)
124
+ │ │ │ └─Tanh: 4-21 [7440, 2] [7440, 2] --
125
+ │ │ └─Sequential: 3-9 [116, 4] [116, 112] --
126
+ │ │ │ └─Linear: 4-22 [116, 4] [116, 112] 560
127
+ │ │ │ └─LayerNorm: 4-23 [116, 112] [116, 112] 224
128
+ │ │ │ └─GELU: 4-24 [116, 112] [116, 112] --
129
+ │ │ │ └─Dropout: 4-25 [116, 112] [116, 112] --
130
+ │ │ │ └─Linear: 4-26 [116, 112] [116, 112] 12,656
131
+ │ │ │ └─Tanh: 4-27 [116, 112] [116, 112] --
132
+ ├─Exponential: 1-4 [1, 7440, 116] [1, 7440, 116] --
133
+ =======================================================================================================================================
134
+ Total params: 12,278,365
135
+ Trainable params: 12,278,365
136
+ Non-trainable params: 0
137
+ Total mult-adds (Units.MEGABYTES): 679.88
138
+ =======================================================================================================================================
139
+ Input size (MB): 1.29
140
+ Forward/backward pass size (MB): 9208.73
141
+ Params size (MB): 11.40
142
+ Estimated Total Size (MB): 9221.42
143
+ =======================================================================================================================================
001/output.log ADDED
@@ -0,0 +1,816 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Use bfloat16 for core module.
2
+ Use parallel attention and MLP in ViViT.
3
+
4
+ Epoch 001/400
5
+ Train loss: 113924008.00 correlation: 0.0107
6
+ Validation loss: 200107760.00 correlation: 0.0263
7
+ Elapse: 605.46s
8
+
9
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
10
+
11
+ Epoch 002/400
12
+ Train loss: 97896768.00 correlation: 0.0340
13
+ Validation loss: 199235856.00 correlation: 0.0378
14
+ Elapse: 556.86s
15
+
16
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
17
+
18
+ Epoch 003/400
19
+ Train loss: 96883144.00 correlation: 0.0443
20
+ Validation loss: 198767200.00 correlation: 0.0405
21
+ Elapse: 560.31s
22
+
23
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
24
+
25
+ Epoch 004/400
26
+ Train loss: 96317000.00 correlation: 0.0499
27
+ Validation loss: 198194576.00 correlation: 0.0449
28
+ Elapse: 560.78s
29
+
30
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
31
+
32
+ Epoch 005/400
33
+ Train loss: 95592096.00 correlation: 0.0577
34
+ Validation loss: 197382576.00 correlation: 0.0493
35
+ Elapse: 563.47s
36
+
37
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
38
+
39
+ Epoch 006/400
40
+ Train loss: 94455696.00 correlation: 0.0692
41
+ Validation loss: 195917728.00 correlation: 0.0602
42
+ Elapse: 565.83s
43
+
44
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
45
+
46
+ Epoch 007/400
47
+ Train loss: 93257144.00 correlation: 0.0821
48
+ Validation loss: 193956304.00 correlation: 0.0721
49
+ Elapse: 566.60s
50
+
51
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
52
+
53
+ Epoch 008/400
54
+ Train loss: 92014728.00 correlation: 0.0951
55
+ Validation loss: 192039424.00 correlation: 0.0839
56
+ Elapse: 566.05s
57
+
58
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
59
+
60
+ Epoch 009/400
61
+ Train loss: 91067848.00 correlation: 0.1053
62
+ Validation loss: 190701360.00 correlation: 0.0935
63
+ Elapse: 563.36s
64
+
65
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
66
+
67
+ Epoch 010/400
68
+ Train loss: 90106464.00 correlation: 0.1149
69
+ Validation loss: 189259712.00 correlation: 0.1026
70
+ Elapse: 562.44s
71
+
72
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
73
+
74
+ Epoch 011/400
75
+ Train loss: 89183952.00 correlation: 0.1243
76
+ Validation loss: 187589920.00 correlation: 0.1130
77
+ Elapse: 560.31s
78
+
79
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
80
+
81
+ Epoch 012/400
82
+ Train loss: 88171952.00 correlation: 0.1348
83
+ Validation loss: 186131232.00 correlation: 0.1219
84
+ Elapse: 559.08s
85
+
86
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
87
+
88
+ Epoch 013/400
89
+ Train loss: 87220088.00 correlation: 0.1442
90
+ Validation loss: 184294144.00 correlation: 0.1328
91
+ Elapse: 564.57s
92
+
93
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
94
+
95
+ Epoch 014/400
96
+ Train loss: 86305888.00 correlation: 0.1535
97
+ Validation loss: 182766432.00 correlation: 0.1425
98
+ Elapse: 564.31s
99
+
100
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
101
+
102
+ Epoch 015/400
103
+ Train loss: 85306032.00 correlation: 0.1632
104
+ Validation loss: 181567952.00 correlation: 0.1505
105
+ Elapse: 562.48s
106
+
107
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
108
+
109
+ Epoch 016/400
110
+ Train loss: 84622736.00 correlation: 0.1701
111
+ Validation loss: 180351280.00 correlation: 0.1587
112
+ Elapse: 561.75s
113
+
114
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
115
+
116
+ Epoch 017/400
117
+ Train loss: 83839824.00 correlation: 0.1780
118
+ Validation loss: 179434864.00 correlation: 0.1644
119
+ Elapse: 561.90s
120
+
121
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
122
+
123
+ Epoch 018/400
124
+ Train loss: 83213000.00 correlation: 0.1840
125
+ Validation loss: 178816208.00 correlation: 0.1695
126
+ Elapse: 562.07s
127
+
128
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
129
+
130
+ Epoch 019/400
131
+ Train loss: 82673560.00 correlation: 0.1895
132
+ Validation loss: 178169568.00 correlation: 0.1740
133
+ Elapse: 562.05s
134
+
135
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
136
+
137
+ Epoch 020/400
138
+ Train loss: 82081376.00 correlation: 0.1949
139
+ Validation loss: 177435600.00 correlation: 0.1787
140
+ Elapse: 561.87s
141
+
142
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
143
+
144
+ Epoch 021/400
145
+ Train loss: 81644440.00 correlation: 0.1992
146
+ Validation loss: 176873408.00 correlation: 0.1824
147
+ Elapse: 562.31s
148
+
149
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
150
+
151
+ Epoch 022/400
152
+ Train loss: 81300944.00 correlation: 0.2027
153
+ Validation loss: 176298464.00 correlation: 0.1855
154
+ Elapse: 562.57s
155
+
156
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
157
+
158
+ Epoch 023/400
159
+ Train loss: 80864992.00 correlation: 0.2072
160
+ Validation loss: 175630304.00 correlation: 0.1905
161
+ Elapse: 562.55s
162
+
163
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
164
+
165
+ Epoch 024/400
166
+ Train loss: 80516536.00 correlation: 0.2102
167
+ Validation loss: 175099184.00 correlation: 0.1937
168
+ Elapse: 561.74s
169
+
170
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
171
+
172
+ Epoch 025/400
173
+ Train loss: 80141312.00 correlation: 0.2140
174
+ Validation loss: 174953952.00 correlation: 0.1954
175
+ Elapse: 563.63s
176
+
177
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
178
+
179
+ Epoch 026/400
180
+ Train loss: 79914320.00 correlation: 0.2162
181
+ Validation loss: 174397456.00 correlation: 0.1975
182
+ Elapse: 563.20s
183
+
184
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
185
+
186
+ Epoch 027/400
187
+ Train loss: 79520984.00 correlation: 0.2200
188
+ Validation loss: 174134560.00 correlation: 0.2014
189
+ Elapse: 562.71s
190
+
191
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
192
+
193
+ Epoch 028/400
194
+ Train loss: 79212208.00 correlation: 0.2229
195
+ Validation loss: 173471920.00 correlation: 0.2046
196
+ Elapse: 562.79s
197
+
198
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
199
+
200
+ Epoch 029/400
201
+ Train loss: 78973040.00 correlation: 0.2252
202
+ Validation loss: 173183520.00 correlation: 0.2064
203
+ Elapse: 563.08s
204
+
205
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
206
+
207
+ Epoch 030/400
208
+ Train loss: 78870784.00 correlation: 0.2264
209
+ Validation loss: 172775088.00 correlation: 0.2096
210
+ Elapse: 562.82s
211
+
212
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
213
+
214
+ Epoch 031/400
215
+ Train loss: 78490200.00 correlation: 0.2296
216
+ Validation loss: 172664992.00 correlation: 0.2107
217
+ Elapse: 563.05s
218
+
219
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
220
+
221
+ Epoch 032/400
222
+ Train loss: 78317200.00 correlation: 0.2318
223
+ Validation loss: 172019824.00 correlation: 0.2132
224
+ Elapse: 562.89s
225
+
226
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
227
+
228
+ Epoch 033/400
229
+ Train loss: 78137128.00 correlation: 0.2333
230
+ Validation loss: 171897024.00 correlation: 0.2150
231
+ Elapse: 562.71s
232
+
233
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
234
+
235
+ Epoch 034/400
236
+ Train loss: 77950032.00 correlation: 0.2354
237
+ Validation loss: 171802656.00 correlation: 0.2157
238
+ Elapse: 562.68s
239
+
240
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
241
+
242
+ Epoch 035/400
243
+ Train loss: 77766832.00 correlation: 0.2367
244
+ Validation loss: 171322160.00 correlation: 0.2180
245
+ Elapse: 561.92s
246
+
247
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
248
+
249
+ Epoch 036/400
250
+ Train loss: 77637216.00 correlation: 0.2384
251
+ Validation loss: 171034880.00 correlation: 0.2209
252
+ Elapse: 562.15s
253
+
254
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
255
+
256
+ Epoch 037/400
257
+ Train loss: 77482304.00 correlation: 0.2397
258
+ Validation loss: 171174608.00 correlation: 0.2203
259
+ Elapse: 564.93s
260
+
261
+ Epoch 038/400
262
+ Train loss: 77429408.00 correlation: 0.2402
263
+ Validation loss: 170815888.00 correlation: 0.2218
264
+ Elapse: 564.45s
265
+
266
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
267
+
268
+ Epoch 039/400
269
+ Train loss: 77292792.00 correlation: 0.2412
270
+ Validation loss: 170692576.00 correlation: 0.2224
271
+ Elapse: 563.94s
272
+
273
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
274
+
275
+ Epoch 040/400
276
+ Train loss: 77122352.00 correlation: 0.2426
277
+ Validation loss: 170492064.00 correlation: 0.2256
278
+ Elapse: 565.03s
279
+
280
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
281
+
282
+ Epoch 041/400
283
+ Train loss: 77124456.00 correlation: 0.2430
284
+ Validation loss: 170532256.00 correlation: 0.2245
285
+ Elapse: 564.39s
286
+
287
+ Epoch 042/400
288
+ Train loss: 76964592.00 correlation: 0.2445
289
+ Validation loss: 170406688.00 correlation: 0.2257
290
+ Elapse: 565.12s
291
+
292
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
293
+
294
+ Epoch 043/400
295
+ Train loss: 76869008.00 correlation: 0.2454
296
+ Validation loss: 170592080.00 correlation: 0.2248
297
+ Elapse: 563.98s
298
+
299
+ Epoch 044/400
300
+ Train loss: 76798544.00 correlation: 0.2461
301
+ Validation loss: 170285664.00 correlation: 0.2253
302
+ Elapse: 564.88s
303
+
304
+ Epoch 045/400
305
+ Train loss: 76706736.00 correlation: 0.2469
306
+ Validation loss: 170137504.00 correlation: 0.2276
307
+ Elapse: 564.78s
308
+
309
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
310
+
311
+ Epoch 046/400
312
+ Train loss: 76661312.00 correlation: 0.2474
313
+ Validation loss: 170203360.00 correlation: 0.2258
314
+ Elapse: 563.90s
315
+
316
+ Epoch 047/400
317
+ Train loss: 76653904.00 correlation: 0.2479
318
+ Validation loss: 169920448.00 correlation: 0.2283
319
+ Elapse: 565.79s
320
+
321
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
322
+
323
+ Epoch 048/400
324
+ Train loss: 76510704.00 correlation: 0.2491
325
+ Validation loss: 169954384.00 correlation: 0.2279
326
+ Elapse: 566.41s
327
+
328
+ Epoch 049/400
329
+ Train loss: 76493416.00 correlation: 0.2492
330
+ Validation loss: 169840224.00 correlation: 0.2290
331
+ Elapse: 566.13s
332
+
333
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
334
+
335
+ Epoch 050/400
336
+ Train loss: 76429016.00 correlation: 0.2495
337
+ Validation loss: 170036560.00 correlation: 0.2272
338
+ Elapse: 567.15s
339
+
340
+ Epoch 051/400
341
+ Train loss: 76434184.00 correlation: 0.2500
342
+ Validation loss: 169668848.00 correlation: 0.2298
343
+ Elapse: 563.78s
344
+
345
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
346
+
347
+ Epoch 052/400
348
+ Train loss: 76368824.00 correlation: 0.2505
349
+ Validation loss: 169862640.00 correlation: 0.2292
350
+ Elapse: 563.52s
351
+
352
+ Epoch 053/400
353
+ Train loss: 76235120.00 correlation: 0.2516
354
+ Validation loss: 169524560.00 correlation: 0.2315
355
+ Elapse: 565.24s
356
+
357
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
358
+
359
+ Epoch 054/400
360
+ Train loss: 76236176.00 correlation: 0.2518
361
+ Validation loss: 169235696.00 correlation: 0.2324
362
+ Elapse: 564.43s
363
+
364
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
365
+
366
+ Epoch 055/400
367
+ Train loss: 76272208.00 correlation: 0.2514
368
+ Validation loss: 169566032.00 correlation: 0.2303
369
+ Elapse: 564.62s
370
+
371
+ Epoch 056/400
372
+ Train loss: 76095872.00 correlation: 0.2528
373
+ Validation loss: 169257008.00 correlation: 0.2329
374
+ Elapse: 564.52s
375
+
376
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
377
+
378
+ Epoch 057/400
379
+ Train loss: 76150160.00 correlation: 0.2523
380
+ Validation loss: 169306656.00 correlation: 0.2323
381
+ Elapse: 564.42s
382
+
383
+ Epoch 058/400
384
+ Train loss: 75971168.00 correlation: 0.2540
385
+ Validation loss: 169281824.00 correlation: 0.2326
386
+ Elapse: 565.79s
387
+
388
+ Epoch 059/400
389
+ Train loss: 76016632.00 correlation: 0.2537
390
+ Validation loss: 169175984.00 correlation: 0.2330
391
+ Elapse: 567.53s
392
+
393
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
394
+
395
+ Epoch 060/400
396
+ Train loss: 75961288.00 correlation: 0.2543
397
+ Validation loss: 169244832.00 correlation: 0.2312
398
+ Elapse: 564.74s
399
+
400
+ Epoch 061/400
401
+ Train loss: 75918368.00 correlation: 0.2545
402
+ Validation loss: 169277088.00 correlation: 0.2310
403
+ Elapse: 564.73s
404
+
405
+ Epoch 062/400
406
+ Train loss: 75869072.00 correlation: 0.2550
407
+ Validation loss: 169328944.00 correlation: 0.2320
408
+ Elapse: 564.39s
409
+
410
+ Epoch 063/400
411
+ Train loss: 75762192.00 correlation: 0.2561
412
+ Validation loss: 169258112.00 correlation: 0.2316
413
+ Elapse: 564.19s
414
+
415
+ Epoch 064/400
416
+ Train loss: 75825328.00 correlation: 0.2556
417
+ Validation loss: 169071840.00 correlation: 0.2332
418
+ Elapse: 564.93s
419
+
420
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
421
+
422
+ Epoch 065/400
423
+ Train loss: 75713256.00 correlation: 0.2566
424
+ Validation loss: 169214000.00 correlation: 0.2329
425
+ Elapse: 564.84s
426
+
427
+ Epoch 066/400
428
+ Train loss: 75745160.00 correlation: 0.2561
429
+ Validation loss: 169041248.00 correlation: 0.2327
430
+ Elapse: 564.78s
431
+
432
+ Epoch 067/400
433
+ Train loss: 75648152.00 correlation: 0.2572
434
+ Validation loss: 169051616.00 correlation: 0.2327
435
+ Elapse: 565.20s
436
+
437
+ Epoch 068/400
438
+ Train loss: 75614368.00 correlation: 0.2577
439
+ Validation loss: 169221120.00 correlation: 0.2327
440
+ Elapse: 564.71s
441
+
442
+ Epoch 069/400
443
+ Train loss: 75625776.00 correlation: 0.2574
444
+ Validation loss: 169122256.00 correlation: 0.2330
445
+ Elapse: 564.46s
446
+
447
+ Loaded checkpoint from epoch 64 (correlation: 0.2332).
448
+
449
+ Reduce learning rate of core to 1.4400e-03 (num. reduce: 1).
450
+ Reduce learning rate of readouts to 1.0800e-03 (num. reduce: 1).
451
+ Reduce learning rate of shifters to 1.0800e-03 (num. reduce: 1).
452
+
453
+ Epoch 070/400
454
+ Train loss: 73759920.00 correlation: 0.2731
455
+ Validation loss: 167411552.00 correlation: 0.2444
456
+ Elapse: 565.27s
457
+
458
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
459
+
460
+ Epoch 071/400
461
+ Train loss: 73162624.00 correlation: 0.2785
462
+ Validation loss: 167276400.00 correlation: 0.2454
463
+ Elapse: 565.31s
464
+
465
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
466
+
467
+ Epoch 072/400
468
+ Train loss: 73062080.00 correlation: 0.2797
469
+ Validation loss: 167303840.00 correlation: 0.2453
470
+ Elapse: 565.70s
471
+
472
+ Epoch 073/400
473
+ Train loss: 72859248.00 correlation: 0.2818
474
+ Validation loss: 167279840.00 correlation: 0.2448
475
+ Elapse: 566.21s
476
+
477
+ Epoch 074/400
478
+ Train loss: 72867944.00 correlation: 0.2819
479
+ Validation loss: 167328304.00 correlation: 0.2445
480
+ Elapse: 566.10s
481
+
482
+ Epoch 075/400
483
+ Train loss: 72806064.00 correlation: 0.2823
484
+ Validation loss: 167367392.00 correlation: 0.2443
485
+ Elapse: 566.39s
486
+
487
+ Epoch 076/400
488
+ Train loss: 72707504.00 correlation: 0.2836
489
+ Validation loss: 167176992.00 correlation: 0.2450
490
+ Elapse: 566.85s
491
+
492
+ Loaded checkpoint from epoch 71 (correlation: 0.2454).
493
+
494
+ Reduce learning rate of core to 4.3200e-04 (num. reduce: 1).
495
+ Reduce learning rate of readouts to 3.2400e-04 (num. reduce: 1).
496
+ Reduce learning rate of shifters to 3.2400e-04 (num. reduce: 1).
497
+
498
+ Epoch 077/400
499
+ Train loss: 72382144.00 correlation: 0.2856
500
+ Validation loss: 166842576.00 correlation: 0.2479
501
+ Elapse: 566.50s
502
+
503
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
504
+
505
+ Epoch 078/400
506
+ Train loss: 72078376.00 correlation: 0.2881
507
+ Validation loss: 166822496.00 correlation: 0.2483
508
+ Elapse: 567.42s
509
+
510
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
511
+
512
+ Epoch 079/400
513
+ Train loss: 71958248.00 correlation: 0.2896
514
+ Validation loss: 166738624.00 correlation: 0.2488
515
+ Elapse: 567.48s
516
+
517
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
518
+
519
+ Epoch 080/400
520
+ Train loss: 71895880.00 correlation: 0.2900
521
+ Validation loss: 166642640.00 correlation: 0.2490
522
+ Elapse: 567.47s
523
+
524
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
525
+
526
+ Epoch 081/400
527
+ Train loss: 71789800.00 correlation: 0.2911
528
+ Validation loss: 166705248.00 correlation: 0.2491
529
+ Elapse: 566.97s
530
+
531
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
532
+
533
+ Epoch 082/400
534
+ Train loss: 71770424.00 correlation: 0.2915
535
+ Validation loss: 166628368.00 correlation: 0.2487
536
+ Elapse: 567.08s
537
+
538
+ Epoch 083/400
539
+ Train loss: 71742960.00 correlation: 0.2915
540
+ Validation loss: 166623744.00 correlation: 0.2491
541
+ Elapse: 567.32s
542
+
543
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
544
+
545
+ Epoch 084/400
546
+ Train loss: 71726080.00 correlation: 0.2915
547
+ Validation loss: 166593008.00 correlation: 0.2489
548
+ Elapse: 566.52s
549
+
550
+ Epoch 085/400
551
+ Train loss: 71608472.00 correlation: 0.2930
552
+ Validation loss: 166582448.00 correlation: 0.2494
553
+ Elapse: 566.39s
554
+
555
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
556
+
557
+ Epoch 086/400
558
+ Train loss: 71622656.00 correlation: 0.2929
559
+ Validation loss: 166651488.00 correlation: 0.2488
560
+ Elapse: 567.27s
561
+
562
+ Epoch 087/400
563
+ Train loss: 71550640.00 correlation: 0.2936
564
+ Validation loss: 166630768.00 correlation: 0.2490
565
+ Elapse: 566.70s
566
+
567
+ Epoch 088/400
568
+ Train loss: 71491864.00 correlation: 0.2941
569
+ Validation loss: 166610080.00 correlation: 0.2493
570
+ Elapse: 567.65s
571
+
572
+ Epoch 089/400
573
+ Train loss: 71458584.00 correlation: 0.2944
574
+ Validation loss: 166546464.00 correlation: 0.2492
575
+ Elapse: 566.68s
576
+
577
+ Epoch 090/400
578
+ Train loss: 71462792.00 correlation: 0.2945
579
+ Validation loss: 166668320.00 correlation: 0.2492
580
+ Elapse: 566.84s
581
+
582
+ Loaded checkpoint from epoch 85 (correlation: 0.2494).
583
+
584
+ Reduce learning rate of core to 1.2960e-04 (num. reduce: 1).
585
+ Reduce learning rate of readouts to 9.7200e-05 (num. reduce: 1).
586
+ Reduce learning rate of shifters to 9.7200e-05 (num. reduce: 1).
587
+
588
+ Epoch 091/400
589
+ Train loss: 71288968.00 correlation: 0.2953
590
+ Validation loss: 166494880.00 correlation: 0.2500
591
+ Elapse: 567.12s
592
+
593
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
594
+
595
+ Epoch 092/400
596
+ Train loss: 71275904.00 correlation: 0.2958
597
+ Validation loss: 166504256.00 correlation: 0.2498
598
+ Elapse: 566.80s
599
+
600
+ Epoch 093/400
601
+ Train loss: 71229392.00 correlation: 0.2962
602
+ Validation loss: 166490080.00 correlation: 0.2502
603
+ Elapse: 567.91s
604
+
605
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
606
+
607
+ Epoch 094/400
608
+ Train loss: 71289360.00 correlation: 0.2955
609
+ Validation loss: 166481824.00 correlation: 0.2501
610
+ Elapse: 567.35s
611
+
612
+ Epoch 095/400
613
+ Train loss: 71209928.00 correlation: 0.2962
614
+ Validation loss: 166463984.00 correlation: 0.2501
615
+ Elapse: 567.29s
616
+
617
+ Epoch 096/400
618
+ Train loss: 71155936.00 correlation: 0.2969
619
+ Validation loss: 166447504.00 correlation: 0.2502
620
+ Elapse: 567.66s
621
+
622
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
623
+
624
+ Epoch 097/400
625
+ Train loss: 71163080.00 correlation: 0.2967
626
+ Validation loss: 166476448.00 correlation: 0.2501
627
+ Elapse: 567.23s
628
+
629
+ Epoch 098/400
630
+ Train loss: 71090216.00 correlation: 0.2976
631
+ Validation loss: 166447952.00 correlation: 0.2502
632
+ Elapse: 567.15s
633
+
634
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
635
+
636
+ Epoch 099/400
637
+ Train loss: 71146160.00 correlation: 0.2971
638
+ Validation loss: 166436720.00 correlation: 0.2504
639
+ Elapse: 566.92s
640
+
641
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
642
+
643
+ Epoch 100/400
644
+ Train loss: 71064016.00 correlation: 0.2977
645
+ Validation loss: 166422944.00 correlation: 0.2502
646
+ Elapse: 567.03s
647
+
648
+ Epoch 101/400
649
+ Train loss: 71056432.00 correlation: 0.2979
650
+ Validation loss: 166403840.00 correlation: 0.2505
651
+ Elapse: 567.52s
652
+
653
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
654
+
655
+ Epoch 102/400
656
+ Train loss: 71051576.00 correlation: 0.2978
657
+ Validation loss: 166443872.00 correlation: 0.2504
658
+ Elapse: 567.13s
659
+
660
+ Epoch 103/400
661
+ Train loss: 71046608.00 correlation: 0.2979
662
+ Validation loss: 166479680.00 correlation: 0.2502
663
+ Elapse: 566.67s
664
+
665
+ Epoch 104/400
666
+ Train loss: 71038120.00 correlation: 0.2981
667
+ Validation loss: 166454112.00 correlation: 0.2501
668
+ Elapse: 564.93s
669
+
670
+ Epoch 105/400
671
+ Train loss: 70978192.00 correlation: 0.2988
672
+ Validation loss: 166414432.00 correlation: 0.2503
673
+ Elapse: 564.91s
674
+
675
+ Epoch 106/400
676
+ Train loss: 70976960.00 correlation: 0.2990
677
+ Validation loss: 166474720.00 correlation: 0.2500
678
+ Elapse: 566.07s
679
+
680
+ Loaded checkpoint from epoch 101 (correlation: 0.2505).
681
+
682
+ Reduce learning rate of core to 3.8880e-05 (num. reduce: 1).
683
+ Reduce learning rate of readouts to 2.9160e-05 (num. reduce: 1).
684
+ Reduce learning rate of shifters to 2.9160e-05 (num. reduce: 1).
685
+
686
+ Epoch 107/400
687
+ Train loss: 70972624.00 correlation: 0.2986
688
+ Validation loss: 166398144.00 correlation: 0.2506
689
+ Elapse: 566.75s
690
+
691
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
692
+
693
+ Epoch 108/400
694
+ Train loss: 70964176.00 correlation: 0.2987
695
+ Validation loss: 166382512.00 correlation: 0.2506
696
+ Elapse: 566.44s
697
+
698
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
699
+
700
+ Epoch 109/400
701
+ Train loss: 70976968.00 correlation: 0.2987
702
+ Validation loss: 166404432.00 correlation: 0.2505
703
+ Elapse: 567.32s
704
+
705
+ Epoch 110/400
706
+ Train loss: 70951736.00 correlation: 0.2985
707
+ Validation loss: 166396896.00 correlation: 0.2506
708
+ Elapse: 567.77s
709
+
710
+ Epoch 111/400
711
+ Train loss: 70895944.00 correlation: 0.2997
712
+ Validation loss: 166385856.00 correlation: 0.2506
713
+ Elapse: 566.89s
714
+
715
+ Epoch 112/400
716
+ Train loss: 70880200.00 correlation: 0.2995
717
+ Validation loss: 166380672.00 correlation: 0.2507
718
+ Elapse: 566.94s
719
+
720
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/002/ckpt/model_state.pt.
721
+
722
+ Epoch 113/400
723
+ Train loss: 70861304.00 correlation: 0.2998
724
+ Validation loss: 166391184.00 correlation: 0.2506
725
+ Elapse: 566.54s
726
+
727
+ Epoch 114/400
728
+ Train loss: 70921912.00 correlation: 0.2989
729
+ Validation loss: 166417776.00 correlation: 0.2504
730
+ Elapse: 567.26s
731
+
732
+ Epoch 115/400
733
+ Train loss: 70914312.00 correlation: 0.2989
734
+ Validation loss: 166403376.00 correlation: 0.2506
735
+ Elapse: 566.92s
736
+
737
+ Epoch 116/400
738
+ Train loss: 70903784.00 correlation: 0.2992
739
+ Validation loss: 166403360.00 correlation: 0.2506
740
+ Elapse: 567.11s
741
+
742
+ Epoch 117/400
743
+ Train loss: 70866896.00 correlation: 0.2994
744
+ Validation loss: 166382688.00 correlation: 0.2505
745
+ Elapse: 566.94s
746
+
747
+ Loaded checkpoint from epoch 112 (correlation: 0.2507).
748
+
749
+ Reduce learning rate of core to 1.1664e-05 (num. reduce: 1).
750
+ Reduce learning rate of readouts to 8.7480e-06 (num. reduce: 1).
751
+ Reduce learning rate of shifters to 8.7480e-06 (num. reduce: 1).
752
+
753
+ Epoch 118/400
754
+ Train loss: 70926000.00 correlation: 0.2989
755
+ Validation loss: 166380768.00 correlation: 0.2506
756
+ Elapse: 567.50s
757
+
758
+ Epoch 119/400
759
+ Train loss: 70900808.00 correlation: 0.2993
760
+ Validation loss: 166386016.00 correlation: 0.2506
761
+ Elapse: 567.35s
762
+
763
+ Epoch 120/400
764
+ Train loss: 70881328.00 correlation: 0.2993
765
+ Validation loss: 166387568.00 correlation: 0.2506
766
+ Elapse: 567.65s
767
+
768
+ Epoch 121/400
769
+ Train loss: 70937256.00 correlation: 0.2984
770
+ Validation loss: 166393568.00 correlation: 0.2506
771
+ Elapse: 566.97s
772
+
773
+ Epoch 122/400
774
+ Train loss: 70855888.00 correlation: 0.2996
775
+ Validation loss: 166378592.00 correlation: 0.2507
776
+ Elapse: 567.50s
777
+
778
+ Loaded checkpoint from epoch 112 (correlation: 0.2507).
779
+
780
+ Reduce learning rate of core to 3.4992e-06 (num. reduce: 2).
781
+ Reduce learning rate of readouts to 2.6244e-06 (num. reduce: 2).
782
+ Reduce learning rate of shifters to 2.6244e-06 (num. reduce: 2).
783
+
784
+ Epoch 123/400
785
+ Train loss: 70938496.00 correlation: 0.2988
786
+ Validation loss: 166375792.00 correlation: 0.2507
787
+ Elapse: 567.50s
788
+
789
+ Epoch 124/400
790
+ Train loss: 70966320.00 correlation: 0.2986
791
+ Validation loss: 166383664.00 correlation: 0.2506
792
+ Elapse: 567.77s
793
+
794
+ Epoch 125/400
795
+ Train loss: 70872080.00 correlation: 0.2990
796
+ Validation loss: 166383328.00 correlation: 0.2506
797
+ Elapse: 567.87s
798
+
799
+ Epoch 126/400
800
+ Train loss: 70866264.00 correlation: 0.2997
801
+ Validation loss: 166383136.00 correlation: 0.2506
802
+ Elapse: 567.21s
803
+
804
+ Epoch 127/400
805
+ Train loss: 70836352.00 correlation: 0.2996
806
+ Validation loss: 166386816.00 correlation: 0.2506
807
+ Elapse: 566.90s
808
+
809
+ Model has not improved after 2 LR reductions.
810
+
811
+ Loaded checkpoint from epoch 112 (correlation: 0.2507).
812
+
813
+
814
+ ValidationA: 0.2487 B: 0.2789 C: 0.2720 D: 0.2341 E: 0.2367 F: 0.2340 G: 0.2555 H: 0.2351 I: 0.2533 J: 0.2589 average: 0.2507
815
+
816
+ Results saved to /home/storage/runs/vivit_ensemble/002.
002/args.yaml ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_eps: 1e-08
4
+ batch_size: 6
5
+ cache_data: false
6
+ center_crop: 1.0
7
+ clear_output_dir: true
8
+ core: vivit
9
+ core_behavior_mode: 2
10
+ core_compile: false
11
+ core_drop_path: 0.0505
12
+ core_emb_dim: 112
13
+ core_ff_activation: gelu
14
+ core_ff_dropout: 0.0592
15
+ core_flash_attention: 1
16
+ core_head_dim: 48
17
+ core_lr: 0.0048
18
+ core_mha_dropout: 0.358
19
+ core_mlp_dim: 136
20
+ core_norm_qk: false
21
+ core_num_heads: 11
22
+ core_p_dropout: 0.1338
23
+ core_parallel_attention: true
24
+ core_patch_mode: 0
25
+ core_pos_encoding: 3
26
+ core_spatial_depth: 3
27
+ core_spatial_patch_size: 7
28
+ core_spatial_patch_stride: 2
29
+ core_temporal_depth: 5
30
+ core_temporal_patch_size: 25
31
+ core_temporal_patch_stride: 1
32
+ core_weight_decay: 0.1789
33
+ criterion: poisson_correlation
34
+ critic_mode: 0
35
+ crop_frame: 140
36
+ data: /home/sensorium2023
37
+ deterministic: false
38
+ device: cuda
39
+ dpi: 120
40
+ ds_mode: 3
41
+ ds_scale: 1
42
+ epochs: 400
43
+ format: svg
44
+ git_hash: 1033c29
45
+ grad_checkpointing: 0
46
+ grad_norm: null
47
+ input_shapes:
48
+ behavior: [2, 140]
49
+ pupil_center: [2, 140]
50
+ video: [1, 140, 36, 64]
51
+ limit_data: null
52
+ lr: 0.0036
53
+ max_frame: 300
54
+ micro_batch_size: 6
55
+ modulator_mode: 0
56
+ mouse_ids: [A, B, C, D, E, F, G, H, I, J]
57
+ num_workers: 2
58
+ output_dir: /home/storage/runs/002
59
+ output_mode: 1
60
+ output_shapes:
61
+ A: [7440, 140]
62
+ B: [7928, 140]
63
+ C: [8285, 140]
64
+ D: [7671, 140]
65
+ E: [7495, 140]
66
+ F: [7863, 140]
67
+ G: [7908, 140]
68
+ H: [8202, 140]
69
+ I: [7939, 140]
70
+ J: [8122, 140]
71
+ precision: "32"
72
+ pretrain_core: null
73
+ readout: gaussian2d
74
+ readout_bias_mode: 2
75
+ readout_dropout: 0.0
76
+ readout_grid_mode: 1
77
+ restore: null
78
+ save_plots: false
79
+ seed: 9
80
+ shifter_layers: 3
81
+ shifter_mode: 1
82
+ shifter_size: 5
83
+ stat_mode: 1
84
+ trainable_params: 12278365
85
+ transform_mode: 2
86
+ verbose: 1
87
+ weight_decay: 0.3939
002/ckpt/model_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beef5725438551d35727d0a1a42f996cce8ce0c760b74e7f7228171b34283e11
3
+ size 148268583
002/evaluation.yaml ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ validation: {A: 0.25081300735473633, B: 0.2804259657859802, C: 0.27504464983940125,
2
+ D: 0.23932193219661713, E: 0.23903165757656097, F: 0.23461945354938507, G: 0.25730910897254944,
3
+ H: 0.2378837764263153, I: 0.2555205523967743, J: 0.25993871688842773, average: 0.25299088209867476}
002/model.txt ADDED
@@ -0,0 +1,143 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ =======================================================================================================================================
2
+ Layer (type:depth-idx) Input Shape Output Shape Param #
3
+ =======================================================================================================================================
4
+ Model -- [1, 7440, 116] --
5
+ ├─ViViTCore: 1-1 -- [1, 112, 116, 15, 29] --
6
+ │ └─ViViT: 2-1 [1, 5, 140, 36, 64] [1, 112, 116, 15, 29] --
7
+ │ │ └─Tokenizer: 3-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] 79,632
8
+ │ │ │ └─Sequential: 4-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] --
9
+ │ │ │ │ └─Unfold3d: 5-1 [1, 5, 140, 36, 64] [1, 116, 435, 6125] --
10
+ │ │ │ │ └─LayerNorm: 5-2 [1, 116, 435, 6125] [1, 116, 435, 6125] 12,250
11
+ │ │ │ │ └─Linear: 5-3 [1, 116, 435, 6125] [1, 116, 435, 112] 686,112
12
+ │ │ │ │ └─LayerNorm: 5-4 [1, 116, 435, 112] [1, 116, 435, 112] 224
13
+ │ │ │ │ └─Dropout: 5-5 [1, 116, 435, 112] [1, 116, 435, 112] --
14
+ │ │ └─Transformer: 3-2 [116, 435, 112] [116, 435, 112] --
15
+ │ │ │ └─ModuleList: 4-2 -- -- --
16
+ │ │ │ │ └─ParallelTransformerBlock: 5-6 [116, 435, 112] [116, 435, 112] --
17
+ │ │ │ │ │ └─LayerNorm: 6-1 [116, 435, 112] [116, 435, 112] 224
18
+ │ │ │ │ │ └─Linear: 6-2 [116, 435, 112] [116, 435, 1720] 192,640
19
+ │ │ │ │ │ └─Linear: 6-3 [116, 435, 528] [116, 435, 112] 59,136
20
+ │ │ │ │ │ └─DropPath: 6-4 [116, 435, 112] [116, 435, 112] --
21
+ │ │ │ │ │ └─Sequential: 6-5 [116, 435, 136] [116, 435, 112] --
22
+ │ │ │ │ │ │ └─GELU: 7-1 [116, 435, 136] [116, 435, 136] --
23
+ │ │ │ │ │ │ └─Dropout: 7-2 [116, 435, 136] [116, 435, 136] --
24
+ │ │ │ │ │ │ └─Linear: 7-3 [116, 435, 136] [116, 435, 112] 15,232
25
+ │ │ │ │ │ └─DropPath: 6-6 [116, 435, 112] [116, 435, 112] --
26
+ │ │ │ │ └─ParallelTransformerBlock: 5-7 [116, 435, 112] [116, 435, 112] --
27
+ │ │ │ │ │ └─LayerNorm: 6-7 [116, 435, 112] [116, 435, 112] 224
28
+ │ │ │ │ │ └─Linear: 6-8 [116, 435, 112] [116, 435, 1720] 192,640
29
+ │ │ │ │ │ └─Linear: 6-9 [116, 435, 528] [116, 435, 112] 59,136
30
+ │ │ │ │ │ └─DropPath: 6-10 [116, 435, 112] [116, 435, 112] --
31
+ │ │ │ │ │ └─Sequential: 6-11 [116, 435, 136] [116, 435, 112] --
32
+ │ │ │ │ │ │ └─GELU: 7-4 [116, 435, 136] [116, 435, 136] --
33
+ │ │ │ │ │ │ └─Dropout: 7-5 [116, 435, 136] [116, 435, 136] --
34
+ │ │ │ │ │ │ └─Linear: 7-6 [116, 435, 136] [116, 435, 112] 15,232
35
+ │ │ │ │ │ └─DropPath: 6-12 [116, 435, 112] [116, 435, 112] --
36
+ │ │ │ │ └─ParallelTransformerBlock: 5-8 [116, 435, 112] [116, 435, 112] --
37
+ │ │ │ │ │ └─LayerNorm: 6-13 [116, 435, 112] [116, 435, 112] 224
38
+ │ │ │ │ │ └─Linear: 6-14 [116, 435, 112] [116, 435, 1720] 192,640
39
+ │ │ │ │ │ └─Linear: 6-15 [116, 435, 528] [116, 435, 112] 59,136
40
+ │ │ │ │ │ └─DropPath: 6-16 [116, 435, 112] [116, 435, 112] --
41
+ │ │ │ │ │ └─Sequential: 6-17 [116, 435, 136] [116, 435, 112] --
42
+ │ │ │ │ │ │ └─GELU: 7-7 [116, 435, 136] [116, 435, 136] --
43
+ │ │ │ │ │ │ └─Dropout: 7-8 [116, 435, 136] [116, 435, 136] --
44
+ │ │ │ │ │ │ └─Linear: 7-9 [116, 435, 136] [116, 435, 112] 15,232
45
+ │ │ │ │ │ └─DropPath: 6-18 [116, 435, 112] [116, 435, 112] --
46
+ │ │ └─Transformer: 3-3 [435, 116, 112] [435, 116, 112] --
47
+ │ │ │ └─ModuleList: 4-3 -- -- --
48
+ │ │ │ │ └─ParallelTransformerBlock: 5-9 [435, 116, 112] [435, 116, 112] --
49
+ │ │ │ │ │ └─LayerNorm: 6-19 [435, 116, 112] [435, 116, 112] 224
50
+ │ │ │ │ │ └─Linear: 6-20 [435, 116, 112] [435, 116, 1720] 192,640
51
+ │ │ │ │ │ └─Linear: 6-21 [435, 116, 528] [435, 116, 112] 59,136
52
+ │ │ │ │ │ └─DropPath: 6-22 [435, 116, 112] [435, 116, 112] --
53
+ │ │ │ │ │ └─Sequential: 6-23 [435, 116, 136] [435, 116, 112] --
54
+ │ │ │ │ │ │ └─GELU: 7-10 [435, 116, 136] [435, 116, 136] --
55
+ │ │ │ │ │ │ └─Dropout: 7-11 [435, 116, 136] [435, 116, 136] --
56
+ │ │ │ │ │ │ └─Linear: 7-12 [435, 116, 136] [435, 116, 112] 15,232
57
+ │ │ │ │ │ └─DropPath: 6-24 [435, 116, 112] [435, 116, 112] --
58
+ │ │ │ │ └─ParallelTransformerBlock: 5-10 [435, 116, 112] [435, 116, 112] --
59
+ │ │ │ │ │ └─LayerNorm: 6-25 [435, 116, 112] [435, 116, 112] 224
60
+ │ │ │ │ │ └─Linear: 6-26 [435, 116, 112] [435, 116, 1720] 192,640
61
+ │ │ │ │ │ └─Linear: 6-27 [435, 116, 528] [435, 116, 112] 59,136
62
+ │ │ │ │ │ └─DropPath: 6-28 [435, 116, 112] [435, 116, 112] --
63
+ │ │ │ │ │ └─Sequential: 6-29 [435, 116, 136] [435, 116, 112] --
64
+ │ │ │ │ │ │ └─GELU: 7-13 [435, 116, 136] [435, 116, 136] --
65
+ │ │ │ │ │ │ └─Dropout: 7-14 [435, 116, 136] [435, 116, 136] --
66
+ │ │ │ │ │ │ └─Linear: 7-15 [435, 116, 136] [435, 116, 112] 15,232
67
+ │ │ │ │ │ └─DropPath: 6-30 [435, 116, 112] [435, 116, 112] --
68
+ │ │ │ │ └─ParallelTransformerBlock: 5-11 [435, 116, 112] [435, 116, 112] --
69
+ │ │ │ │ │ └─LayerNorm: 6-31 [435, 116, 112] [435, 116, 112] 224
70
+ │ │ │ │ │ └─Linear: 6-32 [435, 116, 112] [435, 116, 1720] 192,640
71
+ │ │ │ │ │ └─Linear: 6-33 [435, 116, 528] [435, 116, 112] 59,136
72
+ │ │ │ │ │ └─DropPath: 6-34 [435, 116, 112] [435, 116, 112] --
73
+ │ │ │ │ │ └─Sequential: 6-35 [435, 116, 136] [435, 116, 112] --
74
+ │ │ │ │ │ │ └─GELU: 7-16 [435, 116, 136] [435, 116, 136] --
75
+ │ │ │ │ │ │ └─Dropout: 7-17 [435, 116, 136] [435, 116, 136] --
76
+ │ │ │ │ │ │ └─Linear: 7-18 [435, 116, 136] [435, 116, 112] 15,232
77
+ │ │ │ │ │ └─DropPath: 6-36 [435, 116, 112] [435, 116, 112] --
78
+ │ │ │ │ └─ParallelTransformerBlock: 5-12 [435, 116, 112] [435, 116, 112] --
79
+ │ │ │ │ │ └─LayerNorm: 6-37 [435, 116, 112] [435, 116, 112] 224
80
+ │ │ │ │ │ └─Linear: 6-38 [435, 116, 112] [435, 116, 1720] 192,640
81
+ │ │ │ │ │ └─Linear: 6-39 [435, 116, 528] [435, 116, 112] 59,136
82
+ │ │ │ │ │ └─DropPath: 6-40 [435, 116, 112] [435, 116, 112] --
83
+ │ │ │ │ │ └─Sequential: 6-41 [435, 116, 136] [435, 116, 112] --
84
+ │ │ │ │ │ │ └─GELU: 7-19 [435, 116, 136] [435, 116, 136] --
85
+ │ │ │ │ │ │ └─Dropout: 7-20 [435, 116, 136] [435, 116, 136] --
86
+ │ │ │ │ │ │ └─Linear: 7-21 [435, 116, 136] [435, 116, 112] 15,232
87
+ │ │ │ │ │ └─DropPath: 6-42 [435, 116, 112] [435, 116, 112] --
88
+ │ │ │ │ └─ParallelTransformerBlock: 5-13 [435, 116, 112] [435, 116, 112] --
89
+ │ │ │ │ │ └─LayerNorm: 6-43 [435, 116, 112] [435, 116, 112] 224
90
+ │ │ │ │ │ └─Linear: 6-44 [435, 116, 112] [435, 116, 1720] 192,640
91
+ │ │ │ │ │ └─Linear: 6-45 [435, 116, 528] [435, 116, 112] 59,136
92
+ │ │ │ │ │ └─DropPath: 6-46 [435, 116, 112] [435, 116, 112] --
93
+ │ │ │ │ │ └─Sequential: 6-47 [435, 116, 136] [435, 116, 112] --
94
+ │ │ │ │ │ │ └─GELU: 7-22 [435, 116, 136] [435, 116, 136] --
95
+ │ │ │ │ │ │ └─Dropout: 7-23 [435, 116, 136] [435, 116, 136] --
96
+ │ │ │ │ │ │ └─Linear: 7-24 [435, 116, 136] [435, 116, 112] 15,232
97
+ │ │ │ │ │ └─DropPath: 6-48 [435, 116, 112] [435, 116, 112] --
98
+ │ │ └─Rearrange: 3-4 [1, 116, 435, 112] [1, 112, 116, 15, 29] --
99
+ ├─MLPShifters: 1-2 -- [1, 2, 116] 513
100
+ │ └─MLPShifter: 2-2 [116, 2] [116, 2] --
101
+ │ │ └─Sequential: 3-5 [116, 2] [116, 2] --
102
+ │ │ │ └─Linear: 4-4 [116, 2] [116, 5] 15
103
+ │ │ │ └─Tanh: 4-5 [116, 5] [116, 5] --
104
+ │ │ │ └─Linear: 4-6 [116, 5] [116, 5] 30
105
+ │ │ │ └─Tanh: 4-7 [116, 5] [116, 5] --
106
+ │ │ │ └─Linear: 4-8 [116, 5] [116, 2] 12
107
+ │ │ │ └─Tanh: 4-9 [116, 2] [116, 2] --
108
+ ├─Readouts: 1-3 [1, 112, 116, 15, 29] [1, 7440, 116] 8,477,649
109
+ │ └─Gaussian2DReadout2: 2-3 [1, 112, 116, 15, 29] [1, 7440, 116] 870,480
110
+ │ │ └─Sequential: 3-6 [7440, 2] [7440, 2] --
111
+ │ │ │ └─Linear: 4-10 [7440, 2] [7440, 30] 90
112
+ │ │ │ └─ELU: 4-11 [7440, 30] [7440, 30] --
113
+ │ │ │ └─Linear: 4-12 [7440, 30] [7440, 2] 62
114
+ │ │ │ └─Tanh: 4-13 [7440, 2] [7440, 2] --
115
+ │ │ └─Sequential: 3-7 [7440, 2] [7440, 2] (recursive)
116
+ │ │ │ └─Linear: 4-14 [7440, 2] [7440, 30] (recursive)
117
+ │ │ │ └─ELU: 4-15 [7440, 30] [7440, 30] --
118
+ │ │ │ └─Linear: 4-16 [7440, 30] [7440, 2] (recursive)
119
+ │ │ │ └─Tanh: 4-17 [7440, 2] [7440, 2] --
120
+ │ │ └─Sequential: 3-8 [7440, 2] [7440, 2] (recursive)
121
+ │ │ │ └─Linear: 4-18 [7440, 2] [7440, 30] (recursive)
122
+ │ │ │ └─ELU: 4-19 [7440, 30] [7440, 30] --
123
+ │ │ │ └─Linear: 4-20 [7440, 30] [7440, 2] (recursive)
124
+ │ │ │ └─Tanh: 4-21 [7440, 2] [7440, 2] --
125
+ │ │ └─Sequential: 3-9 [116, 4] [116, 112] --
126
+ │ │ │ └─Linear: 4-22 [116, 4] [116, 112] 560
127
+ │ │ │ └─LayerNorm: 4-23 [116, 112] [116, 112] 224
128
+ │ │ │ └─GELU: 4-24 [116, 112] [116, 112] --
129
+ │ │ │ └─Dropout: 4-25 [116, 112] [116, 112] --
130
+ │ │ │ └─Linear: 4-26 [116, 112] [116, 112] 12,656
131
+ │ │ │ └─Tanh: 4-27 [116, 112] [116, 112] --
132
+ ├─Exponential: 1-4 [1, 7440, 116] [1, 7440, 116] --
133
+ =======================================================================================================================================
134
+ Total params: 12,278,365
135
+ Trainable params: 12,278,365
136
+ Non-trainable params: 0
137
+ Total mult-adds (Units.MEGABYTES): 679.88
138
+ =======================================================================================================================================
139
+ Input size (MB): 1.29
140
+ Forward/backward pass size (MB): 9208.73
141
+ Params size (MB): 11.40
142
+ Estimated Total Size (MB): 9221.42
143
+ =======================================================================================================================================
002/output.log ADDED
@@ -0,0 +1,942 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Use bfloat16 for core module.
2
+ Use parallel attention and MLP in ViViT.
3
+
4
+ Epoch 001/400
5
+ Train loss: 121388096.00 correlation: 0.0109
6
+ Validation loss: 200734000.00 correlation: 0.0221
7
+ Elapse: 522.91s
8
+
9
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
10
+
11
+ Epoch 002/400
12
+ Train loss: 98318960.00 correlation: 0.0308
13
+ Validation loss: 199955104.00 correlation: 0.0339
14
+ Elapse: 525.64s
15
+
16
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
17
+
18
+ Epoch 003/400
19
+ Train loss: 97097640.00 correlation: 0.0413
20
+ Validation loss: 199270752.00 correlation: 0.0396
21
+ Elapse: 531.95s
22
+
23
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
24
+
25
+ Epoch 004/400
26
+ Train loss: 96457752.00 correlation: 0.0479
27
+ Validation loss: 198723456.00 correlation: 0.0421
28
+ Elapse: 536.86s
29
+
30
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
31
+
32
+ Epoch 005/400
33
+ Train loss: 95920056.00 correlation: 0.0541
34
+ Validation loss: 197835248.00 correlation: 0.0461
35
+ Elapse: 538.89s
36
+
37
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
38
+
39
+ Epoch 006/400
40
+ Train loss: 95131240.00 correlation: 0.0621
41
+ Validation loss: 196873360.00 correlation: 0.0519
42
+ Elapse: 542.34s
43
+
44
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
45
+
46
+ Epoch 007/400
47
+ Train loss: 94226616.00 correlation: 0.0710
48
+ Validation loss: 195726576.00 correlation: 0.0578
49
+ Elapse: 541.43s
50
+
51
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
52
+
53
+ Epoch 008/400
54
+ Train loss: 93506680.00 correlation: 0.0783
55
+ Validation loss: 194520016.00 correlation: 0.0654
56
+ Elapse: 541.56s
57
+
58
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
59
+
60
+ Epoch 009/400
61
+ Train loss: 92727504.00 correlation: 0.0871
62
+ Validation loss: 193465776.00 correlation: 0.0716
63
+ Elapse: 543.31s
64
+
65
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
66
+
67
+ Epoch 010/400
68
+ Train loss: 91843728.00 correlation: 0.0966
69
+ Validation loss: 192176672.00 correlation: 0.0791
70
+ Elapse: 541.68s
71
+
72
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
73
+
74
+ Epoch 011/400
75
+ Train loss: 90936304.00 correlation: 0.1063
76
+ Validation loss: 190695968.00 correlation: 0.0928
77
+ Elapse: 540.29s
78
+
79
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
80
+
81
+ Epoch 012/400
82
+ Train loss: 90051912.00 correlation: 0.1153
83
+ Validation loss: 189604784.00 correlation: 0.1011
84
+ Elapse: 542.29s
85
+
86
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
87
+
88
+ Epoch 013/400
89
+ Train loss: 89180568.00 correlation: 0.1245
90
+ Validation loss: 188031648.00 correlation: 0.1112
91
+ Elapse: 542.62s
92
+
93
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
94
+
95
+ Epoch 014/400
96
+ Train loss: 88307792.00 correlation: 0.1337
97
+ Validation loss: 186159440.00 correlation: 0.1226
98
+ Elapse: 540.81s
99
+
100
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
101
+
102
+ Epoch 015/400
103
+ Train loss: 87278960.00 correlation: 0.1436
104
+ Validation loss: 184683440.00 correlation: 0.1313
105
+ Elapse: 543.63s
106
+
107
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
108
+
109
+ Epoch 016/400
110
+ Train loss: 86609264.00 correlation: 0.1505
111
+ Validation loss: 183679264.00 correlation: 0.1374
112
+ Elapse: 544.07s
113
+
114
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
115
+
116
+ Epoch 017/400
117
+ Train loss: 85933704.00 correlation: 0.1573
118
+ Validation loss: 182858960.00 correlation: 0.1427
119
+ Elapse: 543.60s
120
+
121
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
122
+
123
+ Epoch 018/400
124
+ Train loss: 85316224.00 correlation: 0.1634
125
+ Validation loss: 181758608.00 correlation: 0.1502
126
+ Elapse: 543.09s
127
+
128
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
129
+
130
+ Epoch 019/400
131
+ Train loss: 84800144.00 correlation: 0.1686
132
+ Validation loss: 181267248.00 correlation: 0.1538
133
+ Elapse: 545.10s
134
+
135
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
136
+
137
+ Epoch 020/400
138
+ Train loss: 84276656.00 correlation: 0.1737
139
+ Validation loss: 180435344.00 correlation: 0.1578
140
+ Elapse: 545.34s
141
+
142
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
143
+
144
+ Epoch 021/400
145
+ Train loss: 83717728.00 correlation: 0.1793
146
+ Validation loss: 179796752.00 correlation: 0.1639
147
+ Elapse: 545.93s
148
+
149
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
150
+
151
+ Epoch 022/400
152
+ Train loss: 83306056.00 correlation: 0.1836
153
+ Validation loss: 178887952.00 correlation: 0.1689
154
+ Elapse: 545.45s
155
+
156
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
157
+
158
+ Epoch 023/400
159
+ Train loss: 82787680.00 correlation: 0.1887
160
+ Validation loss: 177999440.00 correlation: 0.1749
161
+ Elapse: 545.47s
162
+
163
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
164
+
165
+ Epoch 024/400
166
+ Train loss: 82335960.00 correlation: 0.1933
167
+ Validation loss: 177650256.00 correlation: 0.1774
168
+ Elapse: 545.75s
169
+
170
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
171
+
172
+ Epoch 025/400
173
+ Train loss: 82013392.00 correlation: 0.1962
174
+ Validation loss: 177572752.00 correlation: 0.1786
175
+ Elapse: 545.69s
176
+
177
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
178
+
179
+ Epoch 026/400
180
+ Train loss: 81675472.00 correlation: 0.1996
181
+ Validation loss: 176845120.00 correlation: 0.1841
182
+ Elapse: 545.58s
183
+
184
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
185
+
186
+ Epoch 027/400
187
+ Train loss: 81393008.00 correlation: 0.2025
188
+ Validation loss: 176056032.00 correlation: 0.1886
189
+ Elapse: 545.76s
190
+
191
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
192
+
193
+ Epoch 028/400
194
+ Train loss: 80972248.00 correlation: 0.2065
195
+ Validation loss: 175799008.00 correlation: 0.1898
196
+ Elapse: 545.76s
197
+
198
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
199
+
200
+ Epoch 029/400
201
+ Train loss: 80749744.00 correlation: 0.2086
202
+ Validation loss: 175376608.00 correlation: 0.1918
203
+ Elapse: 546.06s
204
+
205
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
206
+
207
+ Epoch 030/400
208
+ Train loss: 80453840.00 correlation: 0.2117
209
+ Validation loss: 174830400.00 correlation: 0.1967
210
+ Elapse: 546.10s
211
+
212
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
213
+
214
+ Epoch 031/400
215
+ Train loss: 80186704.00 correlation: 0.2145
216
+ Validation loss: 174322544.00 correlation: 0.1984
217
+ Elapse: 545.45s
218
+
219
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
220
+
221
+ Epoch 032/400
222
+ Train loss: 79856432.00 correlation: 0.2176
223
+ Validation loss: 174104672.00 correlation: 0.2003
224
+ Elapse: 545.77s
225
+
226
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
227
+
228
+ Epoch 033/400
229
+ Train loss: 79589576.00 correlation: 0.2200
230
+ Validation loss: 173607248.00 correlation: 0.2031
231
+ Elapse: 545.80s
232
+
233
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
234
+
235
+ Epoch 034/400
236
+ Train loss: 79380120.00 correlation: 0.2221
237
+ Validation loss: 173319472.00 correlation: 0.2055
238
+ Elapse: 545.70s
239
+
240
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
241
+
242
+ Epoch 035/400
243
+ Train loss: 79158640.00 correlation: 0.2243
244
+ Validation loss: 172901472.00 correlation: 0.2089
245
+ Elapse: 545.61s
246
+
247
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
248
+
249
+ Epoch 036/400
250
+ Train loss: 78927200.00 correlation: 0.2266
251
+ Validation loss: 172636560.00 correlation: 0.2097
252
+ Elapse: 546.53s
253
+
254
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
255
+
256
+ Epoch 037/400
257
+ Train loss: 78682176.00 correlation: 0.2288
258
+ Validation loss: 172407184.00 correlation: 0.2118
259
+ Elapse: 545.83s
260
+
261
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
262
+
263
+ Epoch 038/400
264
+ Train loss: 78582504.00 correlation: 0.2299
265
+ Validation loss: 172238496.00 correlation: 0.2137
266
+ Elapse: 542.71s
267
+
268
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
269
+
270
+ Epoch 039/400
271
+ Train loss: 78397632.00 correlation: 0.2314
272
+ Validation loss: 171969648.00 correlation: 0.2147
273
+ Elapse: 545.53s
274
+
275
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
276
+
277
+ Epoch 040/400
278
+ Train loss: 78234600.00 correlation: 0.2330
279
+ Validation loss: 171758000.00 correlation: 0.2170
280
+ Elapse: 545.77s
281
+
282
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
283
+
284
+ Epoch 041/400
285
+ Train loss: 78047656.00 correlation: 0.2349
286
+ Validation loss: 171651168.00 correlation: 0.2175
287
+ Elapse: 545.10s
288
+
289
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
290
+
291
+ Epoch 042/400
292
+ Train loss: 77868808.00 correlation: 0.2362
293
+ Validation loss: 171537312.00 correlation: 0.2173
294
+ Elapse: 545.58s
295
+
296
+ Epoch 043/400
297
+ Train loss: 77839128.00 correlation: 0.2370
298
+ Validation loss: 171300016.00 correlation: 0.2185
299
+ Elapse: 546.30s
300
+
301
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
302
+
303
+ Epoch 044/400
304
+ Train loss: 77629288.00 correlation: 0.2390
305
+ Validation loss: 171374944.00 correlation: 0.2191
306
+ Elapse: 546.42s
307
+
308
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
309
+
310
+ Epoch 045/400
311
+ Train loss: 77550776.00 correlation: 0.2396
312
+ Validation loss: 171207344.00 correlation: 0.2194
313
+ Elapse: 545.96s
314
+
315
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
316
+
317
+ Epoch 046/400
318
+ Train loss: 77437640.00 correlation: 0.2408
319
+ Validation loss: 171176240.00 correlation: 0.2198
320
+ Elapse: 546.38s
321
+
322
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
323
+
324
+ Epoch 047/400
325
+ Train loss: 77397712.00 correlation: 0.2412
326
+ Validation loss: 170808800.00 correlation: 0.2224
327
+ Elapse: 545.84s
328
+
329
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
330
+
331
+ Epoch 048/400
332
+ Train loss: 77307432.00 correlation: 0.2422
333
+ Validation loss: 170735520.00 correlation: 0.2233
334
+ Elapse: 546.33s
335
+
336
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
337
+
338
+ Epoch 049/400
339
+ Train loss: 77119432.00 correlation: 0.2439
340
+ Validation loss: 170442368.00 correlation: 0.2245
341
+ Elapse: 545.45s
342
+
343
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
344
+
345
+ Epoch 050/400
346
+ Train loss: 76988832.00 correlation: 0.2449
347
+ Validation loss: 170672960.00 correlation: 0.2232
348
+ Elapse: 544.34s
349
+
350
+ Epoch 051/400
351
+ Train loss: 76992464.00 correlation: 0.2450
352
+ Validation loss: 170562112.00 correlation: 0.2244
353
+ Elapse: 545.56s
354
+
355
+ Epoch 052/400
356
+ Train loss: 76925112.00 correlation: 0.2452
357
+ Validation loss: 170404016.00 correlation: 0.2248
358
+ Elapse: 545.72s
359
+
360
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
361
+
362
+ Epoch 053/400
363
+ Train loss: 76844464.00 correlation: 0.2460
364
+ Validation loss: 170137952.00 correlation: 0.2261
365
+ Elapse: 545.92s
366
+
367
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
368
+
369
+ Epoch 054/400
370
+ Train loss: 76812920.00 correlation: 0.2469
371
+ Validation loss: 170023120.00 correlation: 0.2259
372
+ Elapse: 545.56s
373
+
374
+ Epoch 055/400
375
+ Train loss: 76702536.00 correlation: 0.2475
376
+ Validation loss: 170054384.00 correlation: 0.2263
377
+ Elapse: 544.95s
378
+
379
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
380
+
381
+ Epoch 056/400
382
+ Train loss: 76612752.00 correlation: 0.2485
383
+ Validation loss: 170032864.00 correlation: 0.2272
384
+ Elapse: 545.49s
385
+
386
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
387
+
388
+ Epoch 057/400
389
+ Train loss: 76617696.00 correlation: 0.2485
390
+ Validation loss: 169630816.00 correlation: 0.2293
391
+ Elapse: 545.90s
392
+
393
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
394
+
395
+ Epoch 058/400
396
+ Train loss: 76465880.00 correlation: 0.2499
397
+ Validation loss: 169825600.00 correlation: 0.2283
398
+ Elapse: 545.37s
399
+
400
+ Epoch 059/400
401
+ Train loss: 76456912.00 correlation: 0.2499
402
+ Validation loss: 169766688.00 correlation: 0.2284
403
+ Elapse: 545.61s
404
+
405
+ Epoch 060/400
406
+ Train loss: 76426872.00 correlation: 0.2501
407
+ Validation loss: 169651072.00 correlation: 0.2298
408
+ Elapse: 545.66s
409
+
410
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
411
+
412
+ Epoch 061/400
413
+ Train loss: 76272176.00 correlation: 0.2515
414
+ Validation loss: 169694896.00 correlation: 0.2290
415
+ Elapse: 544.26s
416
+
417
+ Epoch 062/400
418
+ Train loss: 76381040.00 correlation: 0.2506
419
+ Validation loss: 169396208.00 correlation: 0.2316
420
+ Elapse: 544.91s
421
+
422
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
423
+
424
+ Epoch 063/400
425
+ Train loss: 76206744.00 correlation: 0.2523
426
+ Validation loss: 169683888.00 correlation: 0.2297
427
+ Elapse: 544.69s
428
+
429
+ Epoch 064/400
430
+ Train loss: 76167792.00 correlation: 0.2527
431
+ Validation loss: 169194928.00 correlation: 0.2329
432
+ Elapse: 545.55s
433
+
434
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
435
+
436
+ Epoch 065/400
437
+ Train loss: 76127384.00 correlation: 0.2528
438
+ Validation loss: 169763808.00 correlation: 0.2287
439
+ Elapse: 545.54s
440
+
441
+ Epoch 066/400
442
+ Train loss: 76104336.00 correlation: 0.2531
443
+ Validation loss: 169165280.00 correlation: 0.2327
444
+ Elapse: 545.65s
445
+
446
+ Epoch 067/400
447
+ Train loss: 76021512.00 correlation: 0.2539
448
+ Validation loss: 169219872.00 correlation: 0.2317
449
+ Elapse: 545.30s
450
+
451
+ Epoch 068/400
452
+ Train loss: 76148160.00 correlation: 0.2528
453
+ Validation loss: 169344656.00 correlation: 0.2314
454
+ Elapse: 545.59s
455
+
456
+ Epoch 069/400
457
+ Train loss: 75939984.00 correlation: 0.2545
458
+ Validation loss: 169043376.00 correlation: 0.2339
459
+ Elapse: 545.18s
460
+
461
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
462
+
463
+ Epoch 070/400
464
+ Train loss: 75822872.00 correlation: 0.2557
465
+ Validation loss: 169167760.00 correlation: 0.2328
466
+ Elapse: 544.88s
467
+
468
+ Epoch 071/400
469
+ Train loss: 75873072.00 correlation: 0.2551
470
+ Validation loss: 169123712.00 correlation: 0.2336
471
+ Elapse: 545.60s
472
+
473
+ Epoch 072/400
474
+ Train loss: 75867984.00 correlation: 0.2552
475
+ Validation loss: 168947232.00 correlation: 0.2344
476
+ Elapse: 545.61s
477
+
478
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
479
+
480
+ Epoch 073/400
481
+ Train loss: 75840912.00 correlation: 0.2555
482
+ Validation loss: 169026784.00 correlation: 0.2348
483
+ Elapse: 545.60s
484
+
485
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
486
+
487
+ Epoch 074/400
488
+ Train loss: 75855384.00 correlation: 0.2555
489
+ Validation loss: 168842592.00 correlation: 0.2341
490
+ Elapse: 545.99s
491
+
492
+ Epoch 075/400
493
+ Train loss: 75737744.00 correlation: 0.2565
494
+ Validation loss: 168971312.00 correlation: 0.2336
495
+ Elapse: 545.40s
496
+
497
+ Epoch 076/400
498
+ Train loss: 75735656.00 correlation: 0.2565
499
+ Validation loss: 168829920.00 correlation: 0.2338
500
+ Elapse: 546.00s
501
+
502
+ Epoch 077/400
503
+ Train loss: 75607888.00 correlation: 0.2576
504
+ Validation loss: 168935968.00 correlation: 0.2349
505
+ Elapse: 545.47s
506
+
507
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
508
+
509
+ Epoch 078/400
510
+ Train loss: 75679128.00 correlation: 0.2571
511
+ Validation loss: 168987280.00 correlation: 0.2328
512
+ Elapse: 545.11s
513
+
514
+ Epoch 079/400
515
+ Train loss: 75621152.00 correlation: 0.2574
516
+ Validation loss: 168822512.00 correlation: 0.2347
517
+ Elapse: 545.59s
518
+
519
+ Epoch 080/400
520
+ Train loss: 75483728.00 correlation: 0.2590
521
+ Validation loss: 168774416.00 correlation: 0.2347
522
+ Elapse: 545.47s
523
+
524
+ Epoch 081/400
525
+ Train loss: 75531304.00 correlation: 0.2586
526
+ Validation loss: 169126304.00 correlation: 0.2331
527
+ Elapse: 545.29s
528
+
529
+ Epoch 082/400
530
+ Train loss: 75558736.00 correlation: 0.2583
531
+ Validation loss: 168670160.00 correlation: 0.2354
532
+ Elapse: 545.72s
533
+
534
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
535
+
536
+ Epoch 083/400
537
+ Train loss: 75590176.00 correlation: 0.2579
538
+ Validation loss: 169091472.00 correlation: 0.2330
539
+ Elapse: 545.76s
540
+
541
+ Epoch 084/400
542
+ Train loss: 75406416.00 correlation: 0.2595
543
+ Validation loss: 169084192.00 correlation: 0.2329
544
+ Elapse: 545.78s
545
+
546
+ Epoch 085/400
547
+ Train loss: 75376912.00 correlation: 0.2599
548
+ Validation loss: 168861952.00 correlation: 0.2341
549
+ Elapse: 545.89s
550
+
551
+ Epoch 086/400
552
+ Train loss: 75349048.00 correlation: 0.2604
553
+ Validation loss: 168882304.00 correlation: 0.2349
554
+ Elapse: 545.73s
555
+
556
+ Epoch 087/400
557
+ Train loss: 75302984.00 correlation: 0.2607
558
+ Validation loss: 169006784.00 correlation: 0.2333
559
+ Elapse: 545.26s
560
+
561
+ Loaded checkpoint from epoch 82 (correlation: 0.2354).
562
+
563
+ Reduce learning rate of core to 1.4400e-03 (num. reduce: 1).
564
+ Reduce learning rate of readouts to 1.0800e-03 (num. reduce: 1).
565
+ Reduce learning rate of shifters to 1.0800e-03 (num. reduce: 1).
566
+
567
+ Epoch 088/400
568
+ Train loss: 73472912.00 correlation: 0.2760
569
+ Validation loss: 166967968.00 correlation: 0.2466
570
+ Elapse: 546.46s
571
+
572
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
573
+
574
+ Epoch 089/400
575
+ Train loss: 72834528.00 correlation: 0.2820
576
+ Validation loss: 166834160.00 correlation: 0.2485
577
+ Elapse: 546.50s
578
+
579
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
580
+
581
+ Epoch 090/400
582
+ Train loss: 72607408.00 correlation: 0.2844
583
+ Validation loss: 166764992.00 correlation: 0.2490
584
+ Elapse: 546.18s
585
+
586
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
587
+
588
+ Epoch 091/400
589
+ Train loss: 72571872.00 correlation: 0.2846
590
+ Validation loss: 166824368.00 correlation: 0.2476
591
+ Elapse: 546.25s
592
+
593
+ Epoch 092/400
594
+ Train loss: 72491600.00 correlation: 0.2854
595
+ Validation loss: 166791872.00 correlation: 0.2474
596
+ Elapse: 545.90s
597
+
598
+ Epoch 093/400
599
+ Train loss: 72479560.00 correlation: 0.2856
600
+ Validation loss: 166900064.00 correlation: 0.2473
601
+ Elapse: 546.88s
602
+
603
+ Epoch 094/400
604
+ Train loss: 72391640.00 correlation: 0.2867
605
+ Validation loss: 166895872.00 correlation: 0.2471
606
+ Elapse: 546.67s
607
+
608
+ Epoch 095/400
609
+ Train loss: 72406800.00 correlation: 0.2865
610
+ Validation loss: 166785824.00 correlation: 0.2477
611
+ Elapse: 546.76s
612
+
613
+ Loaded checkpoint from epoch 90 (correlation: 0.2490).
614
+
615
+ Reduce learning rate of core to 4.3200e-04 (num. reduce: 1).
616
+ Reduce learning rate of readouts to 3.2400e-04 (num. reduce: 1).
617
+ Reduce learning rate of shifters to 3.2400e-04 (num. reduce: 1).
618
+
619
+ Epoch 096/400
620
+ Train loss: 71820392.00 correlation: 0.2914
621
+ Validation loss: 166357664.00 correlation: 0.2510
622
+ Elapse: 546.29s
623
+
624
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
625
+
626
+ Epoch 097/400
627
+ Train loss: 71646128.00 correlation: 0.2926
628
+ Validation loss: 166358480.00 correlation: 0.2512
629
+ Elapse: 546.63s
630
+
631
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
632
+
633
+ Epoch 098/400
634
+ Train loss: 71469944.00 correlation: 0.2943
635
+ Validation loss: 166261168.00 correlation: 0.2520
636
+ Elapse: 547.33s
637
+
638
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
639
+
640
+ Epoch 099/400
641
+ Train loss: 71457032.00 correlation: 0.2945
642
+ Validation loss: 166242256.00 correlation: 0.2517
643
+ Elapse: 547.22s
644
+
645
+ Epoch 100/400
646
+ Train loss: 71381520.00 correlation: 0.2953
647
+ Validation loss: 166269072.00 correlation: 0.2516
648
+ Elapse: 546.93s
649
+
650
+ Epoch 101/400
651
+ Train loss: 71365904.00 correlation: 0.2954
652
+ Validation loss: 166306016.00 correlation: 0.2512
653
+ Elapse: 547.14s
654
+
655
+ Epoch 102/400
656
+ Train loss: 71313408.00 correlation: 0.2956
657
+ Validation loss: 166202720.00 correlation: 0.2520
658
+ Elapse: 547.18s
659
+
660
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
661
+
662
+ Epoch 103/400
663
+ Train loss: 71246520.00 correlation: 0.2963
664
+ Validation loss: 166201664.00 correlation: 0.2519
665
+ Elapse: 546.59s
666
+
667
+ Epoch 104/400
668
+ Train loss: 71237544.00 correlation: 0.2967
669
+ Validation loss: 166225280.00 correlation: 0.2516
670
+ Elapse: 546.47s
671
+
672
+ Epoch 105/400
673
+ Train loss: 71175248.00 correlation: 0.2973
674
+ Validation loss: 166234304.00 correlation: 0.2515
675
+ Elapse: 546.73s
676
+
677
+ Epoch 106/400
678
+ Train loss: 71139096.00 correlation: 0.2976
679
+ Validation loss: 166179840.00 correlation: 0.2518
680
+ Elapse: 547.27s
681
+
682
+ Epoch 107/400
683
+ Train loss: 71152664.00 correlation: 0.2972
684
+ Validation loss: 166277328.00 correlation: 0.2509
685
+ Elapse: 547.28s
686
+
687
+ Loaded checkpoint from epoch 102 (correlation: 0.2520).
688
+
689
+ Reduce learning rate of core to 1.2960e-04 (num. reduce: 1).
690
+ Reduce learning rate of readouts to 9.7200e-05 (num. reduce: 1).
691
+ Reduce learning rate of shifters to 9.7200e-05 (num. reduce: 1).
692
+
693
+ Epoch 108/400
694
+ Train loss: 70975272.00 correlation: 0.2990
695
+ Validation loss: 166102416.00 correlation: 0.2526
696
+ Elapse: 547.38s
697
+
698
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
699
+
700
+ Epoch 109/400
701
+ Train loss: 70927400.00 correlation: 0.2990
702
+ Validation loss: 166090848.00 correlation: 0.2526
703
+ Elapse: 547.10s
704
+
705
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
706
+
707
+ Epoch 110/400
708
+ Train loss: 70928176.00 correlation: 0.2993
709
+ Validation loss: 166087520.00 correlation: 0.2526
710
+ Elapse: 547.24s
711
+
712
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
713
+
714
+ Epoch 111/400
715
+ Train loss: 70948912.00 correlation: 0.2989
716
+ Validation loss: 166067424.00 correlation: 0.2526
717
+ Elapse: 547.30s
718
+
719
+ Epoch 112/400
720
+ Train loss: 70843856.00 correlation: 0.2999
721
+ Validation loss: 166089904.00 correlation: 0.2527
722
+ Elapse: 547.44s
723
+
724
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
725
+
726
+ Epoch 113/400
727
+ Train loss: 70930864.00 correlation: 0.2991
728
+ Validation loss: 166048192.00 correlation: 0.2527
729
+ Elapse: 547.22s
730
+
731
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
732
+
733
+ Epoch 114/400
734
+ Train loss: 70888224.00 correlation: 0.2998
735
+ Validation loss: 166076336.00 correlation: 0.2525
736
+ Elapse: 547.07s
737
+
738
+ Epoch 115/400
739
+ Train loss: 70807400.00 correlation: 0.3003
740
+ Validation loss: 166078992.00 correlation: 0.2524
741
+ Elapse: 547.34s
742
+
743
+ Epoch 116/400
744
+ Train loss: 70784824.00 correlation: 0.3006
745
+ Validation loss: 166036512.00 correlation: 0.2528
746
+ Elapse: 547.33s
747
+
748
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
749
+
750
+ Epoch 117/400
751
+ Train loss: 70760888.00 correlation: 0.3007
752
+ Validation loss: 166109792.00 correlation: 0.2523
753
+ Elapse: 547.36s
754
+
755
+ Epoch 118/400
756
+ Train loss: 70793224.00 correlation: 0.3003
757
+ Validation loss: 166033088.00 correlation: 0.2527
758
+ Elapse: 547.66s
759
+
760
+ Epoch 119/400
761
+ Train loss: 70801416.00 correlation: 0.3002
762
+ Validation loss: 166062960.00 correlation: 0.2529
763
+ Elapse: 547.68s
764
+
765
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
766
+
767
+ Epoch 120/400
768
+ Train loss: 70748944.00 correlation: 0.3009
769
+ Validation loss: 166063152.00 correlation: 0.2524
770
+ Elapse: 547.18s
771
+
772
+ Epoch 121/400
773
+ Train loss: 70736464.00 correlation: 0.3010
774
+ Validation loss: 166058976.00 correlation: 0.2528
775
+ Elapse: 547.53s
776
+
777
+ Epoch 122/400
778
+ Train loss: 70653008.00 correlation: 0.3019
779
+ Validation loss: 166041920.00 correlation: 0.2527
780
+ Elapse: 547.68s
781
+
782
+ Epoch 123/400
783
+ Train loss: 70723656.00 correlation: 0.3011
784
+ Validation loss: 166053344.00 correlation: 0.2525
785
+ Elapse: 547.37s
786
+
787
+ Epoch 124/400
788
+ Train loss: 70689936.00 correlation: 0.3016
789
+ Validation loss: 166053472.00 correlation: 0.2526
790
+ Elapse: 547.93s
791
+
792
+ Loaded checkpoint from epoch 119 (correlation: 0.2529).
793
+
794
+ Reduce learning rate of core to 3.8880e-05 (num. reduce: 1).
795
+ Reduce learning rate of readouts to 2.9160e-05 (num. reduce: 1).
796
+ Reduce learning rate of shifters to 2.9160e-05 (num. reduce: 1).
797
+
798
+ Epoch 125/400
799
+ Train loss: 70604440.00 correlation: 0.3023
800
+ Validation loss: 166025312.00 correlation: 0.2529
801
+ Elapse: 547.63s
802
+
803
+ Epoch 126/400
804
+ Train loss: 70608160.00 correlation: 0.3021
805
+ Validation loss: 166010512.00 correlation: 0.2530
806
+ Elapse: 547.36s
807
+
808
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
809
+
810
+ Epoch 127/400
811
+ Train loss: 70626448.00 correlation: 0.3020
812
+ Validation loss: 166023648.00 correlation: 0.2528
813
+ Elapse: 547.13s
814
+
815
+ Epoch 128/400
816
+ Train loss: 70612096.00 correlation: 0.3018
817
+ Validation loss: 166023216.00 correlation: 0.2529
818
+ Elapse: 546.99s
819
+
820
+ Epoch 129/400
821
+ Train loss: 70635640.00 correlation: 0.3020
822
+ Validation loss: 166036208.00 correlation: 0.2528
823
+ Elapse: 547.23s
824
+
825
+ Epoch 130/400
826
+ Train loss: 70666920.00 correlation: 0.3015
827
+ Validation loss: 166035808.00 correlation: 0.2527
828
+ Elapse: 546.99s
829
+
830
+ Epoch 131/400
831
+ Train loss: 70564592.00 correlation: 0.3028
832
+ Validation loss: 166005856.00 correlation: 0.2528
833
+ Elapse: 547.30s
834
+
835
+ Loaded checkpoint from epoch 126 (correlation: 0.2530).
836
+
837
+ Reduce learning rate of core to 1.1664e-05 (num. reduce: 1).
838
+ Reduce learning rate of readouts to 8.7480e-06 (num. reduce: 1).
839
+ Reduce learning rate of shifters to 8.7480e-06 (num. reduce: 1).
840
+
841
+ Epoch 132/400
842
+ Train loss: 70603848.00 correlation: 0.3022
843
+ Validation loss: 166004944.00 correlation: 0.2530
844
+ Elapse: 547.32s
845
+
846
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/009/ckpt/model_state.pt.
847
+
848
+ Epoch 133/400
849
+ Train loss: 70533872.00 correlation: 0.3031
850
+ Validation loss: 166019360.00 correlation: 0.2529
851
+ Elapse: 547.50s
852
+
853
+ Epoch 134/400
854
+ Train loss: 70635248.00 correlation: 0.3019
855
+ Validation loss: 166021888.00 correlation: 0.2529
856
+ Elapse: 547.34s
857
+
858
+ Epoch 135/400
859
+ Train loss: 70620176.00 correlation: 0.3020
860
+ Validation loss: 166009888.00 correlation: 0.2529
861
+ Elapse: 546.38s
862
+
863
+ Epoch 136/400
864
+ Train loss: 70572368.00 correlation: 0.3023
865
+ Validation loss: 166012144.00 correlation: 0.2529
866
+ Elapse: 547.10s
867
+
868
+ Epoch 137/400
869
+ Train loss: 70658640.00 correlation: 0.3016
870
+ Validation loss: 166018080.00 correlation: 0.2529
871
+ Elapse: 546.90s
872
+
873
+ Loaded checkpoint from epoch 132 (correlation: 0.2530).
874
+
875
+ Reduce learning rate of core to 3.4992e-06 (num. reduce: 1).
876
+ Reduce learning rate of readouts to 2.6244e-06 (num. reduce: 1).
877
+ Reduce learning rate of shifters to 2.6244e-06 (num. reduce: 1).
878
+
879
+ Epoch 138/400
880
+ Train loss: 70545520.00 correlation: 0.3026
881
+ Validation loss: 166011936.00 correlation: 0.2530
882
+ Elapse: 546.72s
883
+
884
+ Epoch 139/400
885
+ Train loss: 70622800.00 correlation: 0.3018
886
+ Validation loss: 166013088.00 correlation: 0.2529
887
+ Elapse: 547.01s
888
+
889
+ Epoch 140/400
890
+ Train loss: 70572936.00 correlation: 0.3025
891
+ Validation loss: 166013696.00 correlation: 0.2529
892
+ Elapse: 547.38s
893
+
894
+ Epoch 141/400
895
+ Train loss: 70624016.00 correlation: 0.3020
896
+ Validation loss: 166012496.00 correlation: 0.2530
897
+ Elapse: 546.98s
898
+
899
+ Epoch 142/400
900
+ Train loss: 70651392.00 correlation: 0.3018
901
+ Validation loss: 166017120.00 correlation: 0.2529
902
+ Elapse: 547.57s
903
+
904
+ Loaded checkpoint from epoch 132 (correlation: 0.2530).
905
+
906
+ Reduce learning rate of core to 1.0498e-06 (num. reduce: 2).
907
+ Reduce learning rate of readouts to 7.8732e-07 (num. reduce: 2).
908
+ Reduce learning rate of shifters to 7.8732e-07 (num. reduce: 2).
909
+
910
+ Epoch 143/400
911
+ Train loss: 70616608.00 correlation: 0.3018
912
+ Validation loss: 166009488.00 correlation: 0.2530
913
+ Elapse: 547.46s
914
+
915
+ Epoch 144/400
916
+ Train loss: 70557224.00 correlation: 0.3027
917
+ Validation loss: 166010240.00 correlation: 0.2530
918
+ Elapse: 547.42s
919
+
920
+ Epoch 145/400
921
+ Train loss: 70617064.00 correlation: 0.3020
922
+ Validation loss: 166011824.00 correlation: 0.2530
923
+ Elapse: 547.48s
924
+
925
+ Epoch 146/400
926
+ Train loss: 70601720.00 correlation: 0.3022
927
+ Validation loss: 166010880.00 correlation: 0.2530
928
+ Elapse: 547.26s
929
+
930
+ Epoch 147/400
931
+ Train loss: 70616768.00 correlation: 0.3021
932
+ Validation loss: 166012944.00 correlation: 0.2530
933
+ Elapse: 547.43s
934
+
935
+ Model has not improved after 2 LR reductions.
936
+
937
+ Loaded checkpoint from epoch 132 (correlation: 0.2530).
938
+
939
+
940
+ ValidationA: 0.2508 B: 0.2804 C: 0.2750 D: 0.2393 E: 0.2390 F: 0.2346 G: 0.2573 H: 0.2379 I: 0.2555 J: 0.2599 average: 0.2530
941
+
942
+ Results saved to /home/storage/runs/vivit_ensemble/009.
003/args.yaml ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_eps: 1e-08
4
+ batch_size: 6
5
+ cache_data: false
6
+ center_crop: 1.0
7
+ clear_output_dir: true
8
+ core: vivit
9
+ core_behavior_mode: 2
10
+ core_compile: false
11
+ core_drop_path: 0.0505
12
+ core_emb_dim: 112
13
+ core_ff_activation: gelu
14
+ core_ff_dropout: 0.0592
15
+ core_flash_attention: 1
16
+ core_head_dim: 48
17
+ core_lr: 0.0048
18
+ core_mha_dropout: 0.358
19
+ core_mlp_dim: 136
20
+ core_norm_qk: false
21
+ core_num_heads: 11
22
+ core_p_dropout: 0.1338
23
+ core_parallel_attention: true
24
+ core_patch_mode: 0
25
+ core_pos_encoding: 3
26
+ core_spatial_depth: 3
27
+ core_spatial_patch_size: 7
28
+ core_spatial_patch_stride: 2
29
+ core_temporal_depth: 5
30
+ core_temporal_patch_size: 25
31
+ core_temporal_patch_stride: 1
32
+ core_weight_decay: 0.1789
33
+ criterion: poisson_correlation
34
+ critic_mode: 0
35
+ crop_frame: 140
36
+ data: /home/sensorium2023
37
+ deterministic: false
38
+ device: cuda
39
+ dpi: 120
40
+ ds_mode: 3
41
+ ds_scale: 1
42
+ epochs: 400
43
+ format: svg
44
+ git_hash: 1033c29
45
+ grad_checkpointing: 0
46
+ grad_norm: null
47
+ input_shapes:
48
+ behavior: [2, 140]
49
+ pupil_center: [2, 140]
50
+ video: [1, 140, 36, 64]
51
+ limit_data: null
52
+ lr: 0.0036
53
+ max_frame: 300
54
+ micro_batch_size: 6
55
+ modulator_mode: 0
56
+ mouse_ids: [A, B, C, D, E, F, G, H, I, J]
57
+ num_workers: 2
58
+ output_dir: /home/storage/runs/003
59
+ output_mode: 1
60
+ output_shapes:
61
+ A: [7440, 140]
62
+ B: [7928, 140]
63
+ C: [8285, 140]
64
+ D: [7671, 140]
65
+ E: [7495, 140]
66
+ F: [7863, 140]
67
+ G: [7908, 140]
68
+ H: [8202, 140]
69
+ I: [7939, 140]
70
+ J: [8122, 140]
71
+ precision: "32"
72
+ pretrain_core: null
73
+ readout: gaussian2d
74
+ readout_bias_mode: 2
75
+ readout_dropout: 0.0
76
+ readout_grid_mode: 1
77
+ restore: null
78
+ save_plots: false
79
+ seed: 12
80
+ shifter_layers: 3
81
+ shifter_mode: 1
82
+ shifter_size: 5
83
+ stat_mode: 1
84
+ trainable_params: 12278365
85
+ transform_mode: 2
86
+ verbose: 1
87
+ weight_decay: 0.3939
003/ckpt/model_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09874ebf6e03ea617ccd08af30de997d9ca2d372fd68f9fe26696e58b675f025
3
+ size 148268583
003/evaluation.yaml ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ validation: {A: 0.24746963381767273, B: 0.27505889534950256, C: 0.27303239703178406,
2
+ D: 0.23642510175704956, E: 0.23546315729618073, F: 0.23425357043743134, G: 0.2543371021747589,
3
+ H: 0.23437707126140594, I: 0.2602153420448303, J: 0.2588430643081665, average: 0.25094753354787824}
003/model.txt ADDED
@@ -0,0 +1,143 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ =======================================================================================================================================
2
+ Layer (type:depth-idx) Input Shape Output Shape Param #
3
+ =======================================================================================================================================
4
+ Model -- [1, 7440, 116] --
5
+ ├─ViViTCore: 1-1 -- [1, 112, 116, 15, 29] --
6
+ │ └─ViViT: 2-1 [1, 5, 140, 36, 64] [1, 112, 116, 15, 29] --
7
+ │ │ └─Tokenizer: 3-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] 79,632
8
+ │ │ │ └─Sequential: 4-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] --
9
+ │ │ │ │ └─Unfold3d: 5-1 [1, 5, 140, 36, 64] [1, 116, 435, 6125] --
10
+ │ │ │ │ └─LayerNorm: 5-2 [1, 116, 435, 6125] [1, 116, 435, 6125] 12,250
11
+ │ │ │ │ └─Linear: 5-3 [1, 116, 435, 6125] [1, 116, 435, 112] 686,112
12
+ │ │ │ │ └─LayerNorm: 5-4 [1, 116, 435, 112] [1, 116, 435, 112] 224
13
+ │ │ │ │ └─Dropout: 5-5 [1, 116, 435, 112] [1, 116, 435, 112] --
14
+ │ │ └─Transformer: 3-2 [116, 435, 112] [116, 435, 112] --
15
+ │ │ │ └─ModuleList: 4-2 -- -- --
16
+ │ │ │ │ └─ParallelTransformerBlock: 5-6 [116, 435, 112] [116, 435, 112] --
17
+ │ │ │ │ │ └─LayerNorm: 6-1 [116, 435, 112] [116, 435, 112] 224
18
+ │ │ │ │ │ └─Linear: 6-2 [116, 435, 112] [116, 435, 1720] 192,640
19
+ │ │ │ │ │ └─Linear: 6-3 [116, 435, 528] [116, 435, 112] 59,136
20
+ │ │ │ │ │ └─DropPath: 6-4 [116, 435, 112] [116, 435, 112] --
21
+ │ │ │ │ │ └─Sequential: 6-5 [116, 435, 136] [116, 435, 112] --
22
+ │ │ │ │ │ │ └─GELU: 7-1 [116, 435, 136] [116, 435, 136] --
23
+ │ │ │ │ │ │ └─Dropout: 7-2 [116, 435, 136] [116, 435, 136] --
24
+ │ │ │ │ │ │ └─Linear: 7-3 [116, 435, 136] [116, 435, 112] 15,232
25
+ │ │ │ │ │ └─DropPath: 6-6 [116, 435, 112] [116, 435, 112] --
26
+ │ │ │ │ └─ParallelTransformerBlock: 5-7 [116, 435, 112] [116, 435, 112] --
27
+ │ │ │ │ │ └─LayerNorm: 6-7 [116, 435, 112] [116, 435, 112] 224
28
+ │ │ │ │ │ └─Linear: 6-8 [116, 435, 112] [116, 435, 1720] 192,640
29
+ │ │ │ │ │ └─Linear: 6-9 [116, 435, 528] [116, 435, 112] 59,136
30
+ │ │ │ │ │ └─DropPath: 6-10 [116, 435, 112] [116, 435, 112] --
31
+ │ │ │ │ │ └─Sequential: 6-11 [116, 435, 136] [116, 435, 112] --
32
+ │ │ │ │ │ │ └─GELU: 7-4 [116, 435, 136] [116, 435, 136] --
33
+ │ │ │ │ │ │ └─Dropout: 7-5 [116, 435, 136] [116, 435, 136] --
34
+ │ │ │ │ │ │ └─Linear: 7-6 [116, 435, 136] [116, 435, 112] 15,232
35
+ │ │ │ │ │ └─DropPath: 6-12 [116, 435, 112] [116, 435, 112] --
36
+ │ │ │ │ └─ParallelTransformerBlock: 5-8 [116, 435, 112] [116, 435, 112] --
37
+ │ │ │ │ │ └─LayerNorm: 6-13 [116, 435, 112] [116, 435, 112] 224
38
+ │ │ │ │ │ └─Linear: 6-14 [116, 435, 112] [116, 435, 1720] 192,640
39
+ │ │ │ │ │ └─Linear: 6-15 [116, 435, 528] [116, 435, 112] 59,136
40
+ │ │ │ │ │ └─DropPath: 6-16 [116, 435, 112] [116, 435, 112] --
41
+ │ │ │ │ │ └─Sequential: 6-17 [116, 435, 136] [116, 435, 112] --
42
+ │ │ │ │ │ │ └─GELU: 7-7 [116, 435, 136] [116, 435, 136] --
43
+ │ │ │ │ │ │ └─Dropout: 7-8 [116, 435, 136] [116, 435, 136] --
44
+ │ │ │ │ │ │ └─Linear: 7-9 [116, 435, 136] [116, 435, 112] 15,232
45
+ │ │ │ │ │ └─DropPath: 6-18 [116, 435, 112] [116, 435, 112] --
46
+ │ │ └─Transformer: 3-3 [435, 116, 112] [435, 116, 112] --
47
+ │ │ │ └─ModuleList: 4-3 -- -- --
48
+ │ │ │ │ └─ParallelTransformerBlock: 5-9 [435, 116, 112] [435, 116, 112] --
49
+ │ │ │ │ │ └─LayerNorm: 6-19 [435, 116, 112] [435, 116, 112] 224
50
+ │ │ │ │ │ └─Linear: 6-20 [435, 116, 112] [435, 116, 1720] 192,640
51
+ │ │ │ │ │ └─Linear: 6-21 [435, 116, 528] [435, 116, 112] 59,136
52
+ │ │ │ │ │ └─DropPath: 6-22 [435, 116, 112] [435, 116, 112] --
53
+ │ │ │ │ │ └─Sequential: 6-23 [435, 116, 136] [435, 116, 112] --
54
+ │ │ │ │ │ │ └─GELU: 7-10 [435, 116, 136] [435, 116, 136] --
55
+ │ │ │ │ │ │ └─Dropout: 7-11 [435, 116, 136] [435, 116, 136] --
56
+ │ │ │ │ │ │ └─Linear: 7-12 [435, 116, 136] [435, 116, 112] 15,232
57
+ │ │ │ │ │ └─DropPath: 6-24 [435, 116, 112] [435, 116, 112] --
58
+ │ │ │ │ └─ParallelTransformerBlock: 5-10 [435, 116, 112] [435, 116, 112] --
59
+ │ │ │ │ │ └─LayerNorm: 6-25 [435, 116, 112] [435, 116, 112] 224
60
+ │ │ │ │ │ └─Linear: 6-26 [435, 116, 112] [435, 116, 1720] 192,640
61
+ │ │ │ │ │ └─Linear: 6-27 [435, 116, 528] [435, 116, 112] 59,136
62
+ │ │ │ │ │ └─DropPath: 6-28 [435, 116, 112] [435, 116, 112] --
63
+ │ │ │ │ │ └─Sequential: 6-29 [435, 116, 136] [435, 116, 112] --
64
+ │ │ │ │ │ │ └─GELU: 7-13 [435, 116, 136] [435, 116, 136] --
65
+ │ │ │ │ │ │ └─Dropout: 7-14 [435, 116, 136] [435, 116, 136] --
66
+ │ │ │ │ │ │ └─Linear: 7-15 [435, 116, 136] [435, 116, 112] 15,232
67
+ │ │ │ │ │ └─DropPath: 6-30 [435, 116, 112] [435, 116, 112] --
68
+ │ │ │ │ └─ParallelTransformerBlock: 5-11 [435, 116, 112] [435, 116, 112] --
69
+ │ │ │ │ │ └─LayerNorm: 6-31 [435, 116, 112] [435, 116, 112] 224
70
+ │ │ │ │ │ └─Linear: 6-32 [435, 116, 112] [435, 116, 1720] 192,640
71
+ │ │ │ │ │ └─Linear: 6-33 [435, 116, 528] [435, 116, 112] 59,136
72
+ │ │ │ │ │ └─DropPath: 6-34 [435, 116, 112] [435, 116, 112] --
73
+ │ │ │ │ │ └─Sequential: 6-35 [435, 116, 136] [435, 116, 112] --
74
+ │ │ │ │ │ │ └─GELU: 7-16 [435, 116, 136] [435, 116, 136] --
75
+ │ │ │ │ │ │ └─Dropout: 7-17 [435, 116, 136] [435, 116, 136] --
76
+ │ │ │ │ │ │ └─Linear: 7-18 [435, 116, 136] [435, 116, 112] 15,232
77
+ │ │ │ │ │ └─DropPath: 6-36 [435, 116, 112] [435, 116, 112] --
78
+ │ │ │ │ └─ParallelTransformerBlock: 5-12 [435, 116, 112] [435, 116, 112] --
79
+ │ │ │ │ │ └─LayerNorm: 6-37 [435, 116, 112] [435, 116, 112] 224
80
+ │ │ │ │ │ └─Linear: 6-38 [435, 116, 112] [435, 116, 1720] 192,640
81
+ │ │ │ │ │ └─Linear: 6-39 [435, 116, 528] [435, 116, 112] 59,136
82
+ │ │ │ │ │ └─DropPath: 6-40 [435, 116, 112] [435, 116, 112] --
83
+ │ │ │ │ │ └─Sequential: 6-41 [435, 116, 136] [435, 116, 112] --
84
+ │ │ │ │ │ │ └─GELU: 7-19 [435, 116, 136] [435, 116, 136] --
85
+ │ │ │ │ │ │ └─Dropout: 7-20 [435, 116, 136] [435, 116, 136] --
86
+ │ │ │ │ │ │ └─Linear: 7-21 [435, 116, 136] [435, 116, 112] 15,232
87
+ │ │ │ │ │ └─DropPath: 6-42 [435, 116, 112] [435, 116, 112] --
88
+ │ │ │ │ └─ParallelTransformerBlock: 5-13 [435, 116, 112] [435, 116, 112] --
89
+ │ │ │ │ │ └─LayerNorm: 6-43 [435, 116, 112] [435, 116, 112] 224
90
+ │ │ │ │ │ └─Linear: 6-44 [435, 116, 112] [435, 116, 1720] 192,640
91
+ │ │ │ │ │ └─Linear: 6-45 [435, 116, 528] [435, 116, 112] 59,136
92
+ │ │ │ │ │ └─DropPath: 6-46 [435, 116, 112] [435, 116, 112] --
93
+ │ │ │ │ │ └─Sequential: 6-47 [435, 116, 136] [435, 116, 112] --
94
+ │ │ │ │ │ │ └─GELU: 7-22 [435, 116, 136] [435, 116, 136] --
95
+ │ │ │ │ │ │ └─Dropout: 7-23 [435, 116, 136] [435, 116, 136] --
96
+ │ │ │ │ │ │ └─Linear: 7-24 [435, 116, 136] [435, 116, 112] 15,232
97
+ │ │ │ │ │ └─DropPath: 6-48 [435, 116, 112] [435, 116, 112] --
98
+ │ │ └─Rearrange: 3-4 [1, 116, 435, 112] [1, 112, 116, 15, 29] --
99
+ ├─MLPShifters: 1-2 -- [1, 2, 116] 513
100
+ │ └─MLPShifter: 2-2 [116, 2] [116, 2] --
101
+ │ │ └─Sequential: 3-5 [116, 2] [116, 2] --
102
+ │ │ │ └─Linear: 4-4 [116, 2] [116, 5] 15
103
+ │ │ │ └─Tanh: 4-5 [116, 5] [116, 5] --
104
+ │ │ │ └─Linear: 4-6 [116, 5] [116, 5] 30
105
+ │ │ │ └─Tanh: 4-7 [116, 5] [116, 5] --
106
+ │ │ │ └─Linear: 4-8 [116, 5] [116, 2] 12
107
+ │ │ │ └─Tanh: 4-9 [116, 2] [116, 2] --
108
+ ├─Readouts: 1-3 [1, 112, 116, 15, 29] [1, 7440, 116] 8,477,649
109
+ │ └─Gaussian2DReadout2: 2-3 [1, 112, 116, 15, 29] [1, 7440, 116] 870,480
110
+ │ │ └─Sequential: 3-6 [7440, 2] [7440, 2] --
111
+ │ │ │ └─Linear: 4-10 [7440, 2] [7440, 30] 90
112
+ │ │ │ └─ELU: 4-11 [7440, 30] [7440, 30] --
113
+ │ │ │ └─Linear: 4-12 [7440, 30] [7440, 2] 62
114
+ │ │ │ └─Tanh: 4-13 [7440, 2] [7440, 2] --
115
+ │ │ └─Sequential: 3-7 [7440, 2] [7440, 2] (recursive)
116
+ │ │ │ └─Linear: 4-14 [7440, 2] [7440, 30] (recursive)
117
+ │ │ │ └─ELU: 4-15 [7440, 30] [7440, 30] --
118
+ │ │ │ └─Linear: 4-16 [7440, 30] [7440, 2] (recursive)
119
+ │ │ │ └─Tanh: 4-17 [7440, 2] [7440, 2] --
120
+ │ │ └─Sequential: 3-8 [7440, 2] [7440, 2] (recursive)
121
+ │ │ │ └─Linear: 4-18 [7440, 2] [7440, 30] (recursive)
122
+ │ │ │ └─ELU: 4-19 [7440, 30] [7440, 30] --
123
+ │ │ │ └─Linear: 4-20 [7440, 30] [7440, 2] (recursive)
124
+ │ │ │ └─Tanh: 4-21 [7440, 2] [7440, 2] --
125
+ │ │ └─Sequential: 3-9 [116, 4] [116, 112] --
126
+ │ │ │ └─Linear: 4-22 [116, 4] [116, 112] 560
127
+ │ │ │ └─LayerNorm: 4-23 [116, 112] [116, 112] 224
128
+ │ │ │ └─GELU: 4-24 [116, 112] [116, 112] --
129
+ │ │ │ └─Dropout: 4-25 [116, 112] [116, 112] --
130
+ │ │ │ └─Linear: 4-26 [116, 112] [116, 112] 12,656
131
+ │ │ │ └─Tanh: 4-27 [116, 112] [116, 112] --
132
+ ├─Exponential: 1-4 [1, 7440, 116] [1, 7440, 116] --
133
+ =======================================================================================================================================
134
+ Total params: 12,278,365
135
+ Trainable params: 12,278,365
136
+ Non-trainable params: 0
137
+ Total mult-adds (Units.MEGABYTES): 679.88
138
+ =======================================================================================================================================
139
+ Input size (MB): 1.29
140
+ Forward/backward pass size (MB): 9208.73
141
+ Params size (MB): 11.40
142
+ Estimated Total Size (MB): 9221.42
143
+ =======================================================================================================================================
003/output.log ADDED
@@ -0,0 +1,789 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Use bfloat16 for core module.
2
+ Use parallel attention and MLP in ViViT.
3
+
4
+ Epoch 001/400
5
+ Train loss: 112704208.00 correlation: 0.0126
6
+ Validation loss: 199545376.00 correlation: 0.0293
7
+ Elapse: 540.35s
8
+
9
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
10
+
11
+ Epoch 002/400
12
+ Train loss: 97414480.00 correlation: 0.0393
13
+ Validation loss: 198820640.00 correlation: 0.0410
14
+ Elapse: 549.83s
15
+
16
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
17
+
18
+ Epoch 003/400
19
+ Train loss: 95851936.00 correlation: 0.0545
20
+ Validation loss: 197542912.00 correlation: 0.0493
21
+ Elapse: 552.73s
22
+
23
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
24
+
25
+ Epoch 004/400
26
+ Train loss: 94762680.00 correlation: 0.0658
27
+ Validation loss: 195978896.00 correlation: 0.0592
28
+ Elapse: 553.22s
29
+
30
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
31
+
32
+ Epoch 005/400
33
+ Train loss: 93366904.00 correlation: 0.0807
34
+ Validation loss: 193138784.00 correlation: 0.0786
35
+ Elapse: 551.37s
36
+
37
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
38
+
39
+ Epoch 006/400
40
+ Train loss: 91530000.00 correlation: 0.0996
41
+ Validation loss: 190414640.00 correlation: 0.0957
42
+ Elapse: 548.87s
43
+
44
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
45
+
46
+ Epoch 007/400
47
+ Train loss: 90052112.00 correlation: 0.1151
48
+ Validation loss: 187958800.00 correlation: 0.1117
49
+ Elapse: 545.45s
50
+
51
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
52
+
53
+ Epoch 008/400
54
+ Train loss: 88550296.00 correlation: 0.1303
55
+ Validation loss: 185819104.00 correlation: 0.1231
56
+ Elapse: 542.13s
57
+
58
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
59
+
60
+ Epoch 009/400
61
+ Train loss: 87211088.00 correlation: 0.1444
62
+ Validation loss: 183781008.00 correlation: 0.1379
63
+ Elapse: 540.39s
64
+
65
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
66
+
67
+ Epoch 010/400
68
+ Train loss: 85912744.00 correlation: 0.1575
69
+ Validation loss: 182160864.00 correlation: 0.1483
70
+ Elapse: 539.93s
71
+
72
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
73
+
74
+ Epoch 011/400
75
+ Train loss: 84825776.00 correlation: 0.1681
76
+ Validation loss: 180796960.00 correlation: 0.1574
77
+ Elapse: 539.05s
78
+
79
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
80
+
81
+ Epoch 012/400
82
+ Train loss: 83932096.00 correlation: 0.1768
83
+ Validation loss: 179665872.00 correlation: 0.1651
84
+ Elapse: 539.83s
85
+
86
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
87
+
88
+ Epoch 013/400
89
+ Train loss: 83185960.00 correlation: 0.1841
90
+ Validation loss: 178867920.00 correlation: 0.1706
91
+ Elapse: 540.49s
92
+
93
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
94
+
95
+ Epoch 014/400
96
+ Train loss: 82619600.00 correlation: 0.1896
97
+ Validation loss: 178183616.00 correlation: 0.1749
98
+ Elapse: 540.25s
99
+
100
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
101
+
102
+ Epoch 015/400
103
+ Train loss: 82049104.00 correlation: 0.1953
104
+ Validation loss: 177195872.00 correlation: 0.1811
105
+ Elapse: 539.98s
106
+
107
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
108
+
109
+ Epoch 016/400
110
+ Train loss: 81438744.00 correlation: 0.2013
111
+ Validation loss: 176732480.00 correlation: 0.1848
112
+ Elapse: 539.92s
113
+
114
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
115
+
116
+ Epoch 017/400
117
+ Train loss: 80981184.00 correlation: 0.2058
118
+ Validation loss: 175869328.00 correlation: 0.1895
119
+ Elapse: 540.34s
120
+
121
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
122
+
123
+ Epoch 018/400
124
+ Train loss: 80463984.00 correlation: 0.2108
125
+ Validation loss: 175137504.00 correlation: 0.1941
126
+ Elapse: 540.52s
127
+
128
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
129
+
130
+ Epoch 019/400
131
+ Train loss: 80076456.00 correlation: 0.2145
132
+ Validation loss: 174743216.00 correlation: 0.1976
133
+ Elapse: 540.79s
134
+
135
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
136
+
137
+ Epoch 020/400
138
+ Train loss: 79770240.00 correlation: 0.2180
139
+ Validation loss: 174354656.00 correlation: 0.1999
140
+ Elapse: 541.02s
141
+
142
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
143
+
144
+ Epoch 021/400
145
+ Train loss: 79389680.00 correlation: 0.2210
146
+ Validation loss: 173737072.00 correlation: 0.2049
147
+ Elapse: 540.85s
148
+
149
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
150
+
151
+ Epoch 022/400
152
+ Train loss: 79099264.00 correlation: 0.2238
153
+ Validation loss: 173426080.00 correlation: 0.2057
154
+ Elapse: 542.08s
155
+
156
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
157
+
158
+ Epoch 023/400
159
+ Train loss: 78893584.00 correlation: 0.2259
160
+ Validation loss: 172965088.00 correlation: 0.2094
161
+ Elapse: 542.73s
162
+
163
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
164
+
165
+ Epoch 024/400
166
+ Train loss: 78610448.00 correlation: 0.2286
167
+ Validation loss: 172757408.00 correlation: 0.2102
168
+ Elapse: 543.17s
169
+
170
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
171
+
172
+ Epoch 025/400
173
+ Train loss: 78350984.00 correlation: 0.2311
174
+ Validation loss: 172301040.00 correlation: 0.2136
175
+ Elapse: 543.01s
176
+
177
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
178
+
179
+ Epoch 026/400
180
+ Train loss: 78082256.00 correlation: 0.2338
181
+ Validation loss: 172086432.00 correlation: 0.2145
182
+ Elapse: 543.35s
183
+
184
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
185
+
186
+ Epoch 027/400
187
+ Train loss: 77827456.00 correlation: 0.2363
188
+ Validation loss: 171786464.00 correlation: 0.2169
189
+ Elapse: 543.66s
190
+
191
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
192
+
193
+ Epoch 028/400
194
+ Train loss: 77638136.00 correlation: 0.2379
195
+ Validation loss: 171793264.00 correlation: 0.2171
196
+ Elapse: 543.62s
197
+
198
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
199
+
200
+ Epoch 029/400
201
+ Train loss: 77553520.00 correlation: 0.2390
202
+ Validation loss: 171183824.00 correlation: 0.2206
203
+ Elapse: 543.14s
204
+
205
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
206
+
207
+ Epoch 030/400
208
+ Train loss: 77293184.00 correlation: 0.2414
209
+ Validation loss: 171063472.00 correlation: 0.2218
210
+ Elapse: 542.93s
211
+
212
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
213
+
214
+ Epoch 031/400
215
+ Train loss: 77137136.00 correlation: 0.2425
216
+ Validation loss: 170927232.00 correlation: 0.2215
217
+ Elapse: 542.90s
218
+
219
+ Epoch 032/400
220
+ Train loss: 77036008.00 correlation: 0.2439
221
+ Validation loss: 170678112.00 correlation: 0.2241
222
+ Elapse: 544.22s
223
+
224
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
225
+
226
+ Epoch 033/400
227
+ Train loss: 76850512.00 correlation: 0.2458
228
+ Validation loss: 170585168.00 correlation: 0.2249
229
+ Elapse: 543.38s
230
+
231
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
232
+
233
+ Epoch 034/400
234
+ Train loss: 76745528.00 correlation: 0.2467
235
+ Validation loss: 170361008.00 correlation: 0.2261
236
+ Elapse: 543.46s
237
+
238
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
239
+
240
+ Epoch 035/400
241
+ Train loss: 76631640.00 correlation: 0.2479
242
+ Validation loss: 170159952.00 correlation: 0.2272
243
+ Elapse: 544.31s
244
+
245
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
246
+
247
+ Epoch 036/400
248
+ Train loss: 76572216.00 correlation: 0.2483
249
+ Validation loss: 170068624.00 correlation: 0.2280
250
+ Elapse: 544.03s
251
+
252
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
253
+
254
+ Epoch 037/400
255
+ Train loss: 76306000.00 correlation: 0.2511
256
+ Validation loss: 170078272.00 correlation: 0.2281
257
+ Elapse: 543.66s
258
+
259
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
260
+
261
+ Epoch 038/400
262
+ Train loss: 76521968.00 correlation: 0.2488
263
+ Validation loss: 170034304.00 correlation: 0.2284
264
+ Elapse: 543.78s
265
+
266
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
267
+
268
+ Epoch 039/400
269
+ Train loss: 76277552.00 correlation: 0.2512
270
+ Validation loss: 169955232.00 correlation: 0.2283
271
+ Elapse: 544.11s
272
+
273
+ Epoch 040/400
274
+ Train loss: 76083856.00 correlation: 0.2532
275
+ Validation loss: 169547568.00 correlation: 0.2316
276
+ Elapse: 544.27s
277
+
278
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
279
+
280
+ Epoch 041/400
281
+ Train loss: 76034800.00 correlation: 0.2536
282
+ Validation loss: 169778400.00 correlation: 0.2301
283
+ Elapse: 544.31s
284
+
285
+ Epoch 042/400
286
+ Train loss: 75948104.00 correlation: 0.2542
287
+ Validation loss: 169703472.00 correlation: 0.2304
288
+ Elapse: 543.89s
289
+
290
+ Epoch 043/400
291
+ Train loss: 75900336.00 correlation: 0.2549
292
+ Validation loss: 169460816.00 correlation: 0.2314
293
+ Elapse: 543.95s
294
+
295
+ Epoch 044/400
296
+ Train loss: 75856872.00 correlation: 0.2554
297
+ Validation loss: 169446544.00 correlation: 0.2314
298
+ Elapse: 543.85s
299
+
300
+ Epoch 045/400
301
+ Train loss: 75771024.00 correlation: 0.2563
302
+ Validation loss: 169373568.00 correlation: 0.2320
303
+ Elapse: 544.58s
304
+
305
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
306
+
307
+ Epoch 046/400
308
+ Train loss: 75747888.00 correlation: 0.2564
309
+ Validation loss: 169484960.00 correlation: 0.2316
310
+ Elapse: 544.29s
311
+
312
+ Epoch 047/400
313
+ Train loss: 75614488.00 correlation: 0.2578
314
+ Validation loss: 169374048.00 correlation: 0.2332
315
+ Elapse: 544.59s
316
+
317
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
318
+
319
+ Epoch 048/400
320
+ Train loss: 75621768.00 correlation: 0.2577
321
+ Validation loss: 169829152.00 correlation: 0.2292
322
+ Elapse: 544.60s
323
+
324
+ Epoch 049/400
325
+ Train loss: 75540576.00 correlation: 0.2584
326
+ Validation loss: 169151584.00 correlation: 0.2322
327
+ Elapse: 545.07s
328
+
329
+ Epoch 050/400
330
+ Train loss: 75552112.00 correlation: 0.2587
331
+ Validation loss: 169218528.00 correlation: 0.2327
332
+ Elapse: 544.47s
333
+
334
+ Epoch 051/400
335
+ Train loss: 75440728.00 correlation: 0.2597
336
+ Validation loss: 169177248.00 correlation: 0.2329
337
+ Elapse: 544.75s
338
+
339
+ Epoch 052/400
340
+ Train loss: 75499728.00 correlation: 0.2591
341
+ Validation loss: 169380720.00 correlation: 0.2327
342
+ Elapse: 544.77s
343
+
344
+ Loaded checkpoint from epoch 47 (correlation: 0.2332).
345
+
346
+ Reduce learning rate of core to 1.4400e-03 (num. reduce: 1).
347
+ Reduce learning rate of readouts to 1.0800e-03 (num. reduce: 1).
348
+ Reduce learning rate of shifters to 1.0800e-03 (num. reduce: 1).
349
+
350
+ Epoch 053/400
351
+ Train loss: 73633064.00 correlation: 0.2750
352
+ Validation loss: 167526240.00 correlation: 0.2446
353
+ Elapse: 545.49s
354
+
355
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
356
+
357
+ Epoch 054/400
358
+ Train loss: 72992880.00 correlation: 0.2809
359
+ Validation loss: 167505792.00 correlation: 0.2447
360
+ Elapse: 545.66s
361
+
362
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
363
+
364
+ Epoch 055/400
365
+ Train loss: 72791024.00 correlation: 0.2827
366
+ Validation loss: 167337248.00 correlation: 0.2451
367
+ Elapse: 545.82s
368
+
369
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
370
+
371
+ Epoch 056/400
372
+ Train loss: 72699672.00 correlation: 0.2837
373
+ Validation loss: 167396864.00 correlation: 0.2453
374
+ Elapse: 545.65s
375
+
376
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
377
+
378
+ Epoch 057/400
379
+ Train loss: 72666128.00 correlation: 0.2841
380
+ Validation loss: 167320224.00 correlation: 0.2457
381
+ Elapse: 546.33s
382
+
383
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
384
+
385
+ Epoch 058/400
386
+ Train loss: 72662680.00 correlation: 0.2840
387
+ Validation loss: 167358624.00 correlation: 0.2457
388
+ Elapse: 545.38s
389
+
390
+ Epoch 059/400
391
+ Train loss: 72528456.00 correlation: 0.2854
392
+ Validation loss: 167347344.00 correlation: 0.2456
393
+ Elapse: 546.44s
394
+
395
+ Epoch 060/400
396
+ Train loss: 72553424.00 correlation: 0.2854
397
+ Validation loss: 167294624.00 correlation: 0.2462
398
+ Elapse: 546.17s
399
+
400
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
401
+
402
+ Epoch 061/400
403
+ Train loss: 72496144.00 correlation: 0.2860
404
+ Validation loss: 167428896.00 correlation: 0.2444
405
+ Elapse: 545.96s
406
+
407
+ Epoch 062/400
408
+ Train loss: 72479344.00 correlation: 0.2859
409
+ Validation loss: 167235104.00 correlation: 0.2454
410
+ Elapse: 546.11s
411
+
412
+ Epoch 063/400
413
+ Train loss: 72437912.00 correlation: 0.2863
414
+ Validation loss: 167384528.00 correlation: 0.2447
415
+ Elapse: 546.05s
416
+
417
+ Epoch 064/400
418
+ Train loss: 72443952.00 correlation: 0.2864
419
+ Validation loss: 167276464.00 correlation: 0.2452
420
+ Elapse: 546.23s
421
+
422
+ Epoch 065/400
423
+ Train loss: 72421648.00 correlation: 0.2869
424
+ Validation loss: 167359664.00 correlation: 0.2448
425
+ Elapse: 546.55s
426
+
427
+ Loaded checkpoint from epoch 60 (correlation: 0.2462).
428
+
429
+ Reduce learning rate of core to 4.3200e-04 (num. reduce: 1).
430
+ Reduce learning rate of readouts to 3.2400e-04 (num. reduce: 1).
431
+ Reduce learning rate of shifters to 3.2400e-04 (num. reduce: 1).
432
+
433
+ Epoch 066/400
434
+ Train loss: 71631360.00 correlation: 0.2929
435
+ Validation loss: 166762592.00 correlation: 0.2488
436
+ Elapse: 546.04s
437
+
438
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
439
+
440
+ Epoch 067/400
441
+ Train loss: 71301752.00 correlation: 0.2963
442
+ Validation loss: 166766816.00 correlation: 0.2491
443
+ Elapse: 546.30s
444
+
445
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
446
+
447
+ Epoch 068/400
448
+ Train loss: 71239384.00 correlation: 0.2970
449
+ Validation loss: 166698608.00 correlation: 0.2493
450
+ Elapse: 546.54s
451
+
452
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
453
+
454
+ Epoch 069/400
455
+ Train loss: 71140904.00 correlation: 0.2977
456
+ Validation loss: 166688480.00 correlation: 0.2493
457
+ Elapse: 546.57s
458
+
459
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
460
+
461
+ Epoch 070/400
462
+ Train loss: 71157128.00 correlation: 0.2979
463
+ Validation loss: 166701680.00 correlation: 0.2493
464
+ Elapse: 546.93s
465
+
466
+ Epoch 071/400
467
+ Train loss: 71109936.00 correlation: 0.2983
468
+ Validation loss: 166666112.00 correlation: 0.2493
469
+ Elapse: 546.33s
470
+
471
+ Epoch 072/400
472
+ Train loss: 71014384.00 correlation: 0.2990
473
+ Validation loss: 166637680.00 correlation: 0.2493
474
+ Elapse: 546.25s
475
+
476
+ Epoch 073/400
477
+ Train loss: 71012144.00 correlation: 0.2989
478
+ Validation loss: 166633760.00 correlation: 0.2495
479
+ Elapse: 546.14s
480
+
481
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
482
+
483
+ Epoch 074/400
484
+ Train loss: 70962312.00 correlation: 0.2996
485
+ Validation loss: 166724848.00 correlation: 0.2491
486
+ Elapse: 546.66s
487
+
488
+ Epoch 075/400
489
+ Train loss: 70909096.00 correlation: 0.3002
490
+ Validation loss: 166680192.00 correlation: 0.2492
491
+ Elapse: 546.39s
492
+
493
+ Epoch 076/400
494
+ Train loss: 70859696.00 correlation: 0.3007
495
+ Validation loss: 166666160.00 correlation: 0.2493
496
+ Elapse: 546.76s
497
+
498
+ Epoch 077/400
499
+ Train loss: 70862616.00 correlation: 0.3006
500
+ Validation loss: 166644512.00 correlation: 0.2493
501
+ Elapse: 546.35s
502
+
503
+ Epoch 078/400
504
+ Train loss: 70866920.00 correlation: 0.3008
505
+ Validation loss: 166689088.00 correlation: 0.2489
506
+ Elapse: 546.43s
507
+
508
+ Loaded checkpoint from epoch 73 (correlation: 0.2495).
509
+
510
+ Reduce learning rate of core to 1.2960e-04 (num. reduce: 1).
511
+ Reduce learning rate of readouts to 9.7200e-05 (num. reduce: 1).
512
+ Reduce learning rate of shifters to 9.7200e-05 (num. reduce: 1).
513
+
514
+ Epoch 079/400
515
+ Train loss: 70659088.00 correlation: 0.3023
516
+ Validation loss: 166495968.00 correlation: 0.2504
517
+ Elapse: 546.32s
518
+
519
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
520
+
521
+ Epoch 080/400
522
+ Train loss: 70583640.00 correlation: 0.3029
523
+ Validation loss: 166499952.00 correlation: 0.2503
524
+ Elapse: 546.55s
525
+
526
+ Epoch 081/400
527
+ Train loss: 70541232.00 correlation: 0.3031
528
+ Validation loss: 166486608.00 correlation: 0.2504
529
+ Elapse: 546.44s
530
+
531
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
532
+
533
+ Epoch 082/400
534
+ Train loss: 70561208.00 correlation: 0.3030
535
+ Validation loss: 166498080.00 correlation: 0.2505
536
+ Elapse: 546.48s
537
+
538
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
539
+
540
+ Epoch 083/400
541
+ Train loss: 70504848.00 correlation: 0.3037
542
+ Validation loss: 166479744.00 correlation: 0.2504
543
+ Elapse: 545.91s
544
+
545
+ Epoch 084/400
546
+ Train loss: 70483280.00 correlation: 0.3037
547
+ Validation loss: 166527136.00 correlation: 0.2504
548
+ Elapse: 546.39s
549
+
550
+ Epoch 085/400
551
+ Train loss: 70486104.00 correlation: 0.3039
552
+ Validation loss: 166507024.00 correlation: 0.2504
553
+ Elapse: 546.66s
554
+
555
+ Epoch 086/400
556
+ Train loss: 70448464.00 correlation: 0.3042
557
+ Validation loss: 166480160.00 correlation: 0.2505
558
+ Elapse: 546.13s
559
+
560
+ Epoch 087/400
561
+ Train loss: 70433528.00 correlation: 0.3043
562
+ Validation loss: 166521664.00 correlation: 0.2504
563
+ Elapse: 546.51s
564
+
565
+ Loaded checkpoint from epoch 82 (correlation: 0.2505).
566
+
567
+ Reduce learning rate of core to 3.8880e-05 (num. reduce: 1).
568
+ Reduce learning rate of readouts to 2.9160e-05 (num. reduce: 1).
569
+ Reduce learning rate of shifters to 2.9160e-05 (num. reduce: 1).
570
+
571
+ Epoch 088/400
572
+ Train loss: 70419248.00 correlation: 0.3041
573
+ Validation loss: 166470848.00 correlation: 0.2507
574
+ Elapse: 546.72s
575
+
576
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
577
+
578
+ Epoch 089/400
579
+ Train loss: 70456936.00 correlation: 0.3039
580
+ Validation loss: 166478544.00 correlation: 0.2507
581
+ Elapse: 546.31s
582
+
583
+ Epoch 090/400
584
+ Train loss: 70377392.00 correlation: 0.3047
585
+ Validation loss: 166470880.00 correlation: 0.2508
586
+ Elapse: 546.64s
587
+
588
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
589
+
590
+ Epoch 091/400
591
+ Train loss: 70370720.00 correlation: 0.3048
592
+ Validation loss: 166471712.00 correlation: 0.2507
593
+ Elapse: 546.55s
594
+
595
+ Epoch 092/400
596
+ Train loss: 70332624.00 correlation: 0.3052
597
+ Validation loss: 166468176.00 correlation: 0.2506
598
+ Elapse: 546.51s
599
+
600
+ Epoch 093/400
601
+ Train loss: 70375248.00 correlation: 0.3046
602
+ Validation loss: 166466304.00 correlation: 0.2507
603
+ Elapse: 547.09s
604
+
605
+ Epoch 094/400
606
+ Train loss: 70312208.00 correlation: 0.3053
607
+ Validation loss: 166426080.00 correlation: 0.2509
608
+ Elapse: 546.36s
609
+
610
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
611
+
612
+ Epoch 095/400
613
+ Train loss: 70306024.00 correlation: 0.3054
614
+ Validation loss: 166448992.00 correlation: 0.2509
615
+ Elapse: 546.42s
616
+
617
+ Epoch 096/400
618
+ Train loss: 70301760.00 correlation: 0.3053
619
+ Validation loss: 166460400.00 correlation: 0.2508
620
+ Elapse: 545.99s
621
+
622
+ Epoch 097/400
623
+ Train loss: 70339392.00 correlation: 0.3050
624
+ Validation loss: 166448912.00 correlation: 0.2507
625
+ Elapse: 546.74s
626
+
627
+ Epoch 098/400
628
+ Train loss: 70365064.00 correlation: 0.3048
629
+ Validation loss: 166476400.00 correlation: 0.2506
630
+ Elapse: 546.17s
631
+
632
+ Epoch 099/400
633
+ Train loss: 70304792.00 correlation: 0.3053
634
+ Validation loss: 166451168.00 correlation: 0.2507
635
+ Elapse: 545.82s
636
+
637
+ Loaded checkpoint from epoch 94 (correlation: 0.2509).
638
+
639
+ Reduce learning rate of core to 1.1664e-05 (num. reduce: 1).
640
+ Reduce learning rate of readouts to 8.7480e-06 (num. reduce: 1).
641
+ Reduce learning rate of shifters to 8.7480e-06 (num. reduce: 1).
642
+
643
+ Epoch 100/400
644
+ Train loss: 70282520.00 correlation: 0.3055
645
+ Validation loss: 166444240.00 correlation: 0.2509
646
+ Elapse: 546.60s
647
+
648
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
649
+
650
+ Epoch 101/400
651
+ Train loss: 70321056.00 correlation: 0.3050
652
+ Validation loss: 166451424.00 correlation: 0.2509
653
+ Elapse: 546.61s
654
+
655
+ Epoch 102/400
656
+ Train loss: 70312536.00 correlation: 0.3052
657
+ Validation loss: 166450992.00 correlation: 0.2509
658
+ Elapse: 546.64s
659
+
660
+ Epoch 103/400
661
+ Train loss: 70294928.00 correlation: 0.3057
662
+ Validation loss: 166437664.00 correlation: 0.2509
663
+ Elapse: 546.47s
664
+
665
+ Epoch 104/400
666
+ Train loss: 70265648.00 correlation: 0.3058
667
+ Validation loss: 166443488.00 correlation: 0.2509
668
+ Elapse: 546.86s
669
+
670
+ Epoch 105/400
671
+ Train loss: 70228080.00 correlation: 0.3058
672
+ Validation loss: 166447312.00 correlation: 0.2508
673
+ Elapse: 546.77s
674
+
675
+ Loaded checkpoint from epoch 100 (correlation: 0.2509).
676
+
677
+ Reduce learning rate of core to 3.4992e-06 (num. reduce: 1).
678
+ Reduce learning rate of readouts to 2.6244e-06 (num. reduce: 1).
679
+ Reduce learning rate of shifters to 2.6244e-06 (num. reduce: 1).
680
+
681
+ Epoch 106/400
682
+ Train loss: 70303288.00 correlation: 0.3053
683
+ Validation loss: 166441600.00 correlation: 0.2509
684
+ Elapse: 546.61s
685
+
686
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
687
+
688
+ Epoch 107/400
689
+ Train loss: 70329360.00 correlation: 0.3052
690
+ Validation loss: 166438976.00 correlation: 0.2509
691
+ Elapse: 546.25s
692
+
693
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/012/ckpt/model_state.pt.
694
+
695
+ Epoch 108/400
696
+ Train loss: 70249752.00 correlation: 0.3063
697
+ Validation loss: 166440032.00 correlation: 0.2509
698
+ Elapse: 546.40s
699
+
700
+ Epoch 109/400
701
+ Train loss: 70245592.00 correlation: 0.3059
702
+ Validation loss: 166436832.00 correlation: 0.2509
703
+ Elapse: 546.34s
704
+
705
+ Epoch 110/400
706
+ Train loss: 70323520.00 correlation: 0.3050
707
+ Validation loss: 166439552.00 correlation: 0.2509
708
+ Elapse: 546.33s
709
+
710
+ Epoch 111/400
711
+ Train loss: 70291648.00 correlation: 0.3053
712
+ Validation loss: 166438448.00 correlation: 0.2509
713
+ Elapse: 546.45s
714
+
715
+ Epoch 112/400
716
+ Train loss: 70337264.00 correlation: 0.3050
717
+ Validation loss: 166435040.00 correlation: 0.2509
718
+ Elapse: 546.37s
719
+
720
+ Loaded checkpoint from epoch 107 (correlation: 0.2509).
721
+
722
+ Reduce learning rate of core to 1.0498e-06 (num. reduce: 1).
723
+ Reduce learning rate of readouts to 7.8732e-07 (num. reduce: 1).
724
+ Reduce learning rate of shifters to 7.8732e-07 (num. reduce: 1).
725
+
726
+ Epoch 113/400
727
+ Train loss: 70326192.00 correlation: 0.3050
728
+ Validation loss: 166438976.00 correlation: 0.2509
729
+ Elapse: 546.86s
730
+
731
+ Epoch 114/400
732
+ Train loss: 70297808.00 correlation: 0.3056
733
+ Validation loss: 166439680.00 correlation: 0.2509
734
+ Elapse: 546.99s
735
+
736
+ Epoch 115/400
737
+ Train loss: 70375312.00 correlation: 0.3045
738
+ Validation loss: 166439312.00 correlation: 0.2509
739
+ Elapse: 547.26s
740
+
741
+ Epoch 116/400
742
+ Train loss: 70331832.00 correlation: 0.3050
743
+ Validation loss: 166439392.00 correlation: 0.2509
744
+ Elapse: 546.75s
745
+
746
+ Epoch 117/400
747
+ Train loss: 70241608.00 correlation: 0.3060
748
+ Validation loss: 166441104.00 correlation: 0.2509
749
+ Elapse: 546.43s
750
+
751
+ Loaded checkpoint from epoch 107 (correlation: 0.2509).
752
+
753
+ Reduce learning rate of core to 3.1493e-07 (num. reduce: 2).
754
+ Reduce learning rate of readouts to 2.3620e-07 (num. reduce: 2).
755
+ Reduce learning rate of shifters to 2.3620e-07 (num. reduce: 2).
756
+
757
+ Epoch 118/400
758
+ Train loss: 70344976.00 correlation: 0.3049
759
+ Validation loss: 166439680.00 correlation: 0.2509
760
+ Elapse: 546.75s
761
+
762
+ Epoch 119/400
763
+ Train loss: 70278184.00 correlation: 0.3054
764
+ Validation loss: 166439840.00 correlation: 0.2509
765
+ Elapse: 547.33s
766
+
767
+ Epoch 120/400
768
+ Train loss: 70224856.00 correlation: 0.3062
769
+ Validation loss: 166439440.00 correlation: 0.2509
770
+ Elapse: 546.94s
771
+
772
+ Epoch 121/400
773
+ Train loss: 70317744.00 correlation: 0.3049
774
+ Validation loss: 166439280.00 correlation: 0.2509
775
+ Elapse: 547.22s
776
+
777
+ Epoch 122/400
778
+ Train loss: 70322624.00 correlation: 0.3052
779
+ Validation loss: 166438784.00 correlation: 0.2509
780
+ Elapse: 546.83s
781
+
782
+ Model has not improved after 2 LR reductions.
783
+
784
+ Loaded checkpoint from epoch 107 (correlation: 0.2509).
785
+
786
+
787
+ ValidationA: 0.2475 B: 0.2751 C: 0.2730 D: 0.2364 E: 0.2355 F: 0.2343 G: 0.2543 H: 0.2344 I: 0.2602 J: 0.2588 average: 0.2509
788
+
789
+ Results saved to /home/storage/runs/vivit_ensemble/012.
004/args.yaml ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_eps: 1e-08
4
+ batch_size: 6
5
+ cache_data: false
6
+ center_crop: 1.0
7
+ clear_output_dir: true
8
+ core: vivit
9
+ core_behavior_mode: 2
10
+ core_compile: false
11
+ core_drop_path: 0.0505
12
+ core_emb_dim: 112
13
+ core_ff_activation: gelu
14
+ core_ff_dropout: 0.0592
15
+ core_flash_attention: 1
16
+ core_head_dim: 48
17
+ core_lr: 0.0048
18
+ core_mha_dropout: 0.358
19
+ core_mlp_dim: 136
20
+ core_norm_qk: false
21
+ core_num_heads: 11
22
+ core_p_dropout: 0.1338
23
+ core_parallel_attention: true
24
+ core_patch_mode: 0
25
+ core_pos_encoding: 3
26
+ core_spatial_depth: 3
27
+ core_spatial_patch_size: 7
28
+ core_spatial_patch_stride: 2
29
+ core_temporal_depth: 5
30
+ core_temporal_patch_size: 25
31
+ core_temporal_patch_stride: 1
32
+ core_weight_decay: 0.1789
33
+ criterion: poisson_correlation
34
+ critic_mode: 0
35
+ crop_frame: 140
36
+ data: /home/sensorium2023
37
+ deterministic: false
38
+ device: cuda
39
+ dpi: 120
40
+ ds_mode: 3
41
+ ds_scale: 1
42
+ epochs: 400
43
+ format: svg
44
+ git_hash: 1033c29
45
+ grad_checkpointing: 0
46
+ grad_norm: null
47
+ input_shapes:
48
+ behavior: [2, 140]
49
+ pupil_center: [2, 140]
50
+ video: [1, 140, 36, 64]
51
+ limit_data: null
52
+ lr: 0.0036
53
+ max_frame: 300
54
+ micro_batch_size: 6
55
+ modulator_mode: 0
56
+ mouse_ids: [A, B, C, D, E, F, G, H, I, J]
57
+ num_workers: 2
58
+ output_dir: /home/storage/runs/004
59
+ output_mode: 1
60
+ output_shapes:
61
+ A: [7440, 140]
62
+ B: [7928, 140]
63
+ C: [8285, 140]
64
+ D: [7671, 140]
65
+ E: [7495, 140]
66
+ F: [7863, 140]
67
+ G: [7908, 140]
68
+ H: [8202, 140]
69
+ I: [7939, 140]
70
+ J: [8122, 140]
71
+ precision: "32"
72
+ pretrain_core: null
73
+ readout: gaussian2d
74
+ readout_bias_mode: 2
75
+ readout_dropout: 0.0
76
+ readout_grid_mode: 1
77
+ restore: null
78
+ save_plots: false
79
+ seed: 15
80
+ shifter_layers: 3
81
+ shifter_mode: 1
82
+ shifter_size: 5
83
+ stat_mode: 1
84
+ trainable_params: 12278365
85
+ transform_mode: 2
86
+ verbose: 1
87
+ weight_decay: 0.3939
004/ckpt/model_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8538df1cffe25f014e11f5db7e89d7b4e8167dd9545be98a14aa7f78e7bc6b42
3
+ size 148268583
004/evaluation.yaml ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ validation: {A: 0.24283820390701294, B: 0.2745824456214905, C: 0.2716088593006134,
2
+ D: 0.2359682023525238, E: 0.2350907325744629, F: 0.2335391342639923, G: 0.25313541293144226,
3
+ H: 0.23314021527767181, I: 0.25676068663597107, J: 0.2575773298740387, average: 0.24942412227392197}
004/model.txt ADDED
@@ -0,0 +1,143 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ =======================================================================================================================================
2
+ Layer (type:depth-idx) Input Shape Output Shape Param #
3
+ =======================================================================================================================================
4
+ Model -- [1, 7440, 116] --
5
+ ├─ViViTCore: 1-1 -- [1, 112, 116, 15, 29] --
6
+ │ └─ViViT: 2-1 [1, 5, 140, 36, 64] [1, 112, 116, 15, 29] --
7
+ │ │ └─Tokenizer: 3-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] 79,632
8
+ │ │ │ └─Sequential: 4-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] --
9
+ │ │ │ │ └─Unfold3d: 5-1 [1, 5, 140, 36, 64] [1, 116, 435, 6125] --
10
+ │ │ │ │ └─LayerNorm: 5-2 [1, 116, 435, 6125] [1, 116, 435, 6125] 12,250
11
+ │ │ │ │ └─Linear: 5-3 [1, 116, 435, 6125] [1, 116, 435, 112] 686,112
12
+ │ │ │ │ └─LayerNorm: 5-4 [1, 116, 435, 112] [1, 116, 435, 112] 224
13
+ │ │ │ │ └─Dropout: 5-5 [1, 116, 435, 112] [1, 116, 435, 112] --
14
+ │ │ └─Transformer: 3-2 [116, 435, 112] [116, 435, 112] --
15
+ │ │ │ └─ModuleList: 4-2 -- -- --
16
+ │ │ │ │ └─ParallelTransformerBlock: 5-6 [116, 435, 112] [116, 435, 112] --
17
+ │ │ │ │ │ └─LayerNorm: 6-1 [116, 435, 112] [116, 435, 112] 224
18
+ │ │ │ │ │ └─Linear: 6-2 [116, 435, 112] [116, 435, 1720] 192,640
19
+ │ │ │ │ │ └─Linear: 6-3 [116, 435, 528] [116, 435, 112] 59,136
20
+ │ │ │ │ │ └─DropPath: 6-4 [116, 435, 112] [116, 435, 112] --
21
+ │ │ │ │ │ └─Sequential: 6-5 [116, 435, 136] [116, 435, 112] --
22
+ │ │ │ │ │ │ └─GELU: 7-1 [116, 435, 136] [116, 435, 136] --
23
+ │ │ │ │ │ │ └─Dropout: 7-2 [116, 435, 136] [116, 435, 136] --
24
+ │ │ │ │ │ │ └─Linear: 7-3 [116, 435, 136] [116, 435, 112] 15,232
25
+ │ │ │ │ │ └─DropPath: 6-6 [116, 435, 112] [116, 435, 112] --
26
+ │ │ │ │ └─ParallelTransformerBlock: 5-7 [116, 435, 112] [116, 435, 112] --
27
+ │ │ │ │ │ └─LayerNorm: 6-7 [116, 435, 112] [116, 435, 112] 224
28
+ │ │ │ │ │ └─Linear: 6-8 [116, 435, 112] [116, 435, 1720] 192,640
29
+ │ │ │ │ │ └─Linear: 6-9 [116, 435, 528] [116, 435, 112] 59,136
30
+ │ │ │ │ │ └─DropPath: 6-10 [116, 435, 112] [116, 435, 112] --
31
+ │ │ │ │ │ └─Sequential: 6-11 [116, 435, 136] [116, 435, 112] --
32
+ │ │ │ │ │ │ └─GELU: 7-4 [116, 435, 136] [116, 435, 136] --
33
+ │ │ │ │ │ │ └─Dropout: 7-5 [116, 435, 136] [116, 435, 136] --
34
+ │ │ │ │ │ │ └─Linear: 7-6 [116, 435, 136] [116, 435, 112] 15,232
35
+ │ │ │ │ │ └─DropPath: 6-12 [116, 435, 112] [116, 435, 112] --
36
+ │ │ │ │ └─ParallelTransformerBlock: 5-8 [116, 435, 112] [116, 435, 112] --
37
+ │ │ │ │ │ └─LayerNorm: 6-13 [116, 435, 112] [116, 435, 112] 224
38
+ │ │ │ │ │ └─Linear: 6-14 [116, 435, 112] [116, 435, 1720] 192,640
39
+ │ │ │ │ │ └─Linear: 6-15 [116, 435, 528] [116, 435, 112] 59,136
40
+ │ │ │ │ │ └─DropPath: 6-16 [116, 435, 112] [116, 435, 112] --
41
+ │ │ │ │ │ └─Sequential: 6-17 [116, 435, 136] [116, 435, 112] --
42
+ │ │ │ │ │ │ └─GELU: 7-7 [116, 435, 136] [116, 435, 136] --
43
+ │ │ │ │ │ │ └─Dropout: 7-8 [116, 435, 136] [116, 435, 136] --
44
+ │ │ │ │ │ │ └─Linear: 7-9 [116, 435, 136] [116, 435, 112] 15,232
45
+ │ │ │ │ │ └─DropPath: 6-18 [116, 435, 112] [116, 435, 112] --
46
+ │ │ └─Transformer: 3-3 [435, 116, 112] [435, 116, 112] --
47
+ │ │ │ └─ModuleList: 4-3 -- -- --
48
+ │ │ │ │ └─ParallelTransformerBlock: 5-9 [435, 116, 112] [435, 116, 112] --
49
+ │ │ │ │ │ └─LayerNorm: 6-19 [435, 116, 112] [435, 116, 112] 224
50
+ │ │ │ │ │ └─Linear: 6-20 [435, 116, 112] [435, 116, 1720] 192,640
51
+ │ │ │ │ │ └─Linear: 6-21 [435, 116, 528] [435, 116, 112] 59,136
52
+ │ │ │ │ │ └─DropPath: 6-22 [435, 116, 112] [435, 116, 112] --
53
+ │ │ │ │ │ └─Sequential: 6-23 [435, 116, 136] [435, 116, 112] --
54
+ │ │ │ │ │ │ └─GELU: 7-10 [435, 116, 136] [435, 116, 136] --
55
+ │ │ │ │ │ │ └─Dropout: 7-11 [435, 116, 136] [435, 116, 136] --
56
+ │ │ │ │ │ │ └─Linear: 7-12 [435, 116, 136] [435, 116, 112] 15,232
57
+ │ │ │ │ │ └─DropPath: 6-24 [435, 116, 112] [435, 116, 112] --
58
+ │ │ │ │ └─ParallelTransformerBlock: 5-10 [435, 116, 112] [435, 116, 112] --
59
+ │ │ │ │ │ └─LayerNorm: 6-25 [435, 116, 112] [435, 116, 112] 224
60
+ │ │ │ │ │ └─Linear: 6-26 [435, 116, 112] [435, 116, 1720] 192,640
61
+ │ │ │ │ │ └─Linear: 6-27 [435, 116, 528] [435, 116, 112] 59,136
62
+ │ │ │ │ │ └─DropPath: 6-28 [435, 116, 112] [435, 116, 112] --
63
+ │ │ │ │ │ └─Sequential: 6-29 [435, 116, 136] [435, 116, 112] --
64
+ │ │ │ │ │ │ └─GELU: 7-13 [435, 116, 136] [435, 116, 136] --
65
+ │ │ │ │ │ │ └─Dropout: 7-14 [435, 116, 136] [435, 116, 136] --
66
+ │ │ │ │ │ │ └─Linear: 7-15 [435, 116, 136] [435, 116, 112] 15,232
67
+ │ │ │ │ │ └─DropPath: 6-30 [435, 116, 112] [435, 116, 112] --
68
+ │ │ │ │ └─ParallelTransformerBlock: 5-11 [435, 116, 112] [435, 116, 112] --
69
+ │ │ │ │ │ └─LayerNorm: 6-31 [435, 116, 112] [435, 116, 112] 224
70
+ │ │ │ │ │ └─Linear: 6-32 [435, 116, 112] [435, 116, 1720] 192,640
71
+ │ │ │ │ │ └─Linear: 6-33 [435, 116, 528] [435, 116, 112] 59,136
72
+ │ │ │ │ │ └─DropPath: 6-34 [435, 116, 112] [435, 116, 112] --
73
+ │ │ │ │ │ └─Sequential: 6-35 [435, 116, 136] [435, 116, 112] --
74
+ │ │ │ │ │ │ └─GELU: 7-16 [435, 116, 136] [435, 116, 136] --
75
+ │ │ │ │ │ │ └─Dropout: 7-17 [435, 116, 136] [435, 116, 136] --
76
+ │ │ │ │ │ │ └─Linear: 7-18 [435, 116, 136] [435, 116, 112] 15,232
77
+ │ │ │ │ │ └─DropPath: 6-36 [435, 116, 112] [435, 116, 112] --
78
+ │ │ │ │ └─ParallelTransformerBlock: 5-12 [435, 116, 112] [435, 116, 112] --
79
+ │ │ │ │ │ └─LayerNorm: 6-37 [435, 116, 112] [435, 116, 112] 224
80
+ │ │ │ │ │ └─Linear: 6-38 [435, 116, 112] [435, 116, 1720] 192,640
81
+ │ │ │ │ │ └─Linear: 6-39 [435, 116, 528] [435, 116, 112] 59,136
82
+ │ │ │ │ │ └─DropPath: 6-40 [435, 116, 112] [435, 116, 112] --
83
+ │ │ │ │ │ └─Sequential: 6-41 [435, 116, 136] [435, 116, 112] --
84
+ │ │ │ │ │ │ └─GELU: 7-19 [435, 116, 136] [435, 116, 136] --
85
+ │ │ │ │ │ │ └─Dropout: 7-20 [435, 116, 136] [435, 116, 136] --
86
+ │ │ │ │ │ │ └─Linear: 7-21 [435, 116, 136] [435, 116, 112] 15,232
87
+ │ │ │ │ │ └─DropPath: 6-42 [435, 116, 112] [435, 116, 112] --
88
+ │ │ │ │ └─ParallelTransformerBlock: 5-13 [435, 116, 112] [435, 116, 112] --
89
+ │ │ │ │ │ └─LayerNorm: 6-43 [435, 116, 112] [435, 116, 112] 224
90
+ │ │ │ │ │ └─Linear: 6-44 [435, 116, 112] [435, 116, 1720] 192,640
91
+ │ │ │ │ │ └─Linear: 6-45 [435, 116, 528] [435, 116, 112] 59,136
92
+ │ │ │ │ │ └─DropPath: 6-46 [435, 116, 112] [435, 116, 112] --
93
+ │ │ │ │ │ └─Sequential: 6-47 [435, 116, 136] [435, 116, 112] --
94
+ │ │ │ │ │ │ └─GELU: 7-22 [435, 116, 136] [435, 116, 136] --
95
+ │ │ │ │ │ │ └─Dropout: 7-23 [435, 116, 136] [435, 116, 136] --
96
+ │ │ │ │ │ │ └─Linear: 7-24 [435, 116, 136] [435, 116, 112] 15,232
97
+ │ │ │ │ │ └─DropPath: 6-48 [435, 116, 112] [435, 116, 112] --
98
+ │ │ └─Rearrange: 3-4 [1, 116, 435, 112] [1, 112, 116, 15, 29] --
99
+ ├─MLPShifters: 1-2 -- [1, 2, 116] 513
100
+ │ └─MLPShifter: 2-2 [116, 2] [116, 2] --
101
+ │ │ └─Sequential: 3-5 [116, 2] [116, 2] --
102
+ │ │ │ └─Linear: 4-4 [116, 2] [116, 5] 15
103
+ │ │ │ └─Tanh: 4-5 [116, 5] [116, 5] --
104
+ │ │ │ └─Linear: 4-6 [116, 5] [116, 5] 30
105
+ │ │ │ └─Tanh: 4-7 [116, 5] [116, 5] --
106
+ │ │ │ └─Linear: 4-8 [116, 5] [116, 2] 12
107
+ │ │ │ └─Tanh: 4-9 [116, 2] [116, 2] --
108
+ ├─Readouts: 1-3 [1, 112, 116, 15, 29] [1, 7440, 116] 8,477,649
109
+ │ └─Gaussian2DReadout2: 2-3 [1, 112, 116, 15, 29] [1, 7440, 116] 870,480
110
+ │ │ └─Sequential: 3-6 [7440, 2] [7440, 2] --
111
+ │ │ │ └─Linear: 4-10 [7440, 2] [7440, 30] 90
112
+ │ │ │ └─ELU: 4-11 [7440, 30] [7440, 30] --
113
+ │ │ │ └─Linear: 4-12 [7440, 30] [7440, 2] 62
114
+ │ │ │ └─Tanh: 4-13 [7440, 2] [7440, 2] --
115
+ │ │ └─Sequential: 3-7 [7440, 2] [7440, 2] (recursive)
116
+ │ │ │ └─Linear: 4-14 [7440, 2] [7440, 30] (recursive)
117
+ │ │ │ └─ELU: 4-15 [7440, 30] [7440, 30] --
118
+ �� │ │ └─Linear: 4-16 [7440, 30] [7440, 2] (recursive)
119
+ │ │ │ └─Tanh: 4-17 [7440, 2] [7440, 2] --
120
+ │ │ └─Sequential: 3-8 [7440, 2] [7440, 2] (recursive)
121
+ │ │ │ └─Linear: 4-18 [7440, 2] [7440, 30] (recursive)
122
+ │ │ │ └─ELU: 4-19 [7440, 30] [7440, 30] --
123
+ │ │ │ └─Linear: 4-20 [7440, 30] [7440, 2] (recursive)
124
+ │ │ │ └─Tanh: 4-21 [7440, 2] [7440, 2] --
125
+ │ │ └─Sequential: 3-9 [116, 4] [116, 112] --
126
+ │ │ │ └─Linear: 4-22 [116, 4] [116, 112] 560
127
+ │ │ │ └─LayerNorm: 4-23 [116, 112] [116, 112] 224
128
+ │ │ │ └─GELU: 4-24 [116, 112] [116, 112] --
129
+ │ │ │ └─Dropout: 4-25 [116, 112] [116, 112] --
130
+ │ │ │ └─Linear: 4-26 [116, 112] [116, 112] 12,656
131
+ │ │ │ └─Tanh: 4-27 [116, 112] [116, 112] --
132
+ ├─Exponential: 1-4 [1, 7440, 116] [1, 7440, 116] --
133
+ =======================================================================================================================================
134
+ Total params: 12,278,365
135
+ Trainable params: 12,278,365
136
+ Non-trainable params: 0
137
+ Total mult-adds (Units.MEGABYTES): 679.88
138
+ =======================================================================================================================================
139
+ Input size (MB): 1.29
140
+ Forward/backward pass size (MB): 9208.73
141
+ Params size (MB): 11.40
142
+ Estimated Total Size (MB): 9221.42
143
+ =======================================================================================================================================
004/output.log ADDED
@@ -0,0 +1,770 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Use bfloat16 for core module.
2
+ Use parallel attention and MLP in ViViT.
3
+
4
+ Epoch 001/400
5
+ Train loss: 108875712.00 correlation: 0.0142
6
+ Validation loss: 200009632.00 correlation: 0.0280
7
+ Elapse: 536.31s
8
+
9
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
10
+
11
+ Epoch 002/400
12
+ Train loss: 97286888.00 correlation: 0.0397
13
+ Validation loss: 199179056.00 correlation: 0.0389
14
+ Elapse: 540.45s
15
+
16
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
17
+
18
+ Epoch 003/400
19
+ Train loss: 96065840.00 correlation: 0.0525
20
+ Validation loss: 198705632.00 correlation: 0.0414
21
+ Elapse: 548.06s
22
+
23
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
24
+
25
+ Epoch 004/400
26
+ Train loss: 95196720.00 correlation: 0.0616
27
+ Validation loss: 197267888.00 correlation: 0.0520
28
+ Elapse: 550.50s
29
+
30
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
31
+
32
+ Epoch 005/400
33
+ Train loss: 94175976.00 correlation: 0.0728
34
+ Validation loss: 195531712.00 correlation: 0.0637
35
+ Elapse: 549.52s
36
+
37
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
38
+
39
+ Epoch 006/400
40
+ Train loss: 92696320.00 correlation: 0.0883
41
+ Validation loss: 193088208.00 correlation: 0.0800
42
+ Elapse: 547.83s
43
+
44
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
45
+
46
+ Epoch 007/400
47
+ Train loss: 91328912.00 correlation: 0.1027
48
+ Validation loss: 190954368.00 correlation: 0.0931
49
+ Elapse: 546.41s
50
+
51
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
52
+
53
+ Epoch 008/400
54
+ Train loss: 90154608.00 correlation: 0.1149
55
+ Validation loss: 189186224.00 correlation: 0.1027
56
+ Elapse: 544.21s
57
+
58
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
59
+
60
+ Epoch 009/400
61
+ Train loss: 88984904.00 correlation: 0.1267
62
+ Validation loss: 187096768.00 correlation: 0.1152
63
+ Elapse: 542.67s
64
+
65
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
66
+
67
+ Epoch 010/400
68
+ Train loss: 87719928.00 correlation: 0.1389
69
+ Validation loss: 185224656.00 correlation: 0.1287
70
+ Elapse: 541.24s
71
+
72
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
73
+
74
+ Epoch 011/400
75
+ Train loss: 86455896.00 correlation: 0.1522
76
+ Validation loss: 183495936.00 correlation: 0.1386
77
+ Elapse: 540.40s
78
+
79
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
80
+
81
+ Epoch 012/400
82
+ Train loss: 85286208.00 correlation: 0.1638
83
+ Validation loss: 181750576.00 correlation: 0.1502
84
+ Elapse: 539.78s
85
+
86
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
87
+
88
+ Epoch 013/400
89
+ Train loss: 84359632.00 correlation: 0.1728
90
+ Validation loss: 180806192.00 correlation: 0.1570
91
+ Elapse: 540.59s
92
+
93
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
94
+
95
+ Epoch 014/400
96
+ Train loss: 83654496.00 correlation: 0.1800
97
+ Validation loss: 179662112.00 correlation: 0.1648
98
+ Elapse: 539.99s
99
+
100
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
101
+
102
+ Epoch 015/400
103
+ Train loss: 82936160.00 correlation: 0.1870
104
+ Validation loss: 178832416.00 correlation: 0.1697
105
+ Elapse: 540.96s
106
+
107
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
108
+
109
+ Epoch 016/400
110
+ Train loss: 82256432.00 correlation: 0.1933
111
+ Validation loss: 177940560.00 correlation: 0.1755
112
+ Elapse: 541.08s
113
+
114
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
115
+
116
+ Epoch 017/400
117
+ Train loss: 81816704.00 correlation: 0.1974
118
+ Validation loss: 177331792.00 correlation: 0.1789
119
+ Elapse: 541.24s
120
+
121
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
122
+
123
+ Epoch 018/400
124
+ Train loss: 81317624.00 correlation: 0.2024
125
+ Validation loss: 176620096.00 correlation: 0.1839
126
+ Elapse: 541.38s
127
+
128
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
129
+
130
+ Epoch 019/400
131
+ Train loss: 80761904.00 correlation: 0.2073
132
+ Validation loss: 175956080.00 correlation: 0.1882
133
+ Elapse: 540.85s
134
+
135
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
136
+
137
+ Epoch 020/400
138
+ Train loss: 80425104.00 correlation: 0.2111
139
+ Validation loss: 175399376.00 correlation: 0.1923
140
+ Elapse: 541.23s
141
+
142
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
143
+
144
+ Epoch 021/400
145
+ Train loss: 80006704.00 correlation: 0.2149
146
+ Validation loss: 174810944.00 correlation: 0.1963
147
+ Elapse: 540.64s
148
+
149
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
150
+
151
+ Epoch 022/400
152
+ Train loss: 79605576.00 correlation: 0.2188
153
+ Validation loss: 174441312.00 correlation: 0.1990
154
+ Elapse: 541.29s
155
+
156
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
157
+
158
+ Epoch 023/400
159
+ Train loss: 79238384.00 correlation: 0.2225
160
+ Validation loss: 173628144.00 correlation: 0.2041
161
+ Elapse: 541.23s
162
+
163
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
164
+
165
+ Epoch 024/400
166
+ Train loss: 78942312.00 correlation: 0.2253
167
+ Validation loss: 173239408.00 correlation: 0.2069
168
+ Elapse: 541.38s
169
+
170
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
171
+
172
+ Epoch 025/400
173
+ Train loss: 78635512.00 correlation: 0.2284
174
+ Validation loss: 172979872.00 correlation: 0.2084
175
+ Elapse: 541.43s
176
+
177
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
178
+
179
+ Epoch 026/400
180
+ Train loss: 78411792.00 correlation: 0.2303
181
+ Validation loss: 172513792.00 correlation: 0.2110
182
+ Elapse: 541.42s
183
+
184
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
185
+
186
+ Epoch 027/400
187
+ Train loss: 78185872.00 correlation: 0.2329
188
+ Validation loss: 172230208.00 correlation: 0.2128
189
+ Elapse: 540.87s
190
+
191
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
192
+
193
+ Epoch 028/400
194
+ Train loss: 77904656.00 correlation: 0.2353
195
+ Validation loss: 172162992.00 correlation: 0.2139
196
+ Elapse: 541.44s
197
+
198
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
199
+
200
+ Epoch 029/400
201
+ Train loss: 77741728.00 correlation: 0.2368
202
+ Validation loss: 171699152.00 correlation: 0.2166
203
+ Elapse: 542.05s
204
+
205
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
206
+
207
+ Epoch 030/400
208
+ Train loss: 77624216.00 correlation: 0.2381
209
+ Validation loss: 171523792.00 correlation: 0.2179
210
+ Elapse: 541.70s
211
+
212
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
213
+
214
+ Epoch 031/400
215
+ Train loss: 77405640.00 correlation: 0.2398
216
+ Validation loss: 171512912.00 correlation: 0.2182
217
+ Elapse: 541.80s
218
+
219
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
220
+
221
+ Epoch 032/400
222
+ Train loss: 77315544.00 correlation: 0.2411
223
+ Validation loss: 171059296.00 correlation: 0.2209
224
+ Elapse: 541.92s
225
+
226
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
227
+
228
+ Epoch 033/400
229
+ Train loss: 77214704.00 correlation: 0.2420
230
+ Validation loss: 171228784.00 correlation: 0.2201
231
+ Elapse: 541.77s
232
+
233
+ Epoch 034/400
234
+ Train loss: 77108704.00 correlation: 0.2433
235
+ Validation loss: 170971952.00 correlation: 0.2219
236
+ Elapse: 541.81s
237
+
238
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
239
+
240
+ Epoch 035/400
241
+ Train loss: 76970384.00 correlation: 0.2445
242
+ Validation loss: 170653312.00 correlation: 0.2236
243
+ Elapse: 542.50s
244
+
245
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
246
+
247
+ Epoch 036/400
248
+ Train loss: 76829184.00 correlation: 0.2459
249
+ Validation loss: 170723072.00 correlation: 0.2228
250
+ Elapse: 542.11s
251
+
252
+ Epoch 037/400
253
+ Train loss: 76814728.00 correlation: 0.2461
254
+ Validation loss: 170317536.00 correlation: 0.2260
255
+ Elapse: 542.26s
256
+
257
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
258
+
259
+ Epoch 038/400
260
+ Train loss: 76648232.00 correlation: 0.2476
261
+ Validation loss: 170352096.00 correlation: 0.2263
262
+ Elapse: 542.30s
263
+
264
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
265
+
266
+ Epoch 039/400
267
+ Train loss: 76570480.00 correlation: 0.2485
268
+ Validation loss: 170048544.00 correlation: 0.2276
269
+ Elapse: 542.30s
270
+
271
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
272
+
273
+ Epoch 040/400
274
+ Train loss: 76481936.00 correlation: 0.2492
275
+ Validation loss: 170178064.00 correlation: 0.2271
276
+ Elapse: 542.72s
277
+
278
+ Epoch 041/400
279
+ Train loss: 76392648.00 correlation: 0.2501
280
+ Validation loss: 169916672.00 correlation: 0.2292
281
+ Elapse: 542.22s
282
+
283
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
284
+
285
+ Epoch 042/400
286
+ Train loss: 76277856.00 correlation: 0.2512
287
+ Validation loss: 169939984.00 correlation: 0.2288
288
+ Elapse: 542.30s
289
+
290
+ Epoch 043/400
291
+ Train loss: 76200912.00 correlation: 0.2518
292
+ Validation loss: 169966848.00 correlation: 0.2293
293
+ Elapse: 543.01s
294
+
295
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
296
+
297
+ Epoch 044/400
298
+ Train loss: 76180752.00 correlation: 0.2520
299
+ Validation loss: 169804672.00 correlation: 0.2301
300
+ Elapse: 541.51s
301
+
302
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
303
+
304
+ Epoch 045/400
305
+ Train loss: 76124944.00 correlation: 0.2529
306
+ Validation loss: 169699056.00 correlation: 0.2297
307
+ Elapse: 541.18s
308
+
309
+ Epoch 046/400
310
+ Train loss: 75982544.00 correlation: 0.2542
311
+ Validation loss: 169554976.00 correlation: 0.2308
312
+ Elapse: 541.59s
313
+
314
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
315
+
316
+ Epoch 047/400
317
+ Train loss: 75966320.00 correlation: 0.2542
318
+ Validation loss: 169422160.00 correlation: 0.2317
319
+ Elapse: 540.36s
320
+
321
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
322
+
323
+ Epoch 048/400
324
+ Train loss: 75923248.00 correlation: 0.2547
325
+ Validation loss: 169780352.00 correlation: 0.2287
326
+ Elapse: 540.75s
327
+
328
+ Epoch 049/400
329
+ Train loss: 75947968.00 correlation: 0.2547
330
+ Validation loss: 169837856.00 correlation: 0.2298
331
+ Elapse: 541.57s
332
+
333
+ Epoch 050/400
334
+ Train loss: 75809040.00 correlation: 0.2556
335
+ Validation loss: 169605200.00 correlation: 0.2306
336
+ Elapse: 541.98s
337
+
338
+ Epoch 051/400
339
+ Train loss: 75789808.00 correlation: 0.2558
340
+ Validation loss: 169401440.00 correlation: 0.2307
341
+ Elapse: 542.15s
342
+
343
+ Epoch 052/400
344
+ Train loss: 75764560.00 correlation: 0.2561
345
+ Validation loss: 169899840.00 correlation: 0.2291
346
+ Elapse: 541.98s
347
+
348
+ Loaded checkpoint from epoch 47 (correlation: 0.2317).
349
+
350
+ Reduce learning rate of core to 1.4400e-03 (num. reduce: 1).
351
+ Reduce learning rate of readouts to 1.0800e-03 (num. reduce: 1).
352
+ Reduce learning rate of shifters to 1.0800e-03 (num. reduce: 1).
353
+
354
+ Epoch 053/400
355
+ Train loss: 73947496.00 correlation: 0.2716
356
+ Validation loss: 167854176.00 correlation: 0.2423
357
+ Elapse: 542.40s
358
+
359
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
360
+
361
+ Epoch 054/400
362
+ Train loss: 73334280.00 correlation: 0.2771
363
+ Validation loss: 167810464.00 correlation: 0.2430
364
+ Elapse: 543.06s
365
+
366
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
367
+
368
+ Epoch 055/400
369
+ Train loss: 73178416.00 correlation: 0.2788
370
+ Validation loss: 167610272.00 correlation: 0.2431
371
+ Elapse: 543.11s
372
+
373
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
374
+
375
+ Epoch 056/400
376
+ Train loss: 73106944.00 correlation: 0.2793
377
+ Validation loss: 167676960.00 correlation: 0.2432
378
+ Elapse: 543.44s
379
+
380
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
381
+
382
+ Epoch 057/400
383
+ Train loss: 73098200.00 correlation: 0.2798
384
+ Validation loss: 167731616.00 correlation: 0.2427
385
+ Elapse: 543.05s
386
+
387
+ Epoch 058/400
388
+ Train loss: 73030688.00 correlation: 0.2803
389
+ Validation loss: 167715872.00 correlation: 0.2427
390
+ Elapse: 543.72s
391
+
392
+ Epoch 059/400
393
+ Train loss: 72944768.00 correlation: 0.2814
394
+ Validation loss: 167514192.00 correlation: 0.2440
395
+ Elapse: 543.63s
396
+
397
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
398
+
399
+ Epoch 060/400
400
+ Train loss: 72929872.00 correlation: 0.2815
401
+ Validation loss: 167771024.00 correlation: 0.2423
402
+ Elapse: 543.29s
403
+
404
+ Epoch 061/400
405
+ Train loss: 72848184.00 correlation: 0.2822
406
+ Validation loss: 167556976.00 correlation: 0.2437
407
+ Elapse: 543.81s
408
+
409
+ Epoch 062/400
410
+ Train loss: 72894440.00 correlation: 0.2819
411
+ Validation loss: 167687056.00 correlation: 0.2429
412
+ Elapse: 543.05s
413
+
414
+ Epoch 063/400
415
+ Train loss: 72843624.00 correlation: 0.2824
416
+ Validation loss: 167582688.00 correlation: 0.2431
417
+ Elapse: 544.00s
418
+
419
+ Epoch 064/400
420
+ Train loss: 72864712.00 correlation: 0.2818
421
+ Validation loss: 167485088.00 correlation: 0.2435
422
+ Elapse: 543.20s
423
+
424
+ Loaded checkpoint from epoch 59 (correlation: 0.2440).
425
+
426
+ Reduce learning rate of core to 4.3200e-04 (num. reduce: 1).
427
+ Reduce learning rate of readouts to 3.2400e-04 (num. reduce: 1).
428
+ Reduce learning rate of shifters to 3.2400e-04 (num. reduce: 1).
429
+
430
+ Epoch 065/400
431
+ Train loss: 72100880.00 correlation: 0.2884
432
+ Validation loss: 167043168.00 correlation: 0.2470
433
+ Elapse: 543.83s
434
+
435
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
436
+
437
+ Epoch 066/400
438
+ Train loss: 71817264.00 correlation: 0.2907
439
+ Validation loss: 166928480.00 correlation: 0.2480
440
+ Elapse: 543.10s
441
+
442
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
443
+
444
+ Epoch 067/400
445
+ Train loss: 71765488.00 correlation: 0.2914
446
+ Validation loss: 166935472.00 correlation: 0.2473
447
+ Elapse: 543.05s
448
+
449
+ Epoch 068/400
450
+ Train loss: 71709384.00 correlation: 0.2919
451
+ Validation loss: 166836192.00 correlation: 0.2479
452
+ Elapse: 544.05s
453
+
454
+ Epoch 069/400
455
+ Train loss: 71609624.00 correlation: 0.2931
456
+ Validation loss: 166932704.00 correlation: 0.2478
457
+ Elapse: 544.51s
458
+
459
+ Epoch 070/400
460
+ Train loss: 71532048.00 correlation: 0.2937
461
+ Validation loss: 166911168.00 correlation: 0.2475
462
+ Elapse: 543.81s
463
+
464
+ Epoch 071/400
465
+ Train loss: 71531912.00 correlation: 0.2938
466
+ Validation loss: 166931488.00 correlation: 0.2474
467
+ Elapse: 543.44s
468
+
469
+ Loaded checkpoint from epoch 66 (correlation: 0.2480).
470
+
471
+ Reduce learning rate of core to 1.2960e-04 (num. reduce: 1).
472
+ Reduce learning rate of readouts to 9.7200e-05 (num. reduce: 1).
473
+ Reduce learning rate of shifters to 9.7200e-05 (num. reduce: 1).
474
+
475
+ Epoch 072/400
476
+ Train loss: 71521936.00 correlation: 0.2938
477
+ Validation loss: 166835152.00 correlation: 0.2481
478
+ Elapse: 544.28s
479
+
480
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
481
+
482
+ Epoch 073/400
483
+ Train loss: 71422952.00 correlation: 0.2945
484
+ Validation loss: 166809568.00 correlation: 0.2486
485
+ Elapse: 542.98s
486
+
487
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
488
+
489
+ Epoch 074/400
490
+ Train loss: 71402352.00 correlation: 0.2945
491
+ Validation loss: 166765920.00 correlation: 0.2487
492
+ Elapse: 544.22s
493
+
494
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
495
+
496
+ Epoch 075/400
497
+ Train loss: 71357648.00 correlation: 0.2949
498
+ Validation loss: 166766240.00 correlation: 0.2487
499
+ Elapse: 544.05s
500
+
501
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
502
+
503
+ Epoch 076/400
504
+ Train loss: 71315664.00 correlation: 0.2955
505
+ Validation loss: 166761216.00 correlation: 0.2489
506
+ Elapse: 544.69s
507
+
508
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
509
+
510
+ Epoch 077/400
511
+ Train loss: 71363472.00 correlation: 0.2948
512
+ Validation loss: 166736352.00 correlation: 0.2489
513
+ Elapse: 544.27s
514
+
515
+ Epoch 078/400
516
+ Train loss: 71227736.00 correlation: 0.2964
517
+ Validation loss: 166733360.00 correlation: 0.2489
518
+ Elapse: 544.22s
519
+
520
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
521
+
522
+ Epoch 079/400
523
+ Train loss: 71277464.00 correlation: 0.2955
524
+ Validation loss: 166735664.00 correlation: 0.2488
525
+ Elapse: 543.94s
526
+
527
+ Epoch 080/400
528
+ Train loss: 71206488.00 correlation: 0.2965
529
+ Validation loss: 166742432.00 correlation: 0.2489
530
+ Elapse: 544.10s
531
+
532
+ Epoch 081/400
533
+ Train loss: 71163264.00 correlation: 0.2968
534
+ Validation loss: 166738592.00 correlation: 0.2489
535
+ Elapse: 544.08s
536
+
537
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
538
+
539
+ Epoch 082/400
540
+ Train loss: 71186960.00 correlation: 0.2968
541
+ Validation loss: 166722656.00 correlation: 0.2489
542
+ Elapse: 544.32s
543
+
544
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
545
+
546
+ Epoch 083/400
547
+ Train loss: 71185200.00 correlation: 0.2968
548
+ Validation loss: 166706704.00 correlation: 0.2489
549
+ Elapse: 543.20s
550
+
551
+ Epoch 084/400
552
+ Train loss: 71172336.00 correlation: 0.2970
553
+ Validation loss: 166667952.00 correlation: 0.2490
554
+ Elapse: 544.33s
555
+
556
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
557
+
558
+ Epoch 085/400
559
+ Train loss: 71094784.00 correlation: 0.2977
560
+ Validation loss: 166736224.00 correlation: 0.2490
561
+ Elapse: 544.02s
562
+
563
+ Epoch 086/400
564
+ Train loss: 71121680.00 correlation: 0.2972
565
+ Validation loss: 166702080.00 correlation: 0.2491
566
+ Elapse: 544.15s
567
+
568
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
569
+
570
+ Epoch 087/400
571
+ Train loss: 71068680.00 correlation: 0.2980
572
+ Validation loss: 166759776.00 correlation: 0.2488
573
+ Elapse: 544.35s
574
+
575
+ Epoch 088/400
576
+ Train loss: 71037376.00 correlation: 0.2982
577
+ Validation loss: 166717840.00 correlation: 0.2488
578
+ Elapse: 544.48s
579
+
580
+ Epoch 089/400
581
+ Train loss: 71044336.00 correlation: 0.2979
582
+ Validation loss: 166688608.00 correlation: 0.2491
583
+ Elapse: 543.63s
584
+
585
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
586
+
587
+ Epoch 090/400
588
+ Train loss: 71028720.00 correlation: 0.2984
589
+ Validation loss: 166697808.00 correlation: 0.2488
590
+ Elapse: 544.01s
591
+
592
+ Epoch 091/400
593
+ Train loss: 70956424.00 correlation: 0.2991
594
+ Validation loss: 166683104.00 correlation: 0.2491
595
+ Elapse: 544.36s
596
+
597
+ Epoch 092/400
598
+ Train loss: 71034488.00 correlation: 0.2982
599
+ Validation loss: 166691024.00 correlation: 0.2491
600
+ Elapse: 544.53s
601
+
602
+ Epoch 093/400
603
+ Train loss: 71008336.00 correlation: 0.2981
604
+ Validation loss: 166667472.00 correlation: 0.2493
605
+ Elapse: 544.24s
606
+
607
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
608
+
609
+ Epoch 094/400
610
+ Train loss: 70955584.00 correlation: 0.2990
611
+ Validation loss: 166707392.00 correlation: 0.2487
612
+ Elapse: 543.78s
613
+
614
+ Epoch 095/400
615
+ Train loss: 70927976.00 correlation: 0.2993
616
+ Validation loss: 166647504.00 correlation: 0.2491
617
+ Elapse: 543.94s
618
+
619
+ Epoch 096/400
620
+ Train loss: 70877440.00 correlation: 0.2996
621
+ Validation loss: 166701728.00 correlation: 0.2486
622
+ Elapse: 543.45s
623
+
624
+ Epoch 097/400
625
+ Train loss: 70917616.00 correlation: 0.2991
626
+ Validation loss: 166641920.00 correlation: 0.2492
627
+ Elapse: 544.10s
628
+
629
+ Epoch 098/400
630
+ Train loss: 70867216.00 correlation: 0.2999
631
+ Validation loss: 166664160.00 correlation: 0.2492
632
+ Elapse: 544.30s
633
+
634
+ Loaded checkpoint from epoch 93 (correlation: 0.2493).
635
+
636
+ Reduce learning rate of core to 3.8880e-05 (num. reduce: 1).
637
+ Reduce learning rate of readouts to 2.9160e-05 (num. reduce: 1).
638
+ Reduce learning rate of shifters to 2.9160e-05 (num. reduce: 1).
639
+
640
+ Epoch 099/400
641
+ Train loss: 70901904.00 correlation: 0.2993
642
+ Validation loss: 166624560.00 correlation: 0.2493
643
+ Elapse: 544.44s
644
+
645
+ Epoch 100/400
646
+ Train loss: 70815976.00 correlation: 0.3000
647
+ Validation loss: 166631168.00 correlation: 0.2494
648
+ Elapse: 544.02s
649
+
650
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
651
+
652
+ Epoch 101/400
653
+ Train loss: 70876152.00 correlation: 0.2993
654
+ Validation loss: 166642400.00 correlation: 0.2492
655
+ Elapse: 544.50s
656
+
657
+ Epoch 102/400
658
+ Train loss: 70783744.00 correlation: 0.3006
659
+ Validation loss: 166643056.00 correlation: 0.2492
660
+ Elapse: 544.34s
661
+
662
+ Epoch 103/400
663
+ Train loss: 70822832.00 correlation: 0.3002
664
+ Validation loss: 166621408.00 correlation: 0.2494
665
+ Elapse: 544.59s
666
+
667
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
668
+
669
+ Epoch 104/400
670
+ Train loss: 70795760.00 correlation: 0.3005
671
+ Validation loss: 166626384.00 correlation: 0.2494
672
+ Elapse: 544.65s
673
+
674
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/015/ckpt/model_state.pt.
675
+
676
+ Epoch 105/400
677
+ Train loss: 70758416.00 correlation: 0.3004
678
+ Validation loss: 166603600.00 correlation: 0.2494
679
+ Elapse: 544.30s
680
+
681
+ Epoch 106/400
682
+ Train loss: 70836856.00 correlation: 0.2999
683
+ Validation loss: 166631360.00 correlation: 0.2493
684
+ Elapse: 544.28s
685
+
686
+ Epoch 107/400
687
+ Train loss: 70783560.00 correlation: 0.3006
688
+ Validation loss: 166638304.00 correlation: 0.2493
689
+ Elapse: 544.44s
690
+
691
+ Epoch 108/400
692
+ Train loss: 70793304.00 correlation: 0.3004
693
+ Validation loss: 166632480.00 correlation: 0.2492
694
+ Elapse: 544.19s
695
+
696
+ Epoch 109/400
697
+ Train loss: 70730064.00 correlation: 0.3012
698
+ Validation loss: 166617632.00 correlation: 0.2493
699
+ Elapse: 543.89s
700
+
701
+ Loaded checkpoint from epoch 104 (correlation: 0.2494).
702
+
703
+ Reduce learning rate of core to 1.1664e-05 (num. reduce: 1).
704
+ Reduce learning rate of readouts to 8.7480e-06 (num. reduce: 1).
705
+ Reduce learning rate of shifters to 8.7480e-06 (num. reduce: 1).
706
+
707
+ Epoch 110/400
708
+ Train loss: 70741584.00 correlation: 0.3007
709
+ Validation loss: 166614400.00 correlation: 0.2493
710
+ Elapse: 544.26s
711
+
712
+ Epoch 111/400
713
+ Train loss: 70763320.00 correlation: 0.3005
714
+ Validation loss: 166633072.00 correlation: 0.2493
715
+ Elapse: 544.57s
716
+
717
+ Epoch 112/400
718
+ Train loss: 70721984.00 correlation: 0.3011
719
+ Validation loss: 166633552.00 correlation: 0.2493
720
+ Elapse: 544.64s
721
+
722
+ Epoch 113/400
723
+ Train loss: 70737856.00 correlation: 0.3009
724
+ Validation loss: 166608208.00 correlation: 0.2494
725
+ Elapse: 544.39s
726
+
727
+ Epoch 114/400
728
+ Train loss: 70798224.00 correlation: 0.3000
729
+ Validation loss: 166619792.00 correlation: 0.2494
730
+ Elapse: 543.95s
731
+
732
+ Loaded checkpoint from epoch 104 (correlation: 0.2494).
733
+
734
+ Reduce learning rate of core to 3.4992e-06 (num. reduce: 2).
735
+ Reduce learning rate of readouts to 2.6244e-06 (num. reduce: 2).
736
+ Reduce learning rate of shifters to 2.6244e-06 (num. reduce: 2).
737
+
738
+ Epoch 115/400
739
+ Train loss: 70736776.00 correlation: 0.3008
740
+ Validation loss: 166615600.00 correlation: 0.2494
741
+ Elapse: 544.31s
742
+
743
+ Epoch 116/400
744
+ Train loss: 70760608.00 correlation: 0.3006
745
+ Validation loss: 166622592.00 correlation: 0.2493
746
+ Elapse: 544.61s
747
+
748
+ Epoch 117/400
749
+ Train loss: 70707912.00 correlation: 0.3011
750
+ Validation loss: 166622416.00 correlation: 0.2494
751
+ Elapse: 544.73s
752
+
753
+ Epoch 118/400
754
+ Train loss: 70797264.00 correlation: 0.3002
755
+ Validation loss: 166620240.00 correlation: 0.2493
756
+ Elapse: 545.29s
757
+
758
+ Epoch 119/400
759
+ Train loss: 70782240.00 correlation: 0.3003
760
+ Validation loss: 166620000.00 correlation: 0.2493
761
+ Elapse: 544.33s
762
+
763
+ Model has not improved after 2 LR reductions.
764
+
765
+ Loaded checkpoint from epoch 104 (correlation: 0.2494).
766
+
767
+
768
+ ValidationA: 0.2428 B: 0.2746 C: 0.2716 D: 0.2360 E: 0.2351 F: 0.2335 G: 0.2531 H: 0.2331 I: 0.2568 J: 0.2576 average: 0.2494
769
+
770
+ Results saved to /home/storage/runs/vivit_ensemble/015.
005/args.yaml ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_eps: 1e-08
4
+ batch_size: 6
5
+ cache_data: false
6
+ center_crop: 1.0
7
+ clear_output_dir: true
8
+ core: vivit
9
+ core_behavior_mode: 2
10
+ core_compile: false
11
+ core_drop_path: 0.0505
12
+ core_emb_dim: 112
13
+ core_ff_activation: gelu
14
+ core_ff_dropout: 0.0592
15
+ core_flash_attention: 1
16
+ core_head_dim: 48
17
+ core_lr: 0.0048
18
+ core_mha_dropout: 0.358
19
+ core_mlp_dim: 136
20
+ core_norm_qk: false
21
+ core_num_heads: 11
22
+ core_p_dropout: 0.1338
23
+ core_parallel_attention: true
24
+ core_patch_mode: 0
25
+ core_pos_encoding: 3
26
+ core_spatial_depth: 3
27
+ core_spatial_patch_size: 7
28
+ core_spatial_patch_stride: 2
29
+ core_temporal_depth: 5
30
+ core_temporal_patch_size: 25
31
+ core_temporal_patch_stride: 1
32
+ core_weight_decay: 0.1789
33
+ criterion: poisson_correlation
34
+ critic_mode: 0
35
+ crop_frame: 140
36
+ data: /home/sensorium2023
37
+ deterministic: false
38
+ device: cuda
39
+ dpi: 120
40
+ ds_mode: 3
41
+ ds_scale: 1
42
+ epochs: 400
43
+ format: svg
44
+ git_hash: 3cd580b
45
+ grad_checkpointing: 0
46
+ grad_norm: null
47
+ input_shapes:
48
+ behavior: [2, 140]
49
+ pupil_center: [2, 140]
50
+ video: [1, 140, 36, 64]
51
+ limit_data: null
52
+ lr: 0.0036
53
+ max_frame: 300
54
+ micro_batch_size: 6
55
+ modulator_mode: 0
56
+ mouse_ids: [A, B, C, D, E, F, G, H, I, J]
57
+ num_workers: 2
58
+ output_dir: /home/storage/runs/005
59
+ output_mode: 1
60
+ output_shapes:
61
+ A: [7440, 140]
62
+ B: [7928, 140]
63
+ C: [8285, 140]
64
+ D: [7671, 140]
65
+ E: [7495, 140]
66
+ F: [7863, 140]
67
+ G: [7908, 140]
68
+ H: [8202, 140]
69
+ I: [7939, 140]
70
+ J: [8122, 140]
71
+ precision: "32"
72
+ pretrain_core: null
73
+ readout: gaussian2d
74
+ readout_bias_mode: 2
75
+ readout_dropout: 0.0
76
+ readout_grid_mode: 1
77
+ restore: null
78
+ save_plots: false
79
+ seed: 28
80
+ shifter_layers: 3
81
+ shifter_mode: 1
82
+ shifter_size: 5
83
+ stat_mode: 1
84
+ trainable_params: 12278365
85
+ transform_mode: 2
86
+ verbose: 1
87
+ weight_decay: 0.3939
005/ckpt/model_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f8586d53aa03f24b6b533d7a172c6c33aefaf02e346d810dbb171fcf6202e2b
3
+ size 148268583
005/evaluation.yaml ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ validation: {A: 0.2465260773897171, B: 0.27831149101257324, C: 0.2688469886779785,
2
+ D: 0.22918999195098877, E: 0.23662497103214264, F: 0.2340845912694931, G: 0.254902184009552,
3
+ H: 0.23301741480827332, I: 0.25673478841781616, J: 0.2570823132991791, average: 0.2495320811867714}
005/model.txt ADDED
@@ -0,0 +1,143 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ =======================================================================================================================================
2
+ Layer (type:depth-idx) Input Shape Output Shape Param #
3
+ =======================================================================================================================================
4
+ Model -- [1, 7440, 116] --
5
+ ├─ViViTCore: 1-1 -- [1, 112, 116, 15, 29] --
6
+ │ └─ViViT: 2-1 [1, 5, 140, 36, 64] [1, 112, 116, 15, 29] --
7
+ │ │ └─Tokenizer: 3-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] 79,632
8
+ │ │ │ └─Sequential: 4-1 [1, 5, 140, 36, 64] [1, 116, 435, 112] --
9
+ │ │ │ │ └─Unfold3d: 5-1 [1, 5, 140, 36, 64] [1, 116, 435, 6125] --
10
+ │ │ │ │ └─LayerNorm: 5-2 [1, 116, 435, 6125] [1, 116, 435, 6125] 12,250
11
+ │ │ │ │ └─Linear: 5-3 [1, 116, 435, 6125] [1, 116, 435, 112] 686,112
12
+ │ │ │ │ └─LayerNorm: 5-4 [1, 116, 435, 112] [1, 116, 435, 112] 224
13
+ │ │ │ │ └─Dropout: 5-5 [1, 116, 435, 112] [1, 116, 435, 112] --
14
+ │ │ └─Transformer: 3-2 [116, 435, 112] [116, 435, 112] --
15
+ │ │ │ └─ModuleList: 4-2 -- -- --
16
+ │ │ │ │ └─ParallelTransformerBlock: 5-6 [116, 435, 112] [116, 435, 112] --
17
+ │ │ │ │ │ └─LayerNorm: 6-1 [116, 435, 112] [116, 435, 112] 224
18
+ │ │ │ │ │ └─Linear: 6-2 [116, 435, 112] [116, 435, 1720] 192,640
19
+ │ │ │ │ │ └─Linear: 6-3 [116, 435, 528] [116, 435, 112] 59,136
20
+ │ │ │ │ │ └─DropPath: 6-4 [116, 435, 112] [116, 435, 112] --
21
+ │ │ │ │ │ └─Sequential: 6-5 [116, 435, 136] [116, 435, 112] --
22
+ │ │ │ │ │ │ └─GELU: 7-1 [116, 435, 136] [116, 435, 136] --
23
+ │ │ │ │ │ │ └─Dropout: 7-2 [116, 435, 136] [116, 435, 136] --
24
+ │ │ │ │ │ │ └─Linear: 7-3 [116, 435, 136] [116, 435, 112] 15,232
25
+ │ │ │ │ │ └─DropPath: 6-6 [116, 435, 112] [116, 435, 112] --
26
+ │ │ │ │ └─ParallelTransformerBlock: 5-7 [116, 435, 112] [116, 435, 112] --
27
+ │ │ │ │ │ └─LayerNorm: 6-7 [116, 435, 112] [116, 435, 112] 224
28
+ │ │ │ │ │ └─Linear: 6-8 [116, 435, 112] [116, 435, 1720] 192,640
29
+ │ │ │ │ │ └─Linear: 6-9 [116, 435, 528] [116, 435, 112] 59,136
30
+ │ │ │ │ │ └─DropPath: 6-10 [116, 435, 112] [116, 435, 112] --
31
+ │ │ │ │ │ └─Sequential: 6-11 [116, 435, 136] [116, 435, 112] --
32
+ │ │ │ │ │ │ └─GELU: 7-4 [116, 435, 136] [116, 435, 136] --
33
+ │ │ │ │ │ │ └─Dropout: 7-5 [116, 435, 136] [116, 435, 136] --
34
+ │ │ │ │ │ │ └─Linear: 7-6 [116, 435, 136] [116, 435, 112] 15,232
35
+ │ │ │ │ │ └─DropPath: 6-12 [116, 435, 112] [116, 435, 112] --
36
+ │ │ │ │ └─ParallelTransformerBlock: 5-8 [116, 435, 112] [116, 435, 112] --
37
+ │ │ │ │ │ └─LayerNorm: 6-13 [116, 435, 112] [116, 435, 112] 224
38
+ │ │ │ │ │ └─Linear: 6-14 [116, 435, 112] [116, 435, 1720] 192,640
39
+ │ │ │ │ │ └─Linear: 6-15 [116, 435, 528] [116, 435, 112] 59,136
40
+ │ │ │ │ │ └─DropPath: 6-16 [116, 435, 112] [116, 435, 112] --
41
+ │ │ │ │ │ └─Sequential: 6-17 [116, 435, 136] [116, 435, 112] --
42
+ │ │ │ │ │ │ └─GELU: 7-7 [116, 435, 136] [116, 435, 136] --
43
+ │ │ │ │ │ │ └─Dropout: 7-8 [116, 435, 136] [116, 435, 136] --
44
+ │ │ │ │ │ │ └─Linear: 7-9 [116, 435, 136] [116, 435, 112] 15,232
45
+ │ │ │ │ │ └─DropPath: 6-18 [116, 435, 112] [116, 435, 112] --
46
+ │ │ └─Transformer: 3-3 [435, 116, 112] [435, 116, 112] --
47
+ │ │ │ └─ModuleList: 4-3 -- -- --
48
+ │ │ │ │ └─ParallelTransformerBlock: 5-9 [435, 116, 112] [435, 116, 112] --
49
+ │ │ │ │ │ └─LayerNorm: 6-19 [435, 116, 112] [435, 116, 112] 224
50
+ │ │ │ │ │ └─Linear: 6-20 [435, 116, 112] [435, 116, 1720] 192,640
51
+ │ │ │ │ │ └─Linear: 6-21 [435, 116, 528] [435, 116, 112] 59,136
52
+ │ │ │ │ │ └─DropPath: 6-22 [435, 116, 112] [435, 116, 112] --
53
+ │ │ │ │ │ └─Sequential: 6-23 [435, 116, 136] [435, 116, 112] --
54
+ │ │ │ │ │ │ └─GELU: 7-10 [435, 116, 136] [435, 116, 136] --
55
+ │ │ │ │ │ │ └─Dropout: 7-11 [435, 116, 136] [435, 116, 136] --
56
+ │ │ │ │ │ │ └─Linear: 7-12 [435, 116, 136] [435, 116, 112] 15,232
57
+ │ │ │ │ │ └─DropPath: 6-24 [435, 116, 112] [435, 116, 112] --
58
+ │ │ │ │ └─ParallelTransformerBlock: 5-10 [435, 116, 112] [435, 116, 112] --
59
+ │ │ │ │ │ └─LayerNorm: 6-25 [435, 116, 112] [435, 116, 112] 224
60
+ │ │ │ │ │ └─Linear: 6-26 [435, 116, 112] [435, 116, 1720] 192,640
61
+ │ │ │ │ │ └─Linear: 6-27 [435, 116, 528] [435, 116, 112] 59,136
62
+ │ │ │ │ │ └─DropPath: 6-28 [435, 116, 112] [435, 116, 112] --
63
+ │ │ │ │ │ └─Sequential: 6-29 [435, 116, 136] [435, 116, 112] --
64
+ │ │ │ │ │ │ └─GELU: 7-13 [435, 116, 136] [435, 116, 136] --
65
+ │ │ │ │ │ │ └─Dropout: 7-14 [435, 116, 136] [435, 116, 136] --
66
+ │ │ │ │ │ │ └─Linear: 7-15 [435, 116, 136] [435, 116, 112] 15,232
67
+ │ │ │ │ │ └─DropPath: 6-30 [435, 116, 112] [435, 116, 112] --
68
+ │ │ │ │ └─ParallelTransformerBlock: 5-11 [435, 116, 112] [435, 116, 112] --
69
+ │ │ │ │ │ └─LayerNorm: 6-31 [435, 116, 112] [435, 116, 112] 224
70
+ │ │ │ │ │ └─Linear: 6-32 [435, 116, 112] [435, 116, 1720] 192,640
71
+ │ │ │ │ │ └─Linear: 6-33 [435, 116, 528] [435, 116, 112] 59,136
72
+ │ │ │ │ │ └─DropPath: 6-34 [435, 116, 112] [435, 116, 112] --
73
+ │ │ │ │ │ └─Sequential: 6-35 [435, 116, 136] [435, 116, 112] --
74
+ │ │ │ │ │ │ └─GELU: 7-16 [435, 116, 136] [435, 116, 136] --
75
+ │ │ │ │ │ │ └─Dropout: 7-17 [435, 116, 136] [435, 116, 136] --
76
+ │ │ │ │ │ │ └─Linear: 7-18 [435, 116, 136] [435, 116, 112] 15,232
77
+ │ │ │ │ │ └─DropPath: 6-36 [435, 116, 112] [435, 116, 112] --
78
+ │ │ │ │ └─ParallelTransformerBlock: 5-12 [435, 116, 112] [435, 116, 112] --
79
+ │ │ │ │ │ └─LayerNorm: 6-37 [435, 116, 112] [435, 116, 112] 224
80
+ │ │ │ │ │ └─Linear: 6-38 [435, 116, 112] [435, 116, 1720] 192,640
81
+ │ │ │ │ │ └─Linear: 6-39 [435, 116, 528] [435, 116, 112] 59,136
82
+ │ │ │ │ │ └─DropPath: 6-40 [435, 116, 112] [435, 116, 112] --
83
+ │ │ │ │ │ └─Sequential: 6-41 [435, 116, 136] [435, 116, 112] --
84
+ │ │ │ │ │ │ └─GELU: 7-19 [435, 116, 136] [435, 116, 136] --
85
+ │ │ │ │ │ │ └─Dropout: 7-20 [435, 116, 136] [435, 116, 136] --
86
+ │ │ │ │ │ │ └─Linear: 7-21 [435, 116, 136] [435, 116, 112] 15,232
87
+ │ │ │ │ │ └─DropPath: 6-42 [435, 116, 112] [435, 116, 112] --
88
+ │ │ │ │ └─ParallelTransformerBlock: 5-13 [435, 116, 112] [435, 116, 112] --
89
+ │ │ │ │ │ └─LayerNorm: 6-43 [435, 116, 112] [435, 116, 112] 224
90
+ │ │ │ │ │ └─Linear: 6-44 [435, 116, 112] [435, 116, 1720] 192,640
91
+ │ │ │ │ │ └─Linear: 6-45 [435, 116, 528] [435, 116, 112] 59,136
92
+ │ │ │ │ │ └─DropPath: 6-46 [435, 116, 112] [435, 116, 112] --
93
+ │ │ │ │ │ └─Sequential: 6-47 [435, 116, 136] [435, 116, 112] --
94
+ │ │ │ │ │ │ └─GELU: 7-22 [435, 116, 136] [435, 116, 136] --
95
+ │ │ │ │ │ │ └─Dropout: 7-23 [435, 116, 136] [435, 116, 136] --
96
+ │ │ │ │ │ │ └─Linear: 7-24 [435, 116, 136] [435, 116, 112] 15,232
97
+ │ │ │ │ │ └─DropPath: 6-48 [435, 116, 112] [435, 116, 112] --
98
+ │ │ └─Rearrange: 3-4 [1, 116, 435, 112] [1, 112, 116, 15, 29] --
99
+ ├─MLPShifters: 1-2 -- [1, 2, 116] 513
100
+ │ └─MLPShifter: 2-2 [116, 2] [116, 2] --
101
+ │ │ └─Sequential: 3-5 [116, 2] [116, 2] --
102
+ │ │ │ └─Linear: 4-4 [116, 2] [116, 5] 15
103
+ │ │ │ └─Tanh: 4-5 [116, 5] [116, 5] --
104
+ │ │ │ └─Linear: 4-6 [116, 5] [116, 5] 30
105
+ │ │ │ └─Tanh: 4-7 [116, 5] [116, 5] --
106
+ │ │ │ └─Linear: 4-8 [116, 5] [116, 2] 12
107
+ │ │ │ └─Tanh: 4-9 [116, 2] [116, 2] --
108
+ ├─Readouts: 1-3 [1, 112, 116, 15, 29] [1, 7440, 116] 8,477,649
109
+ │ └─Gaussian2DReadout2: 2-3 [1, 112, 116, 15, 29] [1, 7440, 116] 870,480
110
+ │ │ └─Sequential: 3-6 [7440, 2] [7440, 2] --
111
+ │ │ │ └─Linear: 4-10 [7440, 2] [7440, 30] 90
112
+ │ │ │ └─ELU: 4-11 [7440, 30] [7440, 30] --
113
+ │ │ │ └─Linear: 4-12 [7440, 30] [7440, 2] 62
114
+ │ │ │ └─Tanh: 4-13 [7440, 2] [7440, 2] --
115
+ │ │ └─Sequential: 3-7 [7440, 2] [7440, 2] (recursive)
116
+ │ │ │ └─Linear: 4-14 [7440, 2] [7440, 30] (recursive)
117
+ │ │ │ └─ELU: 4-15 [7440, 30] [7440, 30] --
118
+ │ │ │ └─Linear: 4-16 [7440, 30] [7440, 2] (recursive)
119
+ │ │ │ └─Tanh: 4-17 [7440, 2] [7440, 2] --
120
+ │ │ └─Sequential: 3-8 [7440, 2] [7440, 2] (recursive)
121
+ │ │ │ └─Linear: 4-18 [7440, 2] [7440, 30] (recursive)
122
+ │ │ │ └─ELU: 4-19 [7440, 30] [7440, 30] --
123
+ │ │ │ └─Linear: 4-20 [7440, 30] [7440, 2] (recursive)
124
+ │ │ │ └─Tanh: 4-21 [7440, 2] [7440, 2] --
125
+ │ │ └─Sequential: 3-9 [116, 4] [116, 112] --
126
+ │ │ │ └─Linear: 4-22 [116, 4] [116, 112] 560
127
+ │ │ │ └─LayerNorm: 4-23 [116, 112] [116, 112] 224
128
+ │ │ │ └─GELU: 4-24 [116, 112] [116, 112] --
129
+ │ │ │ └─Dropout: 4-25 [116, 112] [116, 112] --
130
+ │ │ │ └─Linear: 4-26 [116, 112] [116, 112] 12,656
131
+ │ │ │ └─Tanh: 4-27 [116, 112] [116, 112] --
132
+ ├─Exponential: 1-4 [1, 7440, 116] [1, 7440, 116] --
133
+ =======================================================================================================================================
134
+ Total params: 12,278,365
135
+ Trainable params: 12,278,365
136
+ Non-trainable params: 0
137
+ Total mult-adds (Units.MEGABYTES): 679.88
138
+ =======================================================================================================================================
139
+ Input size (MB): 1.29
140
+ Forward/backward pass size (MB): 9208.73
141
+ Params size (MB): 11.40
142
+ Estimated Total Size (MB): 9221.42
143
+ =======================================================================================================================================
005/output.log ADDED
@@ -0,0 +1,822 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Use bfloat16 for core module.
2
+ Use parallel attention and MLP in ViViT.
3
+
4
+ Epoch 001/400
5
+ Train loss: 111647336.00 correlation: 0.0122
6
+ Validation loss: 200300080.00 correlation: 0.0267
7
+ Elapse: 537.13s
8
+
9
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
10
+
11
+ Epoch 002/400
12
+ Train loss: 97648256.00 correlation: 0.0367
13
+ Validation loss: 199289632.00 correlation: 0.0355
14
+ Elapse: 539.72s
15
+
16
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
17
+
18
+ Epoch 003/400
19
+ Train loss: 96321792.00 correlation: 0.0500
20
+ Validation loss: 198299696.00 correlation: 0.0446
21
+ Elapse: 548.37s
22
+
23
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
24
+
25
+ Epoch 004/400
26
+ Train loss: 95213544.00 correlation: 0.0617
27
+ Validation loss: 196983504.00 correlation: 0.0527
28
+ Elapse: 552.04s
29
+
30
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
31
+
32
+ Epoch 005/400
33
+ Train loss: 93915056.00 correlation: 0.0756
34
+ Validation loss: 195022704.00 correlation: 0.0660
35
+ Elapse: 551.29s
36
+
37
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
38
+
39
+ Epoch 006/400
40
+ Train loss: 92500376.00 correlation: 0.0909
41
+ Validation loss: 193045536.00 correlation: 0.0815
42
+ Elapse: 549.45s
43
+
44
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
45
+
46
+ Epoch 007/400
47
+ Train loss: 91511136.00 correlation: 0.1012
48
+ Validation loss: 191545056.00 correlation: 0.0905
49
+ Elapse: 547.11s
50
+
51
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
52
+
53
+ Epoch 008/400
54
+ Train loss: 90428944.00 correlation: 0.1113
55
+ Validation loss: 189976016.00 correlation: 0.0998
56
+ Elapse: 544.76s
57
+
58
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
59
+
60
+ Epoch 009/400
61
+ Train loss: 89301664.00 correlation: 0.1228
62
+ Validation loss: 188514336.00 correlation: 0.1074
63
+ Elapse: 541.79s
64
+
65
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
66
+
67
+ Epoch 010/400
68
+ Train loss: 88238616.00 correlation: 0.1335
69
+ Validation loss: 186730592.00 correlation: 0.1194
70
+ Elapse: 540.44s
71
+
72
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
73
+
74
+ Epoch 011/400
75
+ Train loss: 87239336.00 correlation: 0.1436
76
+ Validation loss: 185287104.00 correlation: 0.1296
77
+ Elapse: 539.71s
78
+
79
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
80
+
81
+ Epoch 012/400
82
+ Train loss: 86205256.00 correlation: 0.1540
83
+ Validation loss: 183237792.00 correlation: 0.1419
84
+ Elapse: 540.02s
85
+
86
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
87
+
88
+ Epoch 013/400
89
+ Train loss: 85068472.00 correlation: 0.1655
90
+ Validation loss: 181721296.00 correlation: 0.1515
91
+ Elapse: 539.81s
92
+
93
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
94
+
95
+ Epoch 014/400
96
+ Train loss: 84160560.00 correlation: 0.1745
97
+ Validation loss: 180469664.00 correlation: 0.1595
98
+ Elapse: 540.34s
99
+
100
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
101
+
102
+ Epoch 015/400
103
+ Train loss: 83386128.00 correlation: 0.1821
104
+ Validation loss: 179517792.00 correlation: 0.1658
105
+ Elapse: 540.81s
106
+
107
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
108
+
109
+ Epoch 016/400
110
+ Train loss: 82805200.00 correlation: 0.1877
111
+ Validation loss: 178801584.00 correlation: 0.1698
112
+ Elapse: 540.70s
113
+
114
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
115
+
116
+ Epoch 017/400
117
+ Train loss: 82275736.00 correlation: 0.1926
118
+ Validation loss: 177842080.00 correlation: 0.1761
119
+ Elapse: 540.76s
120
+
121
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
122
+
123
+ Epoch 018/400
124
+ Train loss: 81662840.00 correlation: 0.1987
125
+ Validation loss: 176971248.00 correlation: 0.1820
126
+ Elapse: 541.07s
127
+
128
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
129
+
130
+ Epoch 019/400
131
+ Train loss: 81147088.00 correlation: 0.2038
132
+ Validation loss: 176423600.00 correlation: 0.1858
133
+ Elapse: 541.20s
134
+
135
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
136
+
137
+ Epoch 020/400
138
+ Train loss: 80748784.00 correlation: 0.2079
139
+ Validation loss: 175690976.00 correlation: 0.1908
140
+ Elapse: 541.22s
141
+
142
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
143
+
144
+ Epoch 021/400
145
+ Train loss: 80313880.00 correlation: 0.2122
146
+ Validation loss: 175389216.00 correlation: 0.1929
147
+ Elapse: 540.65s
148
+
149
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
150
+
151
+ Epoch 022/400
152
+ Train loss: 79957744.00 correlation: 0.2153
153
+ Validation loss: 174862864.00 correlation: 0.1968
154
+ Elapse: 540.96s
155
+
156
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
157
+
158
+ Epoch 023/400
159
+ Train loss: 79621360.00 correlation: 0.2186
160
+ Validation loss: 174437632.00 correlation: 0.1996
161
+ Elapse: 541.11s
162
+
163
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
164
+
165
+ Epoch 024/400
166
+ Train loss: 79374368.00 correlation: 0.2211
167
+ Validation loss: 173783968.00 correlation: 0.2031
168
+ Elapse: 542.03s
169
+
170
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
171
+
172
+ Epoch 025/400
173
+ Train loss: 79085072.00 correlation: 0.2240
174
+ Validation loss: 173357520.00 correlation: 0.2059
175
+ Elapse: 541.66s
176
+
177
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
178
+
179
+ Epoch 026/400
180
+ Train loss: 78723728.00 correlation: 0.2273
181
+ Validation loss: 173125120.00 correlation: 0.2087
182
+ Elapse: 542.13s
183
+
184
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
185
+
186
+ Epoch 027/400
187
+ Train loss: 78456624.00 correlation: 0.2299
188
+ Validation loss: 172740432.00 correlation: 0.2102
189
+ Elapse: 541.72s
190
+
191
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
192
+
193
+ Epoch 028/400
194
+ Train loss: 78264240.00 correlation: 0.2316
195
+ Validation loss: 172426416.00 correlation: 0.2125
196
+ Elapse: 541.90s
197
+
198
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
199
+
200
+ Epoch 029/400
201
+ Train loss: 78095968.00 correlation: 0.2335
202
+ Validation loss: 172338688.00 correlation: 0.2139
203
+ Elapse: 542.04s
204
+
205
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
206
+
207
+ Epoch 030/400
208
+ Train loss: 77880056.00 correlation: 0.2357
209
+ Validation loss: 171972944.00 correlation: 0.2151
210
+ Elapse: 541.96s
211
+
212
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
213
+
214
+ Epoch 031/400
215
+ Train loss: 77782920.00 correlation: 0.2367
216
+ Validation loss: 171662176.00 correlation: 0.2171
217
+ Elapse: 542.59s
218
+
219
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
220
+
221
+ Epoch 032/400
222
+ Train loss: 77596272.00 correlation: 0.2382
223
+ Validation loss: 171484624.00 correlation: 0.2187
224
+ Elapse: 543.51s
225
+
226
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
227
+
228
+ Epoch 033/400
229
+ Train loss: 77378984.00 correlation: 0.2403
230
+ Validation loss: 171180896.00 correlation: 0.2208
231
+ Elapse: 542.09s
232
+
233
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
234
+
235
+ Epoch 034/400
236
+ Train loss: 77329272.00 correlation: 0.2411
237
+ Validation loss: 171382000.00 correlation: 0.2191
238
+ Elapse: 541.49s
239
+
240
+ Epoch 035/400
241
+ Train loss: 77173400.00 correlation: 0.2426
242
+ Validation loss: 170990288.00 correlation: 0.2215
243
+ Elapse: 542.22s
244
+
245
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
246
+
247
+ Epoch 036/400
248
+ Train loss: 77103352.00 correlation: 0.2430
249
+ Validation loss: 171064224.00 correlation: 0.2212
250
+ Elapse: 542.85s
251
+
252
+ Epoch 037/400
253
+ Train loss: 76961264.00 correlation: 0.2447
254
+ Validation loss: 170693952.00 correlation: 0.2239
255
+ Elapse: 542.80s
256
+
257
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
258
+
259
+ Epoch 038/400
260
+ Train loss: 76838424.00 correlation: 0.2456
261
+ Validation loss: 170481408.00 correlation: 0.2246
262
+ Elapse: 542.40s
263
+
264
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
265
+
266
+ Epoch 039/400
267
+ Train loss: 76726736.00 correlation: 0.2469
268
+ Validation loss: 170405888.00 correlation: 0.2257
269
+ Elapse: 541.86s
270
+
271
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
272
+
273
+ Epoch 040/400
274
+ Train loss: 76625736.00 correlation: 0.2481
275
+ Validation loss: 170183216.00 correlation: 0.2271
276
+ Elapse: 542.67s
277
+
278
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
279
+
280
+ Epoch 041/400
281
+ Train loss: 76633712.00 correlation: 0.2477
282
+ Validation loss: 170194400.00 correlation: 0.2270
283
+ Elapse: 542.30s
284
+
285
+ Epoch 042/400
286
+ Train loss: 76442136.00 correlation: 0.2493
287
+ Validation loss: 170452384.00 correlation: 0.2263
288
+ Elapse: 542.26s
289
+
290
+ Epoch 043/400
291
+ Train loss: 76492200.00 correlation: 0.2491
292
+ Validation loss: 170249952.00 correlation: 0.2260
293
+ Elapse: 542.10s
294
+
295
+ Epoch 044/400
296
+ Train loss: 76279480.00 correlation: 0.2510
297
+ Validation loss: 169784496.00 correlation: 0.2295
298
+ Elapse: 541.77s
299
+
300
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
301
+
302
+ Epoch 045/400
303
+ Train loss: 76193080.00 correlation: 0.2520
304
+ Validation loss: 169944928.00 correlation: 0.2278
305
+ Elapse: 542.23s
306
+
307
+ Epoch 046/400
308
+ Train loss: 76107936.00 correlation: 0.2526
309
+ Validation loss: 169860016.00 correlation: 0.2283
310
+ Elapse: 542.90s
311
+
312
+ Epoch 047/400
313
+ Train loss: 76111024.00 correlation: 0.2527
314
+ Validation loss: 169548304.00 correlation: 0.2308
315
+ Elapse: 541.89s
316
+
317
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
318
+
319
+ Epoch 048/400
320
+ Train loss: 76049672.00 correlation: 0.2534
321
+ Validation loss: 169801264.00 correlation: 0.2296
322
+ Elapse: 543.95s
323
+
324
+ Epoch 049/400
325
+ Train loss: 75997232.00 correlation: 0.2537
326
+ Validation loss: 169721248.00 correlation: 0.2301
327
+ Elapse: 543.00s
328
+
329
+ Epoch 050/400
330
+ Train loss: 75961488.00 correlation: 0.2545
331
+ Validation loss: 169722912.00 correlation: 0.2293
332
+ Elapse: 542.91s
333
+
334
+ Epoch 051/400
335
+ Train loss: 75908376.00 correlation: 0.2548
336
+ Validation loss: 169474704.00 correlation: 0.2310
337
+ Elapse: 542.56s
338
+
339
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
340
+
341
+ Epoch 052/400
342
+ Train loss: 75771856.00 correlation: 0.2561
343
+ Validation loss: 170132720.00 correlation: 0.2272
344
+ Elapse: 542.05s
345
+
346
+ Epoch 053/400
347
+ Train loss: 75913696.00 correlation: 0.2547
348
+ Validation loss: 169491888.00 correlation: 0.2309
349
+ Elapse: 542.57s
350
+
351
+ Epoch 054/400
352
+ Train loss: 75764272.00 correlation: 0.2560
353
+ Validation loss: 169266704.00 correlation: 0.2330
354
+ Elapse: 542.91s
355
+
356
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
357
+
358
+ Epoch 055/400
359
+ Train loss: 75670816.00 correlation: 0.2569
360
+ Validation loss: 169200320.00 correlation: 0.2327
361
+ Elapse: 542.21s
362
+
363
+ Epoch 056/400
364
+ Train loss: 75680240.00 correlation: 0.2570
365
+ Validation loss: 169253344.00 correlation: 0.2322
366
+ Elapse: 542.73s
367
+
368
+ Epoch 057/400
369
+ Train loss: 75623792.00 correlation: 0.2573
370
+ Validation loss: 169158704.00 correlation: 0.2336
371
+ Elapse: 544.29s
372
+
373
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
374
+
375
+ Epoch 058/400
376
+ Train loss: 75518968.00 correlation: 0.2584
377
+ Validation loss: 169124832.00 correlation: 0.2339
378
+ Elapse: 542.64s
379
+
380
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
381
+
382
+ Epoch 059/400
383
+ Train loss: 75452928.00 correlation: 0.2591
384
+ Validation loss: 169483008.00 correlation: 0.2320
385
+ Elapse: 542.34s
386
+
387
+ Epoch 060/400
388
+ Train loss: 75478992.00 correlation: 0.2590
389
+ Validation loss: 169223728.00 correlation: 0.2337
390
+ Elapse: 543.01s
391
+
392
+ Epoch 061/400
393
+ Train loss: 75414704.00 correlation: 0.2597
394
+ Validation loss: 169588672.00 correlation: 0.2307
395
+ Elapse: 542.79s
396
+
397
+ Epoch 062/400
398
+ Train loss: 75631880.00 correlation: 0.2578
399
+ Validation loss: 169325440.00 correlation: 0.2326
400
+ Elapse: 543.75s
401
+
402
+ Epoch 063/400
403
+ Train loss: 75359640.00 correlation: 0.2602
404
+ Validation loss: 169091040.00 correlation: 0.2339
405
+ Elapse: 543.16s
406
+
407
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
408
+
409
+ Epoch 064/400
410
+ Train loss: 75319080.00 correlation: 0.2605
411
+ Validation loss: 169416560.00 correlation: 0.2321
412
+ Elapse: 543.52s
413
+
414
+ Epoch 065/400
415
+ Train loss: 75306104.00 correlation: 0.2609
416
+ Validation loss: 169176224.00 correlation: 0.2331
417
+ Elapse: 542.80s
418
+
419
+ Epoch 066/400
420
+ Train loss: 75301592.00 correlation: 0.2609
421
+ Validation loss: 169371616.00 correlation: 0.2327
422
+ Elapse: 543.10s
423
+
424
+ Epoch 067/400
425
+ Train loss: 75389672.00 correlation: 0.2601
426
+ Validation loss: 169169312.00 correlation: 0.2332
427
+ Elapse: 544.11s
428
+
429
+ Epoch 068/400
430
+ Train loss: 75361008.00 correlation: 0.2604
431
+ Validation loss: 169366960.00 correlation: 0.2315
432
+ Elapse: 543.42s
433
+
434
+ Loaded checkpoint from epoch 63 (correlation: 0.2339).
435
+
436
+ Reduce learning rate of core to 1.4400e-03 (num. reduce: 1).
437
+ Reduce learning rate of readouts to 1.0800e-03 (num. reduce: 1).
438
+ Reduce learning rate of shifters to 1.0800e-03 (num. reduce: 1).
439
+
440
+ Epoch 069/400
441
+ Train loss: 73278464.00 correlation: 0.2784
442
+ Validation loss: 167482848.00 correlation: 0.2447
443
+ Elapse: 544.59s
444
+
445
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
446
+
447
+ Epoch 070/400
448
+ Train loss: 72562424.00 correlation: 0.2849
449
+ Validation loss: 167277872.00 correlation: 0.2456
450
+ Elapse: 544.90s
451
+
452
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
453
+
454
+ Epoch 071/400
455
+ Train loss: 72429480.00 correlation: 0.2862
456
+ Validation loss: 167337568.00 correlation: 0.2452
457
+ Elapse: 544.84s
458
+
459
+ Epoch 072/400
460
+ Train loss: 72339856.00 correlation: 0.2872
461
+ Validation loss: 167472656.00 correlation: 0.2442
462
+ Elapse: 544.89s
463
+
464
+ Epoch 073/400
465
+ Train loss: 72270912.00 correlation: 0.2877
466
+ Validation loss: 167356592.00 correlation: 0.2443
467
+ Elapse: 545.34s
468
+
469
+ Epoch 074/400
470
+ Train loss: 72207960.00 correlation: 0.2884
471
+ Validation loss: 167467040.00 correlation: 0.2434
472
+ Elapse: 545.38s
473
+
474
+ Epoch 075/400
475
+ Train loss: 72186752.00 correlation: 0.2885
476
+ Validation loss: 167473600.00 correlation: 0.2434
477
+ Elapse: 545.13s
478
+
479
+ Loaded checkpoint from epoch 70 (correlation: 0.2456).
480
+
481
+ Reduce learning rate of core to 4.3200e-04 (num. reduce: 1).
482
+ Reduce learning rate of readouts to 3.2400e-04 (num. reduce: 1).
483
+ Reduce learning rate of shifters to 3.2400e-04 (num. reduce: 1).
484
+
485
+ Epoch 076/400
486
+ Train loss: 71743648.00 correlation: 0.2919
487
+ Validation loss: 166945040.00 correlation: 0.2479
488
+ Elapse: 544.86s
489
+
490
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
491
+
492
+ Epoch 077/400
493
+ Train loss: 71453328.00 correlation: 0.2949
494
+ Validation loss: 166933984.00 correlation: 0.2480
495
+ Elapse: 545.20s
496
+
497
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
498
+
499
+ Epoch 078/400
500
+ Train loss: 71407184.00 correlation: 0.2951
501
+ Validation loss: 166839616.00 correlation: 0.2480
502
+ Elapse: 545.38s
503
+
504
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
505
+
506
+ Epoch 079/400
507
+ Train loss: 71308560.00 correlation: 0.2960
508
+ Validation loss: 166820688.00 correlation: 0.2484
509
+ Elapse: 545.26s
510
+
511
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
512
+
513
+ Epoch 080/400
514
+ Train loss: 71223520.00 correlation: 0.2968
515
+ Validation loss: 166801616.00 correlation: 0.2487
516
+ Elapse: 545.81s
517
+
518
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
519
+
520
+ Epoch 081/400
521
+ Train loss: 71151600.00 correlation: 0.2975
522
+ Validation loss: 166777584.00 correlation: 0.2485
523
+ Elapse: 545.15s
524
+
525
+ Epoch 082/400
526
+ Train loss: 71166128.00 correlation: 0.2973
527
+ Validation loss: 166806736.00 correlation: 0.2484
528
+ Elapse: 545.51s
529
+
530
+ Epoch 083/400
531
+ Train loss: 71003768.00 correlation: 0.2991
532
+ Validation loss: 166794000.00 correlation: 0.2487
533
+ Elapse: 545.39s
534
+
535
+ Epoch 084/400
536
+ Train loss: 71028680.00 correlation: 0.2987
537
+ Validation loss: 166740976.00 correlation: 0.2486
538
+ Elapse: 545.50s
539
+
540
+ Epoch 085/400
541
+ Train loss: 70987920.00 correlation: 0.2989
542
+ Validation loss: 166771344.00 correlation: 0.2483
543
+ Elapse: 545.38s
544
+
545
+ Loaded checkpoint from epoch 80 (correlation: 0.2487).
546
+
547
+ Reduce learning rate of core to 1.2960e-04 (num. reduce: 1).
548
+ Reduce learning rate of readouts to 9.7200e-05 (num. reduce: 1).
549
+ Reduce learning rate of shifters to 9.7200e-05 (num. reduce: 1).
550
+
551
+ Epoch 086/400
552
+ Train loss: 70886192.00 correlation: 0.2998
553
+ Validation loss: 166696544.00 correlation: 0.2492
554
+ Elapse: 545.68s
555
+
556
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
557
+
558
+ Epoch 087/400
559
+ Train loss: 70891072.00 correlation: 0.2998
560
+ Validation loss: 166700640.00 correlation: 0.2493
561
+ Elapse: 545.36s
562
+
563
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
564
+
565
+ Epoch 088/400
566
+ Train loss: 70786208.00 correlation: 0.3009
567
+ Validation loss: 166720928.00 correlation: 0.2490
568
+ Elapse: 545.75s
569
+
570
+ Epoch 089/400
571
+ Train loss: 70840864.00 correlation: 0.3002
572
+ Validation loss: 166705888.00 correlation: 0.2491
573
+ Elapse: 546.01s
574
+
575
+ Epoch 090/400
576
+ Train loss: 70781008.00 correlation: 0.3008
577
+ Validation loss: 166757248.00 correlation: 0.2489
578
+ Elapse: 545.02s
579
+
580
+ Epoch 091/400
581
+ Train loss: 70768960.00 correlation: 0.3009
582
+ Validation loss: 166698640.00 correlation: 0.2489
583
+ Elapse: 545.07s
584
+
585
+ Epoch 092/400
586
+ Train loss: 70700664.00 correlation: 0.3016
587
+ Validation loss: 166705392.00 correlation: 0.2491
588
+ Elapse: 545.85s
589
+
590
+ Loaded checkpoint from epoch 87 (correlation: 0.2493).
591
+
592
+ Reduce learning rate of core to 3.8880e-05 (num. reduce: 1).
593
+ Reduce learning rate of readouts to 2.9160e-05 (num. reduce: 1).
594
+ Reduce learning rate of shifters to 2.9160e-05 (num. reduce: 1).
595
+
596
+ Epoch 093/400
597
+ Train loss: 70743624.00 correlation: 0.3012
598
+ Validation loss: 166685456.00 correlation: 0.2494
599
+ Elapse: 545.69s
600
+
601
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
602
+
603
+ Epoch 094/400
604
+ Train loss: 70752552.00 correlation: 0.3012
605
+ Validation loss: 166676048.00 correlation: 0.2493
606
+ Elapse: 545.53s
607
+
608
+ Epoch 095/400
609
+ Train loss: 70729328.00 correlation: 0.3013
610
+ Validation loss: 166677072.00 correlation: 0.2494
611
+ Elapse: 545.12s
612
+
613
+ Epoch 096/400
614
+ Train loss: 70661304.00 correlation: 0.3018
615
+ Validation loss: 166687824.00 correlation: 0.2493
616
+ Elapse: 545.30s
617
+
618
+ Epoch 097/400
619
+ Train loss: 70768896.00 correlation: 0.3006
620
+ Validation loss: 166658272.00 correlation: 0.2492
621
+ Elapse: 545.47s
622
+
623
+ Epoch 098/400
624
+ Train loss: 70673976.00 correlation: 0.3017
625
+ Validation loss: 166648288.00 correlation: 0.2495
626
+ Elapse: 545.22s
627
+
628
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
629
+
630
+ Epoch 099/400
631
+ Train loss: 70635672.00 correlation: 0.3022
632
+ Validation loss: 166648032.00 correlation: 0.2495
633
+ Elapse: 545.17s
634
+
635
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
636
+
637
+ Epoch 100/400
638
+ Train loss: 70748008.00 correlation: 0.3010
639
+ Validation loss: 166647312.00 correlation: 0.2495
640
+ Elapse: 545.61s
641
+
642
+ Epoch 101/400
643
+ Train loss: 70682408.00 correlation: 0.3016
644
+ Validation loss: 166662208.00 correlation: 0.2494
645
+ Elapse: 545.56s
646
+
647
+ Epoch 102/400
648
+ Train loss: 70642688.00 correlation: 0.3020
649
+ Validation loss: 166662624.00 correlation: 0.2495
650
+ Elapse: 545.17s
651
+
652
+ Epoch 103/400
653
+ Train loss: 70638368.00 correlation: 0.3019
654
+ Validation loss: 166645120.00 correlation: 0.2495
655
+ Elapse: 545.25s
656
+
657
+ Epoch 104/400
658
+ Train loss: 70563872.00 correlation: 0.3027
659
+ Validation loss: 166649696.00 correlation: 0.2495
660
+ Elapse: 545.70s
661
+
662
+ Loaded checkpoint from epoch 99 (correlation: 0.2495).
663
+
664
+ Reduce learning rate of core to 1.1664e-05 (num. reduce: 1).
665
+ Reduce learning rate of readouts to 8.7480e-06 (num. reduce: 1).
666
+ Reduce learning rate of shifters to 8.7480e-06 (num. reduce: 1).
667
+
668
+ Epoch 105/400
669
+ Train loss: 70679696.00 correlation: 0.3019
670
+ Validation loss: 166646944.00 correlation: 0.2495
671
+ Elapse: 545.44s
672
+
673
+ Epoch 106/400
674
+ Train loss: 70623656.00 correlation: 0.3021
675
+ Validation loss: 166651056.00 correlation: 0.2495
676
+ Elapse: 545.46s
677
+
678
+ Epoch 107/400
679
+ Train loss: 70689912.00 correlation: 0.3013
680
+ Validation loss: 166642080.00 correlation: 0.2495
681
+ Elapse: 545.17s
682
+
683
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
684
+
685
+ Epoch 108/400
686
+ Train loss: 70636352.00 correlation: 0.3019
687
+ Validation loss: 166643376.00 correlation: 0.2495
688
+ Elapse: 545.12s
689
+
690
+ Epoch 109/400
691
+ Train loss: 70622056.00 correlation: 0.3021
692
+ Validation loss: 166645664.00 correlation: 0.2495
693
+ Elapse: 545.91s
694
+
695
+ Epoch 110/400
696
+ Train loss: 70689848.00 correlation: 0.3013
697
+ Validation loss: 166646544.00 correlation: 0.2495
698
+ Elapse: 544.95s
699
+
700
+ Epoch 111/400
701
+ Train loss: 70594792.00 correlation: 0.3025
702
+ Validation loss: 166655344.00 correlation: 0.2494
703
+ Elapse: 545.66s
704
+
705
+ Epoch 112/400
706
+ Train loss: 70636904.00 correlation: 0.3020
707
+ Validation loss: 166638224.00 correlation: 0.2495
708
+ Elapse: 544.74s
709
+
710
+ Loaded checkpoint from epoch 107 (correlation: 0.2495).
711
+
712
+ Reduce learning rate of core to 3.4992e-06 (num. reduce: 1).
713
+ Reduce learning rate of readouts to 2.6244e-06 (num. reduce: 1).
714
+ Reduce learning rate of shifters to 2.6244e-06 (num. reduce: 1).
715
+
716
+ Epoch 113/400
717
+ Train loss: 70679760.00 correlation: 0.3016
718
+ Validation loss: 166645488.00 correlation: 0.2495
719
+ Elapse: 543.62s
720
+
721
+ Epoch 114/400
722
+ Train loss: 70609840.00 correlation: 0.3026
723
+ Validation loss: 166641568.00 correlation: 0.2495
724
+ Elapse: 543.57s
725
+
726
+ Checkpoint saved to /home/storage/runs/vivit_ensemble/028/ckpt/model_state.pt.
727
+
728
+ Epoch 115/400
729
+ Train loss: 70676264.00 correlation: 0.3017
730
+ Validation loss: 166645824.00 correlation: 0.2495
731
+ Elapse: 545.22s
732
+
733
+ Epoch 116/400
734
+ Train loss: 70640760.00 correlation: 0.3023
735
+ Validation loss: 166649888.00 correlation: 0.2495
736
+ Elapse: 545.14s
737
+
738
+ Epoch 117/400
739
+ Train loss: 70651464.00 correlation: 0.3017
740
+ Validation loss: 166644896.00 correlation: 0.2495
741
+ Elapse: 545.75s
742
+
743
+ Epoch 118/400
744
+ Train loss: 70647664.00 correlation: 0.3020
745
+ Validation loss: 166642016.00 correlation: 0.2495
746
+ Elapse: 551.10s
747
+
748
+ Epoch 119/400
749
+ Train loss: 70647632.00 correlation: 0.3017
750
+ Validation loss: 166642992.00 correlation: 0.2495
751
+ Elapse: 545.02s
752
+
753
+ Loaded checkpoint from epoch 114 (correlation: 0.2495).
754
+
755
+ Reduce learning rate of core to 1.0498e-06 (num. reduce: 1).
756
+ Reduce learning rate of readouts to 7.8732e-07 (num. reduce: 1).
757
+ Reduce learning rate of shifters to 7.8732e-07 (num. reduce: 1).
758
+
759
+ Epoch 120/400
760
+ Train loss: 70673976.00 correlation: 0.3014
761
+ Validation loss: 166641376.00 correlation: 0.2495
762
+ Elapse: 544.88s
763
+
764
+ Epoch 121/400
765
+ Train loss: 70599064.00 correlation: 0.3023
766
+ Validation loss: 166642464.00 correlation: 0.2495
767
+ Elapse: 544.91s
768
+
769
+ Epoch 122/400
770
+ Train loss: 70592552.00 correlation: 0.3025
771
+ Validation loss: 166642720.00 correlation: 0.2495
772
+ Elapse: 544.80s
773
+
774
+ Epoch 123/400
775
+ Train loss: 70644184.00 correlation: 0.3019
776
+ Validation loss: 166643072.00 correlation: 0.2495
777
+ Elapse: 544.57s
778
+
779
+ Epoch 124/400
780
+ Train loss: 70629504.00 correlation: 0.3022
781
+ Validation loss: 166642208.00 correlation: 0.2495
782
+ Elapse: 545.38s
783
+
784
+ Loaded checkpoint from epoch 114 (correlation: 0.2495).
785
+
786
+ Reduce learning rate of core to 3.1493e-07 (num. reduce: 2).
787
+ Reduce learning rate of readouts to 2.3620e-07 (num. reduce: 2).
788
+ Reduce learning rate of shifters to 2.3620e-07 (num. reduce: 2).
789
+
790
+ Epoch 125/400
791
+ Train loss: 70617168.00 correlation: 0.3023
792
+ Validation loss: 166641952.00 correlation: 0.2495
793
+ Elapse: 544.97s
794
+
795
+ Epoch 126/400
796
+ Train loss: 70613328.00 correlation: 0.3026
797
+ Validation loss: 166642704.00 correlation: 0.2495
798
+ Elapse: 544.92s
799
+
800
+ Epoch 127/400
801
+ Train loss: 70681712.00 correlation: 0.3016
802
+ Validation loss: 166642848.00 correlation: 0.2495
803
+ Elapse: 544.98s
804
+
805
+ Epoch 128/400
806
+ Train loss: 70630672.00 correlation: 0.3021
807
+ Validation loss: 166642912.00 correlation: 0.2495
808
+ Elapse: 544.96s
809
+
810
+ Epoch 129/400
811
+ Train loss: 70600632.00 correlation: 0.3025
812
+ Validation loss: 166642848.00 correlation: 0.2495
813
+ Elapse: 545.27s
814
+
815
+ Model has not improved after 2 LR reductions.
816
+
817
+ Loaded checkpoint from epoch 114 (correlation: 0.2495).
818
+
819
+
820
+ ValidationA: 0.2465 B: 0.2783 C: 0.2688 D: 0.2292 E: 0.2366 F: 0.2341 G: 0.2549 H: 0.2330 I: 0.2567 J: 0.2571 average: 0.2495
821
+
822
+ Results saved to /home/storage/runs/vivit_ensemble/028.