File size: 2,631 Bytes
78ab311
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
{
    "model": {
        "name": "PatchFusion",
        "version_name": "patchfusion",
        "n_bins": 64,
        "bin_embedding_dim": 128,
        "bin_centers_type": "softplus",
        "n_attractors":[16, 8, 4, 1],
        "attractor_alpha": 1000,
        "attractor_gamma": 2,
        "attractor_kind" : "mean",
        "attractor_type" : "inv",
        "midas_model_type" : "DPT_BEiT_L_384",
        "min_temp": 0.0212,
        "max_temp": 50.0,
        "output_distribution": "logbinomial",
        "memory_efficient": true,
        "inverse_midas": false,
        "img_size": [384, 512],
        "do_resize": false, // do resize in dataloader to speed up
        "raw_depth_shape": [2160, 3840], // 540, 960
        "sr_ratio": 1,
        "sampled_training": false,
        "transform_sample_gt_size": [2160, 3840],
        "sample_feat_level": 4,
        "use_hr": false,
        "baseline": true,
        "condition": true,
        "freeze": true,
        "g2l": true,
        "use_fusion_network": true,
        "use_area_prior": true,
        "consistency_training": true,
        // "consistency_target": "final_feat",
        "consistency_target": "mix",
    },
    
    "train": {
        "use_rgb": true,
        "use_blur": false,
        "train_midas": true,
        "use_pretrained_midas": true,
        "trainer": "zoedepth_custom",
        "epochs": 12,
        "bs": 16,
        "optim_kwargs": {"lr": 0.0001, "wd": 0.01},
        "sched_kwargs": {"div_factor": 10, "final_div_factor": 10000, "pct_start": 0.5, "three_phase":false, "cycle_momentum": true},
        "same_lr": false,
        "w_si": 1,
        "w_domain": 0.2,
        "w_reg": 0,
        "w_grad": 0,
        "avoid_boundary": false,
        "random_crop": true,
        "input_width": 640,
        "input_height": 480,
        "midas_lr_factor": 1,
        "encoder_lr_factor":10,
        "pos_enc_lr_factor":10,
        "freeze_midas_bn": true,
        "sec_stage": true,
        "multi_consistency": true,
        "w_consistency": 0.1, // consistency weight here
        "overlap_length_h": 135,
        "overlap_length_w": 240,
        "w_p": 0.1 // weight of pred depth in consistency loss
    },

    "infer":{
        "train_midas": false,
        "use_pretrained_midas": false,
        "pretrained_resource" : "url::https://github.com/isl-org/ZoeDepth/releases/download/v1.0/ZoeD_M12_N.pt",
        "force_keep_ar": true
    },

    "eval":{
        "train_midas": false,
        "use_pretrained_midas": false,
        "pretrained_resource" : "url::https://github.com/isl-org/ZoeDepth/releases/download/v1.0/ZoeD_M12_N.pt"
    }
}