saicharan1234 committed on
Commit
24a2ec2
·
verified ·
1 Parent(s): 5056230

Delete train_configs

Browse files
train_configs/minigpt4_stage1_laion.yaml DELETED
@@ -1,62 +0,0 @@
1
- # Copyright (c) 2022, salesforce.com, inc.
2
- # All rights reserved.
3
- # SPDX-License-Identifier: BSD-3-Clause
4
- # For full license text, see the LICENSE file in the repo root or https://opensource.org/licenses/BSD-3-Clause
5
-
6
- model:
7
- arch: mini_gpt4
8
- model_type: pretrain_vicuna
9
- freeze_vit: True
10
- freeze_qformer: True
11
-
12
-
13
- datasets:
14
- laion:
15
- vis_processor:
16
- train:
17
- name: "blip2_image_train"
18
- image_size: 224
19
- text_processor:
20
- train:
21
- name: "blip_caption"
22
- sample_ratio: 115
23
- cc_combine:
24
- vis_processor:
25
- train:
26
- name: "blip2_image_train"
27
- image_size: 224
28
- text_processor:
29
- train:
30
- name: "blip_caption"
31
- sample_ratio: 14
32
-
33
-
34
- run:
35
- task: image_text_pretrain
36
- # optimizer
37
- lr_sched: "linear_warmup_cosine_lr"
38
- init_lr: 1e-4
39
- min_lr: 3e-5
40
- warmup_lr: 1e-6
41
-
42
- weight_decay: 0.05
43
- max_epoch: 4
44
- batch_size_train: 64
45
- batch_size_eval: 64
46
- num_workers: 4
47
- warmup_steps: 5000
48
- iters_per_epoch: 5000
49
-
50
- seed: 42
51
- output_dir: "/path/to/save/your/model/"
52
-
53
- amp: True
54
- resume_ckpt_path: null
55
-
56
- evaluate: False
57
- train_splits: ["train"]
58
-
59
- device: "cuda"
60
- world_size: 1
61
- dist_url: "env://"
62
- distributed: True
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
train_configs/minigpt4_stage2_align.yaml DELETED
@@ -1,56 +0,0 @@
1
- # Copyright (c) 2022, salesforce.com, inc.
2
- # All rights reserved.
3
- # SPDX-License-Identifier: BSD-3-Clause
4
- # For full license text, see the LICENSE file in the repo root or https://opensource.org/licenses/BSD-3-Clause
5
-
6
- model:
7
- arch: mini_gpt4
8
- model_type: pretrain_vicuna
9
- freeze_vit: True
10
- freeze_qformer: True
11
- max_txt_len: 160
12
- end_sym: "###"
13
- prompt_path: "prompts/alignment.txt"
14
- prompt_template: '###Human: {} ###Assistant: '
15
- ckpt: '/ibex/project/c2133/vicuna_jun_checkpoint_wihtout_prompt/20230412162/checkpoint_3.pth'
16
-
17
-
18
- datasets:
19
- cc_align:
20
- vis_processor:
21
- train:
22
- name: "blip2_image_train"
23
- image_size: 224
24
- text_processor:
25
- train:
26
- name: "blip_caption"
27
-
28
- run:
29
- task: image_text_pretrain
30
- # optimizer
31
- lr_sched: "linear_warmup_cosine_lr"
32
- init_lr: 3e-5
33
- min_lr: 1e-5
34
- warmup_lr: 1e-6
35
-
36
- weight_decay: 0.05
37
- max_epoch: 5
38
- iters_per_epoch: 200
39
- batch_size_train: 12
40
- batch_size_eval: 12
41
- num_workers: 4
42
- warmup_steps: 200
43
-
44
- seed: 42
45
- output_dir: "/ibex/project/c2133/vicuna_ckpt_test/minigpt4_stage2_align"
46
-
47
- amp: True
48
- resume_ckpt_path: null
49
-
50
- evaluate: False
51
- train_splits: ["train"]
52
-
53
- device: "cuda"
54
- world_size: 1
55
- dist_url: "env://"
56
- distributed: True