File size: 2,194 Bytes
945d036 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 |
accum_freq: 1 aug_cfg: {} batch_size: 32 beta1: 0.9 beta2: 0.999 cache_dir: None checkpoint_path: ./logs/2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16/checkpoints coca_caption_loss_weight: 2.0 coca_contrastive_loss_weight: 1.0 copy_codebase: False csv_caption_key: title csv_img_key: filepath csv_separator: dataset_resampled: False dataset_type: hf ddp_static_graph: False debug: False delete_previous_checkpoint: False device: cuda dist_backend: None dist_url: None distill: False distill_model: None distill_pretrained: None distributed: False epochs: 30 epochs_cooldown: None eps: 1e-08 force_custom_text: False force_image_size: None force_patch_dropout: None force_quick_gelu: False gather_with_grad: False grad_checkpointing: False grad_clip_norm: None hf_dataset: photonmz/opi_function_packed horovod: False image_interpolation: None image_mean: None image_resize_mode: None image_std: None imagenet_v2: None imagenet_val: None local_loss: False local_rank: 0 lock_image: False lock_image_freeze_bn_stats: False lock_image_unlocked_groups: 0 lock_text: False lock_text_freeze_layer_norm: False lock_text_unlocked_layers: 0 log_every_n_steps: 100 log_level: 20 log_local: False log_path: ./logs/2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16/out.log logs: ./logs/ loss_dist_impl: None lr: 0.0002 lr_cooldown_end: 0.0 lr_cooldown_power: 1.0 lr_scheduler: cosine model: crisp_1 momentum: None name: 2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16 no_set_device_rank: False opt: adamw precision: amp_bfloat16 pretrained: pretrained_image: False rank: 0 remote_sync: None remote_sync_frequency: 300 remote_sync_protocol: s3 report_to: wandb resume: None save_frequency: 1 save_most_recent: True seed: 0 siglip: False skip_scheduler: False tensorboard: False tensorboard_path: torchcompile: False torchscript: False trace: False train_data: stub train_data_upsampling_factors: None train_num_samples: None use_bn_sync: False use_bnb_linear: None val_data: stub val_frequency: 1 val_num_samples: None wandb: True wandb_notes: wandb_project_name: open-clip warmup: 10000 wd: 0.1 workers: 1 world_size: 1 zeroshot_frequency: 1 |