import torch


class CFG:
    """Hyperparameters and model settings collected as class attributes.

    The class is used as a plain namespace: nothing here requires an
    instance, values are read as ``CFG.<name>``.  ``device`` is resolved
    once, when the class body executes (i.e. at import time).

    The code that consumes these values is not part of this file, so the
    comments below describe what each setting presumably controls; verify
    them against the training / model code before relying on them.
    """

    # --- run / data-loading settings -------------------------------------
    debug = False
    batch_size = 32
    num_workers = 2  # presumably the DataLoader worker count -- confirm

    # --- optimisation ----------------------------------------------------
    # Three separate learning rates; presumably one per parameter group
    # (projection heads, image encoder, text encoder) -- confirm against
    # the optimizer setup.
    head_lr = 1e-3
    image_encoder_lr = 1e-4
    text_encoder_lr = 1e-5
    weight_decay = 1e-3
    # presumably learning-rate scheduler settings (e.g. reduce-on-plateau
    # patience and decay factor) -- confirm
    patience = 1
    factor = 0.8
    epochs = 1

    # Picks CUDA when it is available at import time, otherwise CPU.
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

    # --- encoders --------------------------------------------------------
    model_name = 'resnet50'
    # 2048 is the pooled feature width of a ResNet-50; presumably must be
    # kept in sync with ``model_name`` -- confirm.
    image_embedding = 2048
    text_encoder_model = "distilbert-base-uncased"
    # 768 is the hidden size of DistilBERT base; presumably must be kept
    # in sync with ``text_encoder_model`` -- confirm.
    text_embedding = 768
    text_tokenizer = "distilbert-base-uncased"
    max_length = 200  # presumably the tokenizer's max sequence length -- confirm

    # presumably applied to both encoders (load pretrained weights / allow
    # fine-tuning) -- confirm
    pretrained = True
    trainable = True
    temperature = 1.0  # presumably the logit scaling used by the loss -- confirm

    # presumably the side length (pixels) images are resized to -- confirm
    size = 224

    # --- projection head (presumably shared by image and text branches) --
    num_projection_layers = 1
    projection_dim = 256
    dropout = 0.1