"""Module-level configuration constants (model sizes, data, optimisation).

Every name here is a plain module-level constant; nothing is computed at
import time except ``DEVICE``, which probes CUDA availability once.
"""

import torch


# --- Model / input dimensions ---------------------------------------------
IMAGE_SIZE = 512
PATCH_SIZE = 16
HIDDEN_DIM = 256
# NOTE(review): 1536 == (IMAGE_SIZE // PATCH_SIZE) ** 2 + TEXT_LENGTH
# (1024 + 512); presumably image patches plus text tokens -- confirm
# before changing any of the three values independently.
CONTEXT_LENGTH = 1536
TEXT_LENGTH = 512
PROMPT_LENGTH = 64
DROPOUT = 0.1
NUM_HEADS = 8
NUM_LAYERS = 12

# --- Optimisation ---------------------------------------------------------
BATCH_SIZE = 16
LEARNING_RATE = 1e-3
DTYPE = torch.float32
# NOTE(review): if gradients are accumulated across this many batches, the
# effective batch is BATCH_SIZE * GRAD_ACCUMULATION_STEPS = 256 -- confirm
# against the training loop.
GRAD_ACCUMULATION_STEPS = 16

# --- Data -----------------------------------------------------------------
# Per-channel statistics; the values coincide with the widely used ImageNet
# RGB mean / std.
IMAGE_MEAN = [0.485, 0.456, 0.406]
IMAGE_STD = [0.229, 0.224, 0.225]
# Evaluated once at import: 'cuda' when a CUDA device is visible, else 'cpu'.
DEVICE = 'cuda' if torch.cuda.is_available() else 'cpu'
IMAGE_LOCATION = "./images/"
# NUM_BINS was previously assigned twice with the same value; it is now
# defined exactly once.
NUM_BINS = 32
SHARED_EMBED_DIM = 256
MAX_POINTS = 10


# --- Training schedule / loss weighting -----------------------------------
NUM_EPOCHS = 400
LOGGING_STEPS = 1
MAX_GRAD_NORM = 1.0
# NOTE(review): presumably weights for the contrastive and regression loss
# terms -- confirm where the total loss is assembled.
LAMBDA_CONTRASTIVE = 2
LAMBDA_REGRESSION = 2