"""Module-level configuration constants.

Every name here is a plain module attribute; the only computed value is
``DEVICE``, which is resolved once at import time.
"""

import torch

# --- Input sizes and sequence lengths ---------------------------------------
IMAGE_SIZE = 512
PATCH_SIZE = 16
HIDDEN_DIM = 256
# NOTE(review): 1536 == (IMAGE_SIZE // PATCH_SIZE) ** 2 + TEXT_LENGTH, so this
# looks derived from the values around it -- confirm before changing any of
# them independently.
CONTEXT_LENGTH = 1536
TEXT_LENGTH = 512
PROMPT_LENGTH = 64

# --- Model hyperparameters --------------------------------------------------
DROPOUT = 0.1
NUM_HEADS = 8
NUM_LAYERS = 12

# --- Optimisation -----------------------------------------------------------
BATCH_SIZE = 16
LEARNING_RATE = 1e-3
DTYPE = torch.float32
GRAD_ACCUMULATION_STEPS = 16

# --- Image preprocessing ----------------------------------------------------
# Per-channel values; they match the commonly used ImageNet RGB statistics.
IMAGE_MEAN = [0.485, 0.456, 0.406]
IMAGE_STD = [0.229, 0.224, 0.225]

# Chosen once at import time: CUDA when torch reports it available, else CPU.
DEVICE = 'cuda' if torch.cuda.is_available() else 'cpu'

IMAGE_LOCATION = "./images/"

# --- Binning / embedding sizes ----------------------------------------------
# NUM_BINS used to be assigned twice with the same value; it is defined once
# here so the two copies cannot drift apart.
NUM_BINS = 32
SHARED_EMBED_DIM = 256
MAX_POINTS = 10

# --- Training loop ----------------------------------------------------------
NUM_EPOCHS = 400
LOGGING_STEPS = 1
MAX_GRAD_NORM = 1.0

# Loss-term weights (presumably multipliers on the contrastive and regression
# losses -- verify against the training code).
LAMBDA_CONTRASTIVE = 2
LAMBDA_REGRESSION = 2