Spaces:
Running
Running
File size: 885 Bytes
653dc95 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 |
# ---------------------------------------------------------------------------
# Model architecture
# ---------------------------------------------------------------------------
# Patch length
PATCH_LENGTH = 128
# Patch size
PATCH_SIZE = 32
# Depth of the encoder (number of layers)
PATCH_NUM_LAYERS = 9
# Depth of the decoder (number of layers)
CHAR_NUM_LAYERS = 3
# When True, the encoder and decoder share their weights
SHARE_WEIGHTS = False

# ---------------------------------------------------------------------------
# Training
# ---------------------------------------------------------------------------
# Maximum number of training epochs; early stopping may end training sooner.
# NOTE(review): this line previously carried a bare trailing "# 32" --
# presumably an earlier or alternative epoch count; confirm before relying on it.
NUM_EPOCHS = 5
# Learning rate handed to the optimizer
LEARNING_RATE = 5e-5
# Patch batch size used during training; 0 selects the full context
PATCH_SAMPLING_BATCH_SIZE = 0
# When True, weights are loaded from a checkpoint
LOAD_FROM_CHECKPOINT = True

# ---------------------------------------------------------------------------
# Remote weight locations
# ---------------------------------------------------------------------------
# weights.pth hosted on Hugging Face
WEIGHT_URL = "https://huggingface.co/MuGeminorum/hoyoGPT/resolve/main/weights.pth"
# weights.pth hosted on ModelScope (presumably a mirror of the file above -- confirm)
ZH_WEIGHT_URL = "https://www.modelscope.cn/api/v1/models/MuGeminorum/hoyoGPT/repo?Revision=master&FilePath=weights.pth"

# ---------------------------------------------------------------------------
# Local file names
# ---------------------------------------------------------------------------
WEIGHT_PATH = "weights.pth"
LOG_PATH = "logs.txt"
PROMPT_PATH = "prompt.txt"
|