# Spaces: Running (page-banner residue captured with this file; not part of the configuration)
# Configuration constants: model dimensions, training settings, and the
# locations of the weight, log and prompt files.

# --- Model ---
PATCH_LENGTH = 128  # Patch length
PATCH_SIZE = 32  # Patch size
PATCH_NUM_LAYERS = 9  # Number of layers in the encoder
CHAR_NUM_LAYERS = 3  # Number of layers in the decoder

# --- Training ---
# Number of epochs to train for (if early stopping doesn't intervene).
# NOTE(review): the original inline comment on this line was just "32" --
# presumably an alternative or earlier epoch count; confirm before changing.
NUM_EPOCHS = 5
LEARNING_RATE = 5e-5  # Learning rate for the optimizer
# Batch size for patch during training, 0 for full context
PATCH_SAMPLING_BATCH_SIZE = 0
LOAD_FROM_CHECKPOINT = True  # Whether to load weights from a checkpoint
# Whether to share weights between the encoder and decoder
SHARE_WEIGHTS = False

# --- Weight sources and file names ---
# URL of the weights file hosted on huggingface.co
WEIGHT_URL = 'https://huggingface.co/MuGeminorum/hoyoGPT/resolve/main/weights.pth'
# URL of the same-named weights file hosted on modelscope.cn
# NOTE(review): presumably a mirror for users in China ("ZH") -- confirm.
ZH_WEIGHT_URL = 'https://www.modelscope.cn/api/v1/models/MuGeminorum/hoyoGPT/repo?Revision=master&FilePath=weights.pth'
WEIGHT_PATH = 'weights.pth'  # File name/path of the weights file
LOG_PATH = 'logs.txt'  # File name/path of the log file
PROMPT_PATH = 'prompt.txt'  # File name/path of the prompt file