File size: 885 Bytes
653dc95
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
# ---------------------------------------------------------------------------
# Patch geometry
# ---------------------------------------------------------------------------
# Patch length.
PATCH_LENGTH = 128
# Patch size.
PATCH_SIZE = 32

# ---------------------------------------------------------------------------
# Model depth
# ---------------------------------------------------------------------------
# Layer count of the encoder.
PATCH_NUM_LAYERS = 9
# Layer count of the decoder.
CHAR_NUM_LAYERS = 3

# ---------------------------------------------------------------------------
# Training
# ---------------------------------------------------------------------------
# Upper bound on training epochs; early stopping may end the run sooner.
# NOTE(review): a bare "32" was written next to this value — presumably an
# earlier or alternative setting; confirm before relying on it.
NUM_EPOCHS = 5
# Learning rate handed to the optimizer.
LEARNING_RATE = 5e-5
# Patch batch size used while training; 0 selects the full context.
PATCH_SAMPLING_BATCH_SIZE = 0
# When True, weights are loaded from a checkpoint.
LOAD_FROM_CHECKPOINT = True
# When True, the encoder and decoder share weights.
SHARE_WEIGHTS = False

# ---------------------------------------------------------------------------
# Weight sources and local file names
# ---------------------------------------------------------------------------
# Weights file hosted on Hugging Face.
WEIGHT_URL = 'https://huggingface.co/MuGeminorum/hoyoGPT/resolve/main/weights.pth'
# Weights file hosted on ModelScope.
# NOTE(review): the "ZH" prefix presumably marks a mirror for users in China — confirm.
ZH_WEIGHT_URL = 'https://www.modelscope.cn/api/v1/models/MuGeminorum/hoyoGPT/repo?Revision=master&FilePath=weights.pth'
# File name for the weights file.
WEIGHT_PATH = 'weights.pth'
# File name for the log file.
LOG_PATH = 'logs.txt'
# File name for the prompt file.
PROMPT_PATH = 'prompt.txt'