|
11:44:11 {'seed': 1, 'ver': 'v1a', 'use_log': True, 'use_tqdm': True, 'debug': False, 'tokenizer': BertTokenizerFast(name_or_path='tokenizer', vocab_size=52000, model_max_length=512, is_fast=True, padding_side='right', truncation_side='right', special_tokens={'unk_token': '[UNK]', 'sep_token': '[SEP]', 'pad_token': '[PAD]', 'cls_token': '[CLS]', 'mask_token': '[MASK]'}, clean_up_tokenization_spaces=True), 'config': <custom_config.LongBERTConfig object at 0x7f2b78440110>, 'max_len': 45000, 'train_one_part': False, 'gradient_accumulation_steps': 2, 'apex': True, 'device': device(type='cuda', index=1), 'nepochs': 4, 'batch_size': 2, 'num_workers': 128, 'lr': 2e-05, 'weight_decay': 0.01, 'encoder_lr': 2e-05, 'decoder_lr': 0.001, 'min_lr': 1e-06, 'eps': 1e-06, 'betas': (0.9, 0.999), 'scheduler_type': 'cosine', 'num_cycles': 0.5, 'num_warmup_steps': 0.0, 'train_data_dir': 'data/train', 'valid_data_dir': 'data/valid', 'test_data_dir': '.', 'output_dir': 'model/v1/a'} |