# Viewer metadata: file size 1,414 bytes; short hash 7806f40 (presumably the
# commit this copy was taken from; confirm). The viewer's line-number gutter
# (1-64) that followed here was not part of the configuration.
# Training-run configuration: model `roberta-base`, dataset `mnli`.
#
# NOTE(review): the nesting below was reconstructed from a copy of this file
# in which all indentation had been lost. Read as a flat mapping, that copy
# contained duplicate keys (`seed`, `name`, `_target_`), which most parsers
# resolve silently as last-value-wins. Keys and values are unchanged; only
# the structure was restored. Placements marked "TODO confirm" could not be
# determined from the flattened text alone.

experiment_group: training
run_name: roberta-base_2024-04-23T15-11-06
seed: 42

model:
  name: roberta-base
  revision: null
  # Separate from the top-level `seed`; both are 42 in this run.
  seed: 42

# TODO confirm: assumed top-level; `base_model` may instead belong to `model`.
base_model: roberta-base

estimator:
  accelerator: gpu
  precision: bf16-true
  deterministic: true
  tf32_mode: high
  convert_to_bettertransformer: false

fit:
  max_epochs: 20
  min_epochs: null
  optimizer_kwargs:
    name: adamw
    lr: 3.0e-05
    init_kwargs:
      fused: true
  scheduler_kwargs:
    name: constant_schedule_with_warmup
    num_warmup_steps: 2000
  log_interval: 100
  enable_progress_bar: true
  limit_train_batches: null

data:
  batch_size: 32
  eval_batch_size: 128
  shuffle: true
  replacement: false
  data_seed: 42
  drop_last: false
  num_workers: 8
  pin_memory: true
  persistent_workers: false
  multiprocessing_context: null
  max_length: 512

# TODO confirm: the five keys below are assumed to be top-level rather than
# children of `data`.
# NOTE(review): both paths are absolute and specific to one user's home
# directory.
root_path: /home/pl487/coreset-project
data_path: /home/pl487/coreset-project/data/processed
dataset: mnli
dataset_split: train
evaluation: null

# Each leaf entry under `loggers` and `callbacks` names a class to build via
# `_target_`; sibling keys are presumably its constructor arguments (confirm
# against the consuming code).
loggers:
  tensorboard:
    _target_: energizer.loggers.TensorBoardLogger
    root_dir: ./
    name: tb_logs
    version: null

callbacks:
  timer:
    _target_: energizer.active_learning.callbacks.Timer
  lr_monitor:
    _target_: energizer.callbacks.lr_monitor.LearningRateMonitor
  model_checkpoint:
    _target_: energizer.callbacks.model_checkpoint.ModelCheckpoint
    dirpath: .checkpoints
    stage: train
    # Plain string scalar; presumably "<count>:<unit>" (confirm).
    frequency: 1:epoch

user:
  id: pl487