# File size: 1,414 Bytes
# 7806f40
# Run identity: the group this run is filed under, the run's name, and the
# top-level random seed.
experiment_group: training
# Model name followed by what looks like a launch timestamp
# (NOTE(review): presumably generated at launch time; confirm with the launcher).
run_name: roberta-base_2024-04-23T15-11-06
# Same value as model.seed and data.data_seed in this file.
seed: 42
# Model selection for this run.
model:
  name: roberta-base
  # Explicit null: no revision is pinned here.
  # NOTE(review): presumably the consumer falls back to its default revision; verify.
  revision: null
  # Same value as the top-level seed.
  seed: 42
  # Identical to `name` in this run.
  base_model: roberta-base
# Estimator settings: target accelerator and numeric behaviour.
estimator:
  accelerator: gpu
  # Plain string scalar.
  # NOTE(review): presumably selects bfloat16 for both weights and compute;
  # confirm against the consuming library.
  precision: bf16-true
  deterministic: true
  # NOTE(review): presumably forwarded to a float32 matmul-precision setting;
  # confirm against the consuming library.
  tf32_mode: high
  convert_to_bettertransformer: false
# Training-loop settings: epoch bounds, optimizer, LR scheduler, and logging.
fit:
  max_epochs: 20
  # Explicit null: no minimum number of epochs is configured.
  min_epochs: null
  optimizer_kwargs:
    name: adamw
    # Written with a decimal point and a signed exponent, which is the form
    # YAML 1.1 loaders such as PyYAML resolve to a float rather than a string.
    lr: 3.0e-05
    # NOTE(review): presumably passed through to the optimizer constructor; verify.
    init_kwargs:
      fused: true
  scheduler_kwargs:
    name: constant_schedule_with_warmup
    num_warmup_steps: 2000
    # NOTE(review): unit is not stated here (presumably steps); verify.
  log_interval: 100
  enable_progress_bar: true
  # Explicit null: no limit on train batches is configured.
  limit_train_batches: null
# Data-loading settings.
# NOTE(review): several keys share names with PyTorch DataLoader/sampler
# arguments and are presumably forwarded to them; confirm with the consumer.
data:
  # Training and evaluation use different batch sizes.
  batch_size: 32
  eval_batch_size: 128
  shuffle: true
  replacement: false
  # Same value as the top-level seed.
  data_seed: 42
  drop_last: false
  num_workers: 8
  pin_memory: true
  persistent_workers: false
  multiprocessing_context: null
  # NOTE(review): presumably the maximum sequence length in tokens; verify.
  max_length: 512
# Filesystem locations and dataset selection.
# Both paths are absolute and sit under one user's home directory, so they are
# specific to the machine this run was configured on.
root_path: /home/pl487/coreset-project
# Located under root_path, but spelled out in full rather than derived from it.
data_path: /home/pl487/coreset-project/data/processed
dataset: mnli
dataset_split: train
# Explicit null: no evaluation settings are configured for this run.
evaluation: null
# Loggers, keyed by a short name.
# NOTE(review): `_target_` holds a dotted import path, presumably instantiated
# Hydra-style with the sibling keys as constructor arguments; verify.
loggers:
  tensorboard:
    _target_: energizer.loggers.TensorBoardLogger
    # Relative path.
    # NOTE(review): presumably resolved against the run's working directory; verify.
    root_dir: ./
    name: tb_logs
    # Explicit null: no version is fixed here.
    version: null
# Callbacks, keyed by a short name; each entry names its class via `_target_`.
# NOTE(review): presumably instantiated Hydra-style with the sibling keys as
# constructor arguments; verify.
callbacks:
  # Note: this target lives under energizer.active_learning.callbacks, while
  # the other two callbacks live under energizer.callbacks.
  timer:
    _target_: energizer.active_learning.callbacks.Timer
  lr_monitor:
    _target_: energizer.callbacks.lr_monitor.LearningRateMonitor
  model_checkpoint:
    _target_: energizer.callbacks.model_checkpoint.ModelCheckpoint
    # Relative directory name.
    dirpath: .checkpoints
    stage: train
    # Plain string scalar: the colon is not followed by a space, so it does not
    # start a nested mapping, and the value is not all digits-and-colons.
    # NOTE(review): presumably means "every 1 epoch"; verify against ModelCheckpoint.
    frequency: 1:epoch
# User the run is attributed to; the id matches the home-directory name used
# in root_path and data_path.
user:
  id: pl487