# Version marker written at the top of this wandb run-config file
# (presumably the config-file format version — confirm against wandb).
wandb_version: 1

# Run metadata stored under `_wandb`: interpreter/library versions, start time,
# and two integer-keyed tables (`t` and `m`).
# NOTE(review): the integer keys and codes inside `t` and `m` are not explained
# anywhere in this file; they look like wandb-internal telemetry and
# metric-definition codes. Treat them as machine-managed — do not hand-edit.
_wandb:
  desc: null
  value:
    python_version: 3.9.17
    cli_version: 0.15.9
    framework: huggingface
    huggingface_version: 4.36.0
    is_jupyter_run: false
    is_kaggle_kernel: false
    # Numeric timestamp; presumably Unix seconds at run start — confirm.
    start_time: 1709313942.075548
    # Integer-coded table; lists under keys 1 and 2 are identical.
    t:
      1:
      - 1
      - 9
      - 11
      - 49
      - 50
      - 51
      - 55
      - 71
      - 103
      2:
      - 1
      - 9
      - 11
      - 49
      - 50
      - 51
      - 55
      - 71
      - 103
      3:
      - 2
      - 7
      - 15
      - 23
      # Keys 4, 5 and 6 repeat python_version, cli_version and
      # huggingface_version from above.
      4: 3.9.17
      5: 0.15.9
      6: 4.36.0
      8:
      - 5
    # One entry per metric name (key `1`). The first entry
    # (trainer/global_step) has only `6: [3]`; the remaining entries carry
    # `5: 1` and `6: [1]`.
    # NOTE(review): `5: 1` presumably points at entry 1 (trainer/global_step)
    # as the step axis — confirm against wandb's define_metric handling.
    m:
    - 1: trainer/global_step
      6:
      - 3
    - 1: loss/train_step
      5: 1
      6:
      - 1
    - 1: epoch
      5: 1
      6:
      - 1
    - 1: loss/val
      5: 1
      6:
      - 1
    - 1: metric/exact_encoding_matches/val
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/all/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/micro/f1/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/micro/recall/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/micro/precision/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/background_claim/f1/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/background_claim/recall/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/background_claim/precision/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/data/f1/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/data/recall/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/data/precision/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/own_claim/f1/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/own_claim/recall/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/own_claim/precision/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/macro/f1/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/macro/recall/val
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/macro/precision/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/micro/f1/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/micro/recall/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/micro/precision/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/parts_of_same/f1/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/parts_of_same/recall/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/parts_of_same/precision/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/supports/f1/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/supports/recall/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/supports/precision/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/contradicts/f1/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/contradicts/recall/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/contradicts/precision/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/macro/f1/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/macro/recall/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/macro/precision/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/semantically_same/f1/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/semantically_same/recall/val
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/semantically_same/precision/val
      5: 1
      6:
      - 1
    - 1: loss/train_epoch
      5: 1
      6:
      - 1
    - 1: metric/exact_encoding_matches/train
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/label/train
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/index/train
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/len/train
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/order/train
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/correct/train
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/all/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/background_claim/f1/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/background_claim/recall/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/background_claim/precision/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/data/f1/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/data/recall/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/data/precision/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/own_claim/f1/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/own_claim/recall/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/own_claim/precision/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/micro/f1/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/micro/recall/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/micro/precision/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/macro/f1/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/macro/recall/train
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/macro/precision/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/supports/f1/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/supports/recall/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/supports/precision/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/micro/f1/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/micro/recall/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/micro/precision/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/parts_of_same/f1/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/parts_of_same/recall/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/parts_of_same/precision/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/contradicts/f1/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/contradicts/recall/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/contradicts/precision/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/semantically_same/f1/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/semantically_same/recall/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/semantically_same/precision/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/macro/f1/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/macro/recall/train
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/macro/precision/train
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/correct/val
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/index/val
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/len/val
      5: 1
      6:
      - 1
    - 1: loss/test
      5: 1
      6:
      - 1
    - 1: metric/exact_encoding_matches/test
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/correct/test
      5: 1
      6:
      - 1
    - 1: metric/decoding_errors/all/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/micro/f1/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/micro/recall/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/micro/precision/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/own_claim/f1/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/own_claim/recall/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/own_claim/precision/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/background_claim/f1/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/background_claim/recall/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/background_claim/precision/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/data/f1/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/data/recall/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/data/precision/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/macro/f1/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/macro/recall/test
      5: 1
      6:
      - 1
    - 1: metric/labeled_spans/macro/precision/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/micro/f1/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/micro/recall/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/micro/precision/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/parts_of_same/f1/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/parts_of_same/recall/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/parts_of_same/precision/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/supports/f1/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/supports/recall/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/supports/precision/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/contradicts/f1/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/contradicts/recall/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/contradicts/precision/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/semantically_same/f1/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/semantically_same/recall/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/semantically_same/precision/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/macro/f1/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/macro/recall/test
      5: 1
      6:
      - 1
    - 1: metric/binary_relations/macro/precision/test
      5: 1
      6:
      - 1
# Parameter counts recorded for the run. `total` equals `trainable` and
# `non_trainable` is 0, i.e. no parameters are recorded as frozen.
_num_params/total:
  desc: null
  value: 141788928
_num_params/trainable:
  desc: null
  value: 141788928
_num_params/non_trainable:
  desc: null
  value: 0
# Full experiment configuration stored with the run.
# NOTE(review): this appears to be a resolved Hydra/OmegaConf config — the
# `_target_` / `_processor_` entries are dotted import paths; confirm with the
# training entry point before relying on that.
_config:
  desc: null
  value:
    pipeline_type: training
    name: dataset-sciarg/task-ner_re/v0.3
    tags:
    - task=ner_re
    - model=pointer_network
    train: true
    validate: true
    test: true
    # The same metric/mode pair is repeated in callbacks.model_checkpoint and
    # callbacks.early_stopping below; keep all three in sync.
    monitor_metric: metric/binary_relations/micro/f1/val
    monitor_mode: max
    seed: 1
    ckpt_path: null
    push_to_hub: false
    # NOTE(review): the timestamp here (18-25-32) is one second later than the
    # one used for the log/output directories below (18-25-31).
    model_save_dir: /home/arne/projects/pie-document-level/models/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-32
    dataset:
      _target_: src.utils.execute_pipeline
      input:
        _target_: pie_datasets.DatasetDict.load_dataset
        path: pie/sciarg
        # Dataset revision pinned to a full commit hash.
        revision: 982d5682ba414ee13cf92cb93ec18fc8e78e2b81
      # The three select_* steps have `stop: null`.
      # NOTE(review): presumably that means "no truncation of the split" — confirm.
      select_n:
        _processor_: pie_datasets.DatasetDict.select
        split: train
        stop: null
      select_n_test:
        _processor_: pie_datasets.DatasetDict.select
        split: test
        stop: null
      select_n_validation:
        _processor_: pie_datasets.DatasetDict.select
        split: validation
        stop: null
      # Moves the nine listed document ids (A32–A40) from `train` to `test`.
      create_test_split:
        _processor_: pie_datasets.DatasetDict.move_to_new_split
        source_split: train
        target_split: test
        ids:
        - A32
        - A33
        - A34
        - A35
        - A36
        - A37
        - A38
        - A39
        - A40
      # Despite the processor name (`add_test_split`), the target split
      # configured here is `validation`, taken from `train` with test_size 0.1.
      create_validation_split:
        _processor_: pie_datasets.DatasetDict.add_test_split
        test_size: 0.1
        seed: 1
        source_split: train
        target_split: validation
    datamodule:
      _target_: src.datamodules.PieDataModule
      batch_size: 2
      num_workers: 0
      pin_memory: false
      show_progress_for_encode: true
      train_split: train
      val_split: validation
      test_split: test
    # These taskmodule settings are repeated in the top-level
    # `taskmodule_config` entry of this file.
    taskmodule:
      _target_: pie_modules.taskmodules.PointerNetworkTaskModuleForEnd2EndRE
      tokenizer_init_kwargs:
        add_prefix_space: true
      tokenizer_name_or_path: facebook/bart-base
      tokenizer_kwargs:
        truncation: true
        return_overflowing_tokens: true
        stride: 128
        strict_span_conversion: false
      create_constraints: true
      constrained_generation: true
      partition_layer_name: labeled_partitions
    # base_model_type / base_model_config / metric_* / warmup_proportion are
    # repeated as top-level entries of this file.
    model:
      _target_: pie_modules.models.SimpleGenerativeModel
      base_model_type: pie_modules.models.base_models.BartAsPointerNetwork
      base_model_config:
        pretrained_model_name_or_path: facebook/bart-base
        use_encoder_mlp: true
        use_constraints_encoder_mlp: true
        decoder_position_id_pattern:
        - 0
        - 0
        - 1
        - 0
        - 0
        - 1
        - 1
        encoder_layer_norm_decay: 0.005
        lr: 6.0e-05
        num_beams: 4
        max_length: 768
        decoder_layer_norm_decay: 0.05
      metric_stages:
      - val
      - test
      - train
      metric_call_predict:
      - val
      - test
      warmup_proportion: 0.01
    callbacks:
      model_checkpoint:
        _target_: pytorch_lightning.callbacks.ModelCheckpoint
        # Checkpoints go to `<output_dir>/checkpoints` (see paths.output_dir).
        dirpath: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0/checkpoints
        filename: epoch_{epoch:03d}
        monitor: metric/binary_relations/micro/f1/val
        verbose: false
        save_last: true
        save_top_k: 1
        mode: max
        auto_insert_metric_name: false
        save_weights_only: false
        every_n_train_steps: null
        train_time_interval: null
        every_n_epochs: null
        save_on_train_epoch_end: null
      early_stopping:
        _target_: pytorch_lightning.callbacks.EarlyStopping
        monitor: metric/binary_relations/micro/f1/val
        min_delta: 0.0
        patience: 100
        verbose: false
        mode: max
        strict: true
        check_finite: true
        stopping_threshold: null
        divergence_threshold: null
        check_on_train_epoch_end: null
      model_summary:
        _target_: pytorch_lightning.callbacks.RichModelSummary
        max_depth: -1
      rich_progress_bar:
        _target_: pytorch_lightning.callbacks.RichProgressBar
    logger:
      wandb:
        _target_: pytorch_lightning.loggers.wandb.WandbLogger
        save_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
        offline: false
        id: null
        anonymous: null
        project: dataset-sciarg-task-ner_re-v0.3-training
        log_model: false
        prefix: ''
        group: ''
        tags:
        - task=ner_re
        - model=pointer_network
        job_type: ''
    trainer:
      _target_: pytorch_lightning.Trainer
      default_root_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
      # NOTE(review): min_epochs == max_epochs (150), so the early_stopping
      # callback above (patience 100) presumably can never shorten the run —
      # confirm this is intended.
      min_epochs: 150
      max_epochs: 150
      accelerator: gpu
      devices: 1
      check_val_every_n_epoch: 1
      deterministic: false
      gradient_clip_val: 5
      gradient_clip_algorithm: value
    # Absolute, machine-specific paths; all share the root_dir prefix.
    paths:
      root_dir: /home/arne/projects/pie-document-level
      data_dir: /home/arne/projects/pie-document-level/data/
      log_dir: /home/arne/projects/pie-document-level/logs/
      output_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
      save_dir: /home/arne/projects/pie-document-level
      work_dir: /home/arne/projects/pie-document-level
    extras:
      ignore_warnings: false
      enforce_tags: true
      print_config: true
    # Same identifier as taskmodule.tokenizer_name_or_path and
    # model.base_model_config.pretrained_model_name_or_path above.
    base_model: facebook/bart-base
# Dotted path of the base model class; same value as
# `_config.value.model.base_model_type`.
base_model_type:
  desc: null
  value: pie_modules.models.base_models.BartAsPointerNetwork
# Base-model configuration as logged for the run. The first twelve settings
# repeat `_config.value.model.base_model_config`; the token-id fields
# (bos/eos/pad, target_token_ids, embedding_weight_mapping) appear only here.
base_model_config:
  desc: null
  value:
    pretrained_model_name_or_path: facebook/bart-base
    use_encoder_mlp: true
    use_constraints_encoder_mlp: true
    decoder_position_id_pattern:
    - 0
    - 0
    - 1
    - 0
    - 0
    - 1
    - 1
    encoder_layer_norm_decay: 0.005
    lr: 6.0e-05
    num_beams: 4
    max_length: 768
    decoder_layer_norm_decay: 0.05
    # NOTE(review): eos_token_id and pad_token_id are both 1. Presumably these
    # ids index into `target_token_ids` below rather than the tokenizer
    # vocabulary — confirm before changing either value.
    bos_token_id: 0
    eos_token_id: 1
    pad_token_id: 1
    target_token_ids:
    - 0
    - 2
    - 50267
    - 50265
    - 50268
    - 50270
    - 50271
    - 50269
    - 50272
    - 50266
    # Keys are the quoted (string) forms of the eight ids >= 50265 listed in
    # `target_token_ids`, in the same order; each maps to a list of integers.
    # NOTE(review): the lists are presumably existing vocabulary ids used to
    # initialise the embeddings of the added tokens — confirm.
    embedding_weight_mapping:
      '50267':
      - 4146
      '50265':
      - 3618
      - 1215
      - 31628
      '50268':
      - 414
      '50270':
      - 308
      - 1215
      - 31628
      '50271':
      - 37820
      '50269':
      - 1667
      - 1215
      - 1116
      - 1215
      - 41690
      '50272':
      - 9031
      - 38600
      - 1215
      - 41690
      '50266':
      - 4548
# Scalar model hyperparameters as logged for the run.
override_generation_kwargs:
  desc: null
  value: null
# Same value as `_config.value.model.warmup_proportion`.
warmup_proportion:
  desc: null
  value: 0.01
# NOTE(review): learning_rate and optimizer_type are null here, while
# `base_model_config.value.lr` is 6.0e-05 — presumably the base-model value is
# the effective learning rate; confirm.
learning_rate:
  desc: null
  value: null
optimizer_type:
  desc: null
  value: null
# Stage lists as logged for the run; both repeat the lists of the same name
# under `_config.value.model`. `train` is in metric_stages but not in
# metric_call_predict.
metric_stages:
  desc: null
  value:
  - val
  - test
  - train
metric_call_predict:
  desc: null
  value:
  - val
  - test
# Taskmodule configuration as logged for the run. The tokenizer, constraint
# and partition settings repeat `_config.value.taskmodule`; the document types,
# layer names and label sets appear only here.
taskmodule_config:
  desc: null
  value:
    taskmodule_type: PointerNetworkTaskModuleForEnd2EndRE
    tokenizer_name_or_path: facebook/bart-base
    document_type: pytorch_ie.documents.TextDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions
    tokenized_document_type: pie_modules.documents.TokenDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions
    span_layer_name: labeled_spans
    relation_layer_name: binary_relations
    none_label: none
    loop_dummy_relation_name: loop
    constrained_generation: true
    label_tokens: null
    label_representations: null
    # Layer and label names here also appear as path segments of the
    # `metric/<layer>/<label>/...` names listed under `_wandb.value.m`.
    labels_per_layer:
      labeled_spans:
      - background_claim
      - data
      - own_claim
      binary_relations:
      - contradicts
      - parts_of_same
      - semantically_same
      - supports
    exclude_labels_per_layer: null
    create_constraints: true
    tokenizer_init_kwargs:
      add_prefix_space: true
    tokenizer_kwargs:
      truncation: true
      return_overflowing_tokens: true
      stride: 128
      strict_span_conversion: false
    partition_layer_name: labeled_partitions
    annotation_field_mapping: null
    log_first_n_examples: null
# File name of the best checkpoint of the run. It follows the
# `epoch_{epoch:03d}` pattern configured in
# `_config.value.callbacks.model_checkpoint.filename`.
_best_checkpoint:
  desc: null
  value: epoch_145.ckpt
# Directory holding this run's checkpoints (presumably where the file named by
# `_best_checkpoint` lives). It must equal
# `_config.value.callbacks.model_checkpoint.dirpath`, the directory the
# ModelCheckpoint callback was configured to write to; the previous value
# pointed at a different root (/mnt/data/experiments/...) that matches no other
# path in this file.
_checkpoint_dir:
  desc: null
  value: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0/checkpoints