wandb_version: 1 _wandb: desc: null value: python_version: 3.9.17 cli_version: 0.15.9 framework: huggingface huggingface_version: 4.36.0 is_jupyter_run: false is_kaggle_kernel: false start_time: 1709313942.075548 t: 1: - 1 - 9 - 11 - 49 - 50 - 51 - 55 - 71 - 103 2: - 1 - 9 - 11 - 49 - 50 - 51 - 55 - 71 - 103 3: - 2 - 7 - 15 - 23 4: 3.9.17 5: 0.15.9 6: 4.36.0 8: - 5 m: - 1: trainer/global_step 6: - 3 - 1: loss/train_step 5: 1 6: - 1 - 1: epoch 5: 1 6: - 1 - 1: loss/val 5: 1 6: - 1 - 1: metric/exact_encoding_matches/val 5: 1 6: - 1 - 1: metric/decoding_errors/all/val 5: 1 6: - 1 - 1: metric/labeled_spans/micro/f1/val 5: 1 6: - 1 - 1: metric/labeled_spans/micro/recall/val 5: 1 6: - 1 - 1: metric/labeled_spans/micro/precision/val 5: 1 6: - 1 - 1: metric/labeled_spans/background_claim/f1/val 5: 1 6: - 1 - 1: metric/labeled_spans/background_claim/recall/val 5: 1 6: - 1 - 1: metric/labeled_spans/background_claim/precision/val 5: 1 6: - 1 - 1: metric/labeled_spans/data/f1/val 5: 1 6: - 1 - 1: metric/labeled_spans/data/recall/val 5: 1 6: - 1 - 1: metric/labeled_spans/data/precision/val 5: 1 6: - 1 - 1: metric/labeled_spans/own_claim/f1/val 5: 1 6: - 1 - 1: metric/labeled_spans/own_claim/recall/val 5: 1 6: - 1 - 1: metric/labeled_spans/own_claim/precision/val 5: 1 6: - 1 - 1: metric/labeled_spans/macro/f1/val 5: 1 6: - 1 - 1: metric/labeled_spans/macro/recall/val 5: 1 6: - 1 - 1: metric/labeled_spans/macro/precision/val 5: 1 6: - 1 - 1: metric/binary_relations/micro/f1/val 5: 1 6: - 1 - 1: metric/binary_relations/micro/recall/val 5: 1 6: - 1 - 1: metric/binary_relations/micro/precision/val 5: 1 6: - 1 - 1: metric/binary_relations/parts_of_same/f1/val 5: 1 6: - 1 - 1: metric/binary_relations/parts_of_same/recall/val 5: 1 6: - 1 - 1: metric/binary_relations/parts_of_same/precision/val 5: 1 6: - 1 - 1: metric/binary_relations/supports/f1/val 5: 1 6: - 1 - 1: metric/binary_relations/supports/recall/val 5: 1 6: - 1 - 1: metric/binary_relations/supports/precision/val 5: 1 6: - 1 - 1: metric/binary_relations/contradicts/f1/val 5: 1 6: - 1 - 1: metric/binary_relations/contradicts/recall/val 5: 1 6: - 1 - 1: metric/binary_relations/contradicts/precision/val 5: 1 6: - 1 - 1: metric/binary_relations/macro/f1/val 5: 1 6: - 1 - 1: metric/binary_relations/macro/recall/val 5: 1 6: - 1 - 1: metric/binary_relations/macro/precision/val 5: 1 6: - 1 - 1: metric/binary_relations/semantically_same/f1/val 5: 1 6: - 1 - 1: metric/binary_relations/semantically_same/recall/val 5: 1 6: - 1 - 1: metric/binary_relations/semantically_same/precision/val 5: 1 6: - 1 - 1: loss/train_epoch 5: 1 6: - 1 - 1: metric/exact_encoding_matches/train 5: 1 6: - 1 - 1: metric/decoding_errors/label/train 5: 1 6: - 1 - 1: metric/decoding_errors/index/train 5: 1 6: - 1 - 1: metric/decoding_errors/len/train 5: 1 6: - 1 - 1: metric/decoding_errors/order/train 5: 1 6: - 1 - 1: metric/decoding_errors/correct/train 5: 1 6: - 1 - 1: metric/decoding_errors/all/train 5: 1 6: - 1 - 1: metric/labeled_spans/background_claim/f1/train 5: 1 6: - 1 - 1: metric/labeled_spans/background_claim/recall/train 5: 1 6: - 1 - 1: metric/labeled_spans/background_claim/precision/train 5: 1 6: - 1 - 1: metric/labeled_spans/data/f1/train 5: 1 6: - 1 - 1: metric/labeled_spans/data/recall/train 5: 1 6: - 1 - 1: metric/labeled_spans/data/precision/train 5: 1 6: - 1 - 1: metric/labeled_spans/own_claim/f1/train 5: 1 6: - 1 - 1: metric/labeled_spans/own_claim/recall/train 5: 1 6: - 1 - 1: metric/labeled_spans/own_claim/precision/train 5: 1 6: - 1 - 1: metric/labeled_spans/micro/f1/train 5: 1 6: - 1 - 1: metric/labeled_spans/micro/recall/train 5: 1 6: - 1 - 1: metric/labeled_spans/micro/precision/train 5: 1 6: - 1 - 1: metric/labeled_spans/macro/f1/train 5: 1 6: - 1 - 1: metric/labeled_spans/macro/recall/train 5: 1 6: - 1 - 1: metric/labeled_spans/macro/precision/train 5: 1 6: - 1 - 1: metric/binary_relations/supports/f1/train 5: 1 6: - 1 - 1: metric/binary_relations/supports/recall/train 5: 1 6: - 1 - 1: metric/binary_relations/supports/precision/train 5: 1 6: - 1 - 1: metric/binary_relations/micro/f1/train 5: 1 6: - 1 - 1: metric/binary_relations/micro/recall/train 5: 1 6: - 1 - 1: metric/binary_relations/micro/precision/train 5: 1 6: - 1 - 1: metric/binary_relations/parts_of_same/f1/train 5: 1 6: - 1 - 1: metric/binary_relations/parts_of_same/recall/train 5: 1 6: - 1 - 1: metric/binary_relations/parts_of_same/precision/train 5: 1 6: - 1 - 1: metric/binary_relations/contradicts/f1/train 5: 1 6: - 1 - 1: metric/binary_relations/contradicts/recall/train 5: 1 6: - 1 - 1: metric/binary_relations/contradicts/precision/train 5: 1 6: - 1 - 1: metric/binary_relations/semantically_same/f1/train 5: 1 6: - 1 - 1: metric/binary_relations/semantically_same/recall/train 5: 1 6: - 1 - 1: metric/binary_relations/semantically_same/precision/train 5: 1 6: - 1 - 1: metric/binary_relations/macro/f1/train 5: 1 6: - 1 - 1: metric/binary_relations/macro/recall/train 5: 1 6: - 1 - 1: metric/binary_relations/macro/precision/train 5: 1 6: - 1 - 1: metric/decoding_errors/correct/val 5: 1 6: - 1 - 1: metric/decoding_errors/index/val 5: 1 6: - 1 - 1: metric/decoding_errors/len/val 5: 1 6: - 1 - 1: loss/test 5: 1 6: - 1 - 1: metric/exact_encoding_matches/test 5: 1 6: - 1 - 1: metric/decoding_errors/correct/test 5: 1 6: - 1 - 1: metric/decoding_errors/all/test 5: 1 6: - 1 - 1: metric/labeled_spans/micro/f1/test 5: 1 6: - 1 - 1: metric/labeled_spans/micro/recall/test 5: 1 6: - 1 - 1: metric/labeled_spans/micro/precision/test 5: 1 6: - 1 - 1: metric/labeled_spans/own_claim/f1/test 5: 1 6: - 1 - 1: metric/labeled_spans/own_claim/recall/test 5: 1 6: - 1 - 1: metric/labeled_spans/own_claim/precision/test 5: 1 6: - 1 - 1: metric/labeled_spans/background_claim/f1/test 5: 1 6: - 1 - 1: metric/labeled_spans/background_claim/recall/test 5: 1 6: - 1 - 1: metric/labeled_spans/background_claim/precision/test 5: 1 6: - 1 - 1: metric/labeled_spans/data/f1/test 5: 1 6: - 1 - 1: metric/labeled_spans/data/recall/test 5: 1 6: - 1 - 1: metric/labeled_spans/data/precision/test 5: 1 6: - 1 - 1: metric/labeled_spans/macro/f1/test 5: 1 6: - 1 - 1: metric/labeled_spans/macro/recall/test 5: 1 6: - 1 - 1: metric/labeled_spans/macro/precision/test 5: 1 6: - 1 - 1: metric/binary_relations/micro/f1/test 5: 1 6: - 1 - 1: metric/binary_relations/micro/recall/test 5: 1 6: - 1 - 1: metric/binary_relations/micro/precision/test 5: 1 6: - 1 - 1: metric/binary_relations/parts_of_same/f1/test 5: 1 6: - 1 - 1: metric/binary_relations/parts_of_same/recall/test 5: 1 6: - 1 - 1: metric/binary_relations/parts_of_same/precision/test 5: 1 6: - 1 - 1: metric/binary_relations/supports/f1/test 5: 1 6: - 1 - 1: metric/binary_relations/supports/recall/test 5: 1 6: - 1 - 1: metric/binary_relations/supports/precision/test 5: 1 6: - 1 - 1: metric/binary_relations/contradicts/f1/test 5: 1 6: - 1 - 1: metric/binary_relations/contradicts/recall/test 5: 1 6: - 1 - 1: metric/binary_relations/contradicts/precision/test 5: 1 6: - 1 - 1: metric/binary_relations/semantically_same/f1/test 5: 1 6: - 1 - 1: metric/binary_relations/semantically_same/recall/test 5: 1 6: - 1 - 1: metric/binary_relations/semantically_same/precision/test 5: 1 6: - 1 - 1: metric/binary_relations/macro/f1/test 5: 1 6: - 1 - 1: metric/binary_relations/macro/recall/test 5: 1 6: - 1 - 1: metric/binary_relations/macro/precision/test 5: 1 6: - 1 _num_params/total: desc: null value: 141788928 _num_params/trainable: desc: null value: 141788928 _num_params/non_trainable: desc: null value: 0 _config: desc: null value: pipeline_type: training name: dataset-sciarg/task-ner_re/v0.3 tags: - task=ner_re - model=pointer_network train: true validate: true test: true monitor_metric: metric/binary_relations/micro/f1/val monitor_mode: max seed: 1 ckpt_path: null push_to_hub: false model_save_dir: /home/arne/projects/pie-document-level/models/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-32 dataset: _target_: src.utils.execute_pipeline input: _target_: pie_datasets.DatasetDict.load_dataset path: pie/sciarg revision: 982d5682ba414ee13cf92cb93ec18fc8e78e2b81 select_n: _processor_: pie_datasets.DatasetDict.select split: train stop: null select_n_test: _processor_: pie_datasets.DatasetDict.select split: test stop: null select_n_validation: _processor_: pie_datasets.DatasetDict.select split: validation stop: null create_test_split: _processor_: pie_datasets.DatasetDict.move_to_new_split source_split: train target_split: test ids: - A32 - A33 - A34 - A35 - A36 - A37 - A38 - A39 - A40 create_validation_split: _processor_: pie_datasets.DatasetDict.add_test_split test_size: 0.1 seed: 1 source_split: train target_split: validation datamodule: _target_: src.datamodules.PieDataModule batch_size: 2 num_workers: 0 pin_memory: false show_progress_for_encode: true train_split: train val_split: validation test_split: test taskmodule: _target_: pie_modules.taskmodules.PointerNetworkTaskModuleForEnd2EndRE tokenizer_init_kwargs: add_prefix_space: true tokenizer_name_or_path: facebook/bart-base tokenizer_kwargs: truncation: true return_overflowing_tokens: true stride: 128 strict_span_conversion: false create_constraints: true constrained_generation: true partition_layer_name: labeled_partitions model: _target_: pie_modules.models.SimpleGenerativeModel base_model_type: pie_modules.models.base_models.BartAsPointerNetwork base_model_config: pretrained_model_name_or_path: facebook/bart-base use_encoder_mlp: true use_constraints_encoder_mlp: true decoder_position_id_pattern: - 0 - 0 - 1 - 0 - 0 - 1 - 1 encoder_layer_norm_decay: 0.005 lr: 6.0e-05 num_beams: 4 max_length: 768 decoder_layer_norm_decay: 0.05 metric_stages: - val - test - train metric_call_predict: - val - test warmup_proportion: 0.01 callbacks: model_checkpoint: _target_: pytorch_lightning.callbacks.ModelCheckpoint dirpath: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0/checkpoints filename: epoch_{epoch:03d} monitor: metric/binary_relations/micro/f1/val verbose: false save_last: true save_top_k: 1 mode: max auto_insert_metric_name: false save_weights_only: false every_n_train_steps: null train_time_interval: null every_n_epochs: null save_on_train_epoch_end: null early_stopping: _target_: pytorch_lightning.callbacks.EarlyStopping monitor: metric/binary_relations/micro/f1/val min_delta: 0.0 patience: 100 verbose: false mode: max strict: true check_finite: true stopping_threshold: null divergence_threshold: null check_on_train_epoch_end: null model_summary: _target_: pytorch_lightning.callbacks.RichModelSummary max_depth: -1 rich_progress_bar: _target_: pytorch_lightning.callbacks.RichProgressBar logger: wandb: _target_: pytorch_lightning.loggers.wandb.WandbLogger save_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0 offline: false id: null anonymous: null project: dataset-sciarg-task-ner_re-v0.3-training log_model: false prefix: '' group: '' tags: - task=ner_re - model=pointer_network job_type: '' trainer: _target_: pytorch_lightning.Trainer default_root_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0 min_epochs: 150 max_epochs: 150 accelerator: gpu devices: 1 check_val_every_n_epoch: 1 deterministic: false gradient_clip_val: 5 gradient_clip_algorithm: value paths: root_dir: /home/arne/projects/pie-document-level data_dir: /home/arne/projects/pie-document-level/data/ log_dir: /home/arne/projects/pie-document-level/logs/ output_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0 save_dir: /home/arne/projects/pie-document-level work_dir: /home/arne/projects/pie-document-level extras: ignore_warnings: false enforce_tags: true print_config: true base_model: facebook/bart-base base_model_type: desc: null value: pie_modules.models.base_models.BartAsPointerNetwork base_model_config: desc: null value: pretrained_model_name_or_path: facebook/bart-base use_encoder_mlp: true use_constraints_encoder_mlp: true decoder_position_id_pattern: - 0 - 0 - 1 - 0 - 0 - 1 - 1 encoder_layer_norm_decay: 0.005 lr: 6.0e-05 num_beams: 4 max_length: 768 decoder_layer_norm_decay: 0.05 bos_token_id: 0 eos_token_id: 1 pad_token_id: 1 target_token_ids: - 0 - 2 - 50267 - 50265 - 50268 - 50270 - 50271 - 50269 - 50272 - 50266 embedding_weight_mapping: '50267': - 4146 '50265': - 3618 - 1215 - 31628 '50268': - 414 '50270': - 308 - 1215 - 31628 '50271': - 37820 '50269': - 1667 - 1215 - 1116 - 1215 - 41690 '50272': - 9031 - 38600 - 1215 - 41690 '50266': - 4548 override_generation_kwargs: desc: null value: null warmup_proportion: desc: null value: 0.01 learning_rate: desc: null value: null optimizer_type: desc: null value: null metric_stages: desc: null value: - val - test - train metric_call_predict: desc: null value: - val - test taskmodule_config: desc: null value: taskmodule_type: PointerNetworkTaskModuleForEnd2EndRE tokenizer_name_or_path: facebook/bart-base document_type: pytorch_ie.documents.TextDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions tokenized_document_type: pie_modules.documents.TokenDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions span_layer_name: labeled_spans relation_layer_name: binary_relations none_label: none loop_dummy_relation_name: loop constrained_generation: true label_tokens: null label_representations: null labels_per_layer: labeled_spans: - background_claim - data - own_claim binary_relations: - contradicts - parts_of_same - semantically_same - supports exclude_labels_per_layer: null create_constraints: true tokenizer_init_kwargs: add_prefix_space: true tokenizer_kwargs: truncation: true return_overflowing_tokens: true stride: 128 strict_span_conversion: false partition_layer_name: labeled_partitions annotation_field_mapping: null log_first_n_examples: null _best_checkpoint: desc: null value: epoch_145.ckpt _checkpoint_dir: desc: null value: /mnt/data/experiments/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0/checkpoints