MenahemOz committed on May 13, 2023

Commit

5c058d4

•

1 Parent(s): 966f818

Upload folder using huggingface_hub

Browse files

Files changed (37) hide show

.gitattributes +3 -0
best.th +3 -0
config.json +194 -0
meta.json +1 -0
metrics.json +18 -0
metrics_epoch_0.json +10 -0
metrics_epoch_1.json +10 -0
metrics_epoch_10.json +10 -0
metrics_epoch_11.json +10 -0
metrics_epoch_12.json +10 -0
metrics_epoch_13.json +10 -0
metrics_epoch_14.json +10 -0
metrics_epoch_15.json +18 -0
metrics_epoch_16.json +18 -0
metrics_epoch_17.json +18 -0
metrics_epoch_18.json +18 -0
metrics_epoch_19.json +18 -0
metrics_epoch_2.json +10 -0
metrics_epoch_20.json +18 -0
metrics_epoch_21.json +18 -0
metrics_epoch_22.json +18 -0
metrics_epoch_23.json +18 -0
metrics_epoch_24.json +18 -0
metrics_epoch_3.json +10 -0
metrics_epoch_4.json +10 -0
metrics_epoch_5.json +10 -0
metrics_epoch_6.json +10 -0
metrics_epoch_7.json +10 -0
metrics_epoch_8.json +10 -0
metrics_epoch_9.json +10 -0
model.tar.gz +3 -0
model_state_e25_b0.th +3 -0
out.log +0 -0
training_state_e25_b0.th +3 -0
vocabulary/.lock +0 -0
vocabulary/non_padded_namespaces.txt +2 -0
vocabulary/target_tokens.txt +8 -0

.gitattributes CHANGED Viewed

@@ -32,3 +32,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+best.th filter=lfs diff=lfs merge=lfs -text
+model_state_e25_b0.th filter=lfs diff=lfs merge=lfs -text
+training_state_e25_b0.th filter=lfs diff=lfs merge=lfs -text

best.th ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5c586318da3c2ae218131f4b97bab5608c05c790ed35d84ca4af5600a89e463b
+size 474302867

config.json ADDED Viewed

	@@ -0,0 +1,194 @@

+{
+    "dataset_reader": {
+        "type": "seq2rel",
+        "max_length": 512,
+        "source_token_indexers": {
+            "tokens": {
+                "type": "pretrained_transformer",
+                "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
+                "tokenizer_kwargs": {
+                    "additional_special_tokens": [
+                        "@ARG@",
+                        "@TRIGGER@"
+                    ],
+                    "do_lower_case": true
+                }
+            }
+        },
+        "source_tokenizer": {
+            "type": "pretrained_transformer",
+            "add_special_tokens": true,
+            "max_length": 512,
+            "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
+            "tokenizer_kwargs": {
+                "additional_special_tokens": [
+                    "@ARG@",
+                    "@TRIGGER@"
+                ],
+                "do_lower_case": true
+            }
+        },
+        "target_namespace": "target_tokens",
+        "target_tokenizer": {
+            "type": "pretrained_transformer",
+            "add_special_tokens": false,
+            "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
+            "tokenizer_kwargs": {
+                "additional_special_tokens": [
+                    "@ARG@",
+                    "@TRIGGER@",
+                    "@OSP@",
+                    "@start@",
+                    "@end@",
+                    ";"
+                ],
+                "do_lower_case": true
+            }
+        }
+    },
+    "model": {
+        "type": "copynet_seq2rel",
+        "attention": {
+            "type": "multihead_attention",
+            "dropout": 0.1,
+            "num_heads": 6
+        },
+        "beam_search": {
+            "beam_size": 1,
+            "final_sequence_scorer": {
+                "type": "length-normalized-sequence-log-prob",
+                "length_penalty": 1
+            },
+            "max_steps": 96
+        },
+        "dropout": 0.1,
+        "sequence_based_metrics": [
+            {
+                "average": "micro",
+                "labels": [
+                    "OSP"
+                ],
+                "remove_duplicate_ents": true,
+                "type": "f1_seq2rel"
+            }
+        ],
+        "source_embedder": {
+            "token_embedders": {
+                "tokens": {
+                    "type": "pretrained_transformer",
+                    "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
+                    "reinit_modules": 2,
+                    "tokenizer_kwargs": {
+                        "additional_special_tokens": [
+                            "@ARG@",
+                            "@TRIGGER@"
+                        ],
+                        "do_lower_case": true
+                    }
+                }
+            }
+        },
+        "target_embedding_dim": 256,
+        "target_tokenizer": {
+            "type": "pretrained_transformer",
+            "add_special_tokens": false,
+            "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
+            "tokenizer_kwargs": {
+                "additional_special_tokens": [
+                    "@ARG@",
+                    "@TRIGGER@",
+                    "@OSP@",
+                    "@start@",
+                    "@end@",
+                    ";"
+                ],
+                "do_lower_case": true
+            }
+        },
+        "weight_dropout": 0.5
+    },
+    "train_data_path": "../granular/train_transform.tsv",
+    "validation_data_path": "../granular/dev_transform.tsv",
+    "trainer": {
+        "callbacks": [
+            {
+                "type": "should_validate_callback",
+                "validation_interval": 1,
+                "validation_start": 15
+            }
+        ],
+        "checkpointer": {
+            "keep_most_recent_by_count": 1
+        },
+        "grad_norm": 1,
+        "learning_rate_scheduler": {
+            "type": "linear_with_warmup",
+            "warmup_steps": 2906
+        },
+        "num_epochs": 25,
+        "num_gradient_accumulation_steps": 1,
+        "optimizer": {
+            "type": "huggingface_adamw",
+            "correct_bias": true,
+            "eps": 1e-08,
+            "lr": 0.0004,
+            "parameter_groups": [
+                [
+                    [
+                        "transformer_model(?!.*(?:bias|LayerNorm|layer_norm))"
+                    ],
+                    {
+                        "lr": 2e-05,
+                        "weight_decay": 0.01
+                    }
+                ],
+                [
+                    [
+                        "transformer_model(?=.*(?:bias|LayerNorm|layer_norm))"
+                    ],
+                    {
+                        "lr": 2e-05,
+                        "weight_decay": 0
+                    }
+                ]
+            ],
+            "weight_decay": 0
+        },
+        "use_amp": true,
+        "validation_metric": "+fscore"
+    },
+    "vocabulary": {
+        "max_vocab_size": {
+            "target_tokens": 1
+        },
+        "tokens_to_add": {
+            "target_tokens": [
+                "@ARG@",
+                "@TRIGGER@",
+                "@OSP@",
+                "@start@",
+                "@end@",
+                ";"
+            ]
+        }
+    },
+    "data_loader": {
+        "batch_sampler": {
+            "type": "bucket",
+            "batch_size": 4,
+            "sorting_keys": [
+                "source_tokens"
+            ]
+        }
+    },
+    "validation_data_loader": {
+        "batch_sampler": {
+            "type": "bucket",
+            "batch_size": 128,
+            "padding_noise": 0,
+            "sorting_keys": [
+                "source_tokens"
+            ]
+        }
+    }
+}

meta.json ADDED Viewed

	@@ -0,0 +1 @@


+{"version": "2.9.3"}

metrics.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 20,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "1:18:27.472121",
+  "epoch": 24,
+  "training_loss": 0.11846704688033759,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2960.6728515625,
+  "validation_precision": 0.7450980544090271,
+  "validation_recall": 0.74301677942276,
+  "validation_fscore": 0.7440559267997742,
+  "validation_loss": 0.895537956195767,
+  "best_validation_precision": 0.7520891427993774,
+  "best_validation_recall": 0.7541899681091309,
+  "best_validation_fscore": 0.7531380653381348,
+  "best_validation_loss": 0.6954866239684634
+}

metrics_epoch_0.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4427.69140625,
+  "peak_gpu_0_memory_MB": 453.30615234375,
+  "training_duration": "0:02:49.858384",
+  "epoch": 0,
+  "training_loss": 5.703986813210456,
+  "training_worker_0_memory_MB": 4427.69140625,
+  "training_gpu_0_memory_MB": 453.30615234375
+}

metrics_epoch_1.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4512.1484375,
+  "peak_gpu_0_memory_MB": 2972.189453125,
+  "training_duration": "0:05:46.709385",
+  "epoch": 1,
+  "training_loss": 1.6510879126760434,
+  "training_worker_0_memory_MB": 4512.1484375,
+  "training_gpu_0_memory_MB": 2972.189453125
+}

metrics_epoch_10.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:32:41.701186",
+  "epoch": 10,
+  "training_loss": 0.32350418552688576,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2938.0322265625
+}

metrics_epoch_11.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:35:43.708645",
+  "epoch": 11,
+  "training_loss": 0.3814014623322614,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2934.998046875
+}

metrics_epoch_12.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:38:38.856506",
+  "epoch": 12,
+  "training_loss": 0.34930390631647273,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2999.27587890625
+}

metrics_epoch_13.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:41:36.654824",
+  "epoch": 13,
+  "training_loss": 0.3129212558918542,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2985.3388671875
+}

metrics_epoch_14.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:44:35.664415",
+  "epoch": 14,
+  "training_loss": 0.23782727301993464,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2939.4052734375
+}

metrics_epoch_15.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 15,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:48:11.075306",
+  "epoch": 15,
+  "training_loss": 0.22654071982124985,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2977.85693359375,
+  "validation_precision": 0.7706422209739685,
+  "validation_recall": 0.7039105892181396,
+  "validation_fscore": 0.7357664108276367,
+  "validation_loss": 0.6296270303428173,
+  "best_validation_precision": 0.7706422209739685,
+  "best_validation_recall": 0.7039105892181396,
+  "best_validation_fscore": 0.7357664108276367,
+  "best_validation_loss": 0.6296270303428173
+}

metrics_epoch_16.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 15,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:51:32.703688",
+  "epoch": 16,
+  "training_loss": 0.23088603088214132,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2936.81005859375,
+  "validation_precision": 0.6268656849861145,
+  "validation_recall": 0.8212290406227112,
+  "validation_fscore": 0.7110036611557007,
+  "validation_loss": 0.8719936553388834,
+  "best_validation_precision": 0.7706422209739685,
+  "best_validation_recall": 0.7039105892181396,
+  "best_validation_fscore": 0.7357664108276367,
+  "best_validation_loss": 0.6296270303428173
+}

metrics_epoch_17.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 17,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:55:04.892391",
+  "epoch": 17,
+  "training_loss": 0.21293968360438856,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2935.91259765625,
+  "validation_precision": 0.6767441630363464,
+  "validation_recall": 0.8128491640090942,
+  "validation_fscore": 0.7385786771774292,
+  "validation_loss": 0.7829428290715441,
+  "best_validation_precision": 0.6767441630363464,
+  "best_validation_recall": 0.8128491640090942,
+  "best_validation_fscore": 0.7385786771774292,
+  "best_validation_loss": 0.7829428290715441
+}

metrics_epoch_18.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 18,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:58:25.072875",
+  "epoch": 18,
+  "training_loss": 0.22682103761135117,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2935.91259765625,
+  "validation_precision": 0.7067669034004211,
+  "validation_recall": 0.7877094745635986,
+  "validation_fscore": 0.7450462579727173,
+  "validation_loss": 0.5860945553286001,
+  "best_validation_precision": 0.7067669034004211,
+  "best_validation_recall": 0.7877094745635986,
+  "best_validation_fscore": 0.7450462579727173,
+  "best_validation_loss": 0.5860945553286001
+}

metrics_epoch_19.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 19,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "1:01:47.703034",
+  "epoch": 19,
+  "training_loss": 0.15822486025588112,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2935.91259765625,
+  "validation_precision": 0.7616279125213623,
+  "validation_recall": 0.7318435907363892,
+  "validation_fscore": 0.74643874168396,
+  "validation_loss": 0.655500799020956,
+  "best_validation_precision": 0.7616279125213623,
+  "best_validation_recall": 0.7318435907363892,
+  "best_validation_fscore": 0.74643874168396,
+  "best_validation_loss": 0.655500799020956
+}

metrics_epoch_2.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4520.765625,
+  "peak_gpu_0_memory_MB": 2981.6318359375,
+  "training_duration": "0:08:43.191831",
+  "epoch": 2,
+  "training_loss": 0.8978546816862963,
+  "training_worker_0_memory_MB": 4520.765625,
+  "training_gpu_0_memory_MB": 2981.6318359375
+}

metrics_epoch_20.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 20,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "1:05:07.013998",
+  "epoch": 20,
+  "training_loss": 0.18703892177863618,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2990.13623046875,
+  "validation_precision": 0.7520891427993774,
+  "validation_recall": 0.7541899681091309,
+  "validation_fscore": 0.7531380653381348,
+  "validation_loss": 0.6954866239684634,
+  "best_validation_precision": 0.7520891427993774,
+  "best_validation_recall": 0.7541899681091309,
+  "best_validation_fscore": 0.7531380653381348,
+  "best_validation_loss": 0.6954866239684634
+}

metrics_epoch_21.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 20,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "1:08:27.514746",
+  "epoch": 21,
+  "training_loss": 0.1482860020000315,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2935.91259765625,
+  "validation_precision": 0.7549296021461487,
+  "validation_recall": 0.748603343963623,
+  "validation_fscore": 0.7517531514167786,
+  "validation_loss": 0.7926239181542769,
+  "best_validation_precision": 0.7520891427993774,
+  "best_validation_recall": 0.7541899681091309,
+  "best_validation_fscore": 0.7531380653381348,
+  "best_validation_loss": 0.6954866239684634
+}

metrics_epoch_22.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 20,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "1:11:43.724129",
+  "epoch": 22,
+  "training_loss": 0.13081708632235942,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2935.91259765625,
+  "validation_precision": 0.7645348906517029,
+  "validation_recall": 0.7346368432044983,
+  "validation_fscore": 0.7492877840995789,
+  "validation_loss": 0.8777754297261708,
+  "best_validation_precision": 0.7520891427993774,
+  "best_validation_recall": 0.7541899681091309,
+  "best_validation_fscore": 0.7531380653381348,
+  "best_validation_loss": 0.6954866239684634
+}

metrics_epoch_23.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 20,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "1:15:10.022658",
+  "epoch": 23,
+  "training_loss": 0.12166217696645308,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2962.43505859375,
+  "validation_precision": 0.7458100318908691,
+  "validation_recall": 0.7458100318908691,
+  "validation_fscore": 0.7458100914955139,
+  "validation_loss": 1.0029180781566538,
+  "best_validation_precision": 0.7520891427993774,
+  "best_validation_recall": 0.7541899681091309,
+  "best_validation_fscore": 0.7531380653381348,
+  "best_validation_loss": 0.6954866239684634
+}

metrics_epoch_24.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+  "best_epoch": 20,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "1:18:27.472121",
+  "epoch": 24,
+  "training_loss": 0.11846704688033759,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2960.6728515625,
+  "validation_precision": 0.7450980544090271,
+  "validation_recall": 0.74301677942276,
+  "validation_fscore": 0.7440559267997742,
+  "validation_loss": 0.895537956195767,
+  "best_validation_precision": 0.7520891427993774,
+  "best_validation_recall": 0.7541899681091309,
+  "best_validation_fscore": 0.7531380653381348,
+  "best_validation_loss": 0.6954866239684634
+}

metrics_epoch_3.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 2981.6318359375,
+  "training_duration": "0:11:50.294230",
+  "epoch": 3,
+  "training_loss": 0.818887067774918,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2960.4716796875
+}

metrics_epoch_4.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 2981.6318359375,
+  "training_duration": "0:14:45.670883",
+  "epoch": 4,
+  "training_loss": 0.6278288699645987,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2935.5439453125
+}

metrics_epoch_5.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 2981.6318359375,
+  "training_duration": "0:17:41.182135",
+  "epoch": 5,
+  "training_loss": 0.5944990587151476,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2934.998046875
+}

metrics_epoch_6.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 2981.6318359375,
+  "training_duration": "0:20:37.421798",
+  "epoch": 6,
+  "training_loss": 0.5603309030250199,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2935.5439453125
+}

metrics_epoch_7.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 2981.6318359375,
+  "training_duration": "0:23:35.706207",
+  "epoch": 7,
+  "training_loss": 0.5388365288699913,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2934.998046875
+}

metrics_epoch_8.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:26:36.182704",
+  "epoch": 8,
+  "training_loss": 0.4333426699106117,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 3001.03662109375
+}

metrics_epoch_9.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "best_epoch": null,
+  "peak_worker_0_memory_MB": 4521.00390625,
+  "peak_gpu_0_memory_MB": 3001.03662109375,
+  "training_duration": "0:29:38.300579",
+  "epoch": 9,
+  "training_loss": 0.42604672657651455,
+  "training_worker_0_memory_MB": 4521.00390625,
+  "training_gpu_0_memory_MB": 2968.00732421875
+}

model.tar.gz ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:64bd9c4ac97d6be446d16878ffae92c6a39e2d377b8c1aa9a96af7fdf1d8cdd1
+size 440131480

model_state_e25_b0.th ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a6304c93788e3d12fbf31b73e33520c4ffc75ef5b5a335a54da6438ccc00704b
+size 474302867

out.log ADDED Viewed

The diff for this file is too large to render. See raw diff

training_state_e25_b0.th ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:864710bd124f7027feab65e4e8051ddad12f4f699e194b0904445d3f4e0ee4b3
+size 939054969

vocabulary/.lock ADDED Viewed

File without changes

vocabulary/non_padded_namespaces.txt ADDED Viewed

	@@ -0,0 +1,2 @@


+*labels
+*tags

vocabulary/target_tokens.txt ADDED Viewed

	@@ -0,0 +1,8 @@

+@@UNKNOWN@@
+@start@
+@ARG@
+@TRIGGER@
+@OSP@
+@end@
+;
+@COPY@