File size: 18,138 Bytes
b163a92
1
[{"id": 140586450389168, "module": "xpmir.text.huggingface", "type": "TransformerTokensEncoderWithMLMOutput", "typename": "xpmir.text.huggingface.TransformerTokensEncoderWithMLMOutput", "identifier": "632ba5887979ba5d8e2364846114db972a70fdb7fff9d192749f22611e1d4d2d", "fields": {"model_id": "distilbert-base-uncased", "trainable": true, "dropout": 0.0}}, {"id": 140586450388304, "module": "xpmir.neural.splade", "type": "MaxAggregation", "typename": "xpmir.neural.splade.MaxAggregation", "identifier": "1c5be6126a3846bdc0303757dca9780a9d905f71f08855aaed4b4718a84f1906", "fields": {}}, {"id": 140586450388832, "module": "xpmir.neural.splade", "type": "SpladeTextEncoder", "typename": "xpmir.neural.splade.SpladeTextEncoder", "identifier": "33b37b3a9259612b72d500c72c75e23b23cde2e6d95c584b97ced965ae04391f", "fields": {"encoder": {"type": "python", "value": 140586450389168}, "aggregation": {"type": "python", "value": 140586450388304}, "maxlen": 200}}, {"id": 140586450392576, "module": "xpmir.neural.splade", "type": "SpladeTextEncoder", "typename": "xpmir.neural.splade.SpladeTextEncoder", "identifier": "ad18df59af97138c1666d2abcd3ccbb9e3e2b5aea8c7a92b8a7d7a6f0c84fb80", "fields": {"encoder": {"type": "python", "value": 140586450389168}, "aggregation": {"type": "python", "value": 140586450388304}, "maxlen": 30}}, {"id": 140586450392816, "module": "xpmir.neural.dual", "type": "DotDense", "typename": "xpmir.neural.dual.DotDense", "identifier": "9cd64c3fd5e0f385490a6e50dbbeb44584b06b7bc7e443556b651b5815abbfd7", "fields": {"encoder": {"type": "python", "value": 140586450388832}, "query_encoder": {"type": "python", "value": 140586450392576}}}, {"id": 140586835900928, "module": "xpmir.learning.base", "type": "Random", "typename": "xpmir.learning.base.Random", "identifier": "5a306f11824a2a1058441627f732c699d1a73e4cb0b0f0e4ca2b951d83f99cb7", "fields": {"seed": 0}}, {"id": 140586450392864, "module": "xpmir.neural.dual", "type": "ScheduledFlopsRegularizer", "typename": "xpmir.neural.dual.ScheduledFlopsRegularizer", "identifier": "65b8035b9b9b83f7f4f409b4734bf0b66cd97ea4f910d992e3783c5bdffb6345", "fields": {"lambda_q": 0.5, "lambda_d": 0.4, "min_lambda_q": 0.0, "min_lambda_d": 0.0, "lambda_warmup_steps": 50000}}, {"id": 140586449370176, "module": "xpmir.learning.batchers", "type": "Batcher", "typename": "xpmir.learning.batchers.Batcher", "identifier": "ee37b1eaed689989dc7e73a4f1182674855b39173706c24e3ad097690db0016e", "fields": {}}, {"id": 140586450395648, "module": "xpmir.letor.distillation.samplers", "type": "PairwiseDistillationSamplesTSV", "typename": "xpmir.letor.distillation.samplers.PairwiseDistillationSamplesTSV", "identifier": "b236713fdda1c88abb547b30e55ea90bf5be75feab54ef7e201da07a445197c2", "fields": {"id": "com.github.sebastian-hofstaetter.neural-ranking-kd.msmarco.ensemble.teacher@ir", "path": {"type": "path", "value": "/linkhome/rech/genlip01/upo82uo/datamaestro/data/ir/com/github/sebastian-hofstaetter/neural-ranking-kd/msmarco/ensemble/teacher/bert_cat_ensemble_msmarcopassage_train_scores_ids.tsv"}, "with_docid": true, "with_queryid": true}}, {"id": 140586836261232, "module": "datamaestro_text.datasets.irds.data", "type": "Documents", "typename": "datamaestro_text.datasets.irds.data.Documents", "identifier": "b719776c0c0b8a51534153659c8b6f87e0b5ae363c216ee129e379cecd1bf69b", "fields": {"irds": "msmarco-passage", "id": "irds.msmarco-passage.documents@irds", "count": null}}, {"id": 140586449112560, "module": "datamaestro_text.datasets.irds.data", "type": "Topics", "typename": "datamaestro_text.datasets.irds.data.Topics", "identifier": "9df75d4b1df2d9516887fd8cf2a526a95e2d4791ff83ecc610ce76ce5a3ee285", "fields": {"irds": "msmarco-passage/train", "id": "irds.msmarco-passage.train.queries@irds"}}, {"id": 140586449362400, "module": "xpmir.datasets.adapters", "type": "MemoryTopicStore", "typename": "xpmir.datasets.adapters.MemoryTopicStore", "identifier": "5d524b1821c05a15ab01485c903770005af38d1b4f372e1074cdefa6b762b9c8", "fields": {"topics": {"type": "python", "value": 140586449112560}}}, {"id": 140586449365088, "module": "xpmir.letor.distillation.samplers", "type": "PairwiseHydrator", "typename": "xpmir.letor.distillation.samplers.PairwiseHydrator", "identifier": "0a065535a286c93b222fa675ef54b2be139de0b2e91bbd62466aa70628b3194f", "fields": {"samples": {"type": "python", "value": 140586450395648}, "documentstore": {"type": "python", "value": 140586836261232}, "querystore": {"type": "python", "value": 140586449362400}}}, {"id": 140586449365136, "module": "xpmir.letor.distillation.samplers", "type": "DistillationPairwiseSampler", "typename": "xpmir.letor.distillation.samplers.DistillationPairwiseSampler", "identifier": "396d8522b383d6f9ddf36bdbf5cc8f12523063e1c381cd26a994668e1dac3faf", "fields": {"samples": {"type": "python", "value": 140586449365088}}}, {"id": 140586449366768, "module": "xpmir.letor.distillation.pairwise", "type": "MSEDifferenceLoss", "typename": "xpmir.letor.distillation.pairwise.MSEDifferenceLoss", "identifier": "3b1ff283817ed67c298e300f1b3e25afe3e83998d15800dba57506cfc68db794", "fields": {"weight": 1.0}}, {"id": 140586449366960, "module": "xpmir.letor.distillation.pairwise", "type": "DistillationPairwiseTrainer", "typename": "xpmir.letor.distillation.pairwise.DistillationPairwiseTrainer", "identifier": "f1c57f83c5723fb235b2ffa1be29e66ef5dc1b0cac540907417ffde2b746205a", "fields": {"hooks": [{"type": "python", "value": 140586450392864}], "model": null, "batcher": {"type": "python", "value": 140586449370176}, "sampler": {"type": "python", "value": 140586449365136}, "batch_size": 96, "lossfn": {"type": "python", "value": 140586449366768}}}, {"id": 140586447557952, "module": "xpmir.learning.optim", "type": "AdamW", "typename": "xpmir.learning.optim.AdamW", "identifier": "218642f09cdb285ad719d8118af9324cf8c04e0aa611b8d7c969dcf8ddc80169", "fields": {"lr": 2e-05, "weight_decay": 0.01, "eps": 1e-08}}, {"id": 140586447557760, "module": "xpmir.learning.schedulers", "type": "LinearWithWarmup", "typename": "xpmir.learning.schedulers.LinearWithWarmup", "identifier": "6c0548cdebd221e332e206ac024b596201cacb1525b99fdca5f24743988ad865", "fields": {"num_warmup_steps": 6000, "min_factor": 0.0}}, {"id": 140586447560880, "module": "xpmir.learning.optim", "type": "ParameterFilter", "typename": "xpmir.learning.optim.ParameterFilter", "identifier": "6b7385c00a73e4491f514855a8d0a0033635bd3422e34f07c8b78fc9b5f129c6", "fields": {}}, {"id": 140586447558912, "module": "xpmir.learning.optim", "type": "ParameterOptimizer", "typename": "xpmir.learning.optim.ParameterOptimizer", "identifier": "da915205131da7cda79f1bf9165470e909e647fb3a8f8b47ea895840972f1cc0", "fields": {"optimizer": {"type": "python", "value": 140586447557952}, "scheduler": {"type": "python", "value": 140586447557760}, "module": null, "filter": {"type": "python", "value": 140586447560880}}}, {"id": 140586451483808, "module": "datamaestro_text.datasets.irds.data", "type": "Documents", "typename": "datamaestro_text.datasets.irds.data.Documents", "identifier": "b719776c0c0b8a51534153659c8b6f87e0b5ae363c216ee129e379cecd1bf69b", "fields": {"irds": "msmarco-passage", "id": "irds.msmarco-passage.documents@irds", "count": null}}, {"id": 140586451481504, "module": "datamaestro_text.datasets.irds.data", "type": "Topics", "typename": "datamaestro_text.datasets.irds.data.Topics", "identifier": "a3ae62e29aba384f96996304c8391ebdb588b1122062249c9c73f1b124ea50c6", "fields": {"irds": "msmarco-passage/dev", "id": "irds.msmarco-passage.dev.queries@irds"}}, {"id": 140586451484576, "module": "datamaestro_text.datasets.irds.data", "type": "AdhocAssessments", "typename": "datamaestro_text.datasets.irds.data.AdhocAssessments", "identifier": "3ceb38ab1310d6f2b5c59979fd59e4490490048b08732f4c9f812883ad6268b7", "fields": {"irds": "msmarco-passage/dev", "id": "irds.msmarco-passage.dev.qrels@irds"}}, {"id": 140586451483280, "module": "datamaestro_text.datasets.irds.data", "type": "Adhoc", "typename": "datamaestro_text.datasets.irds.data.Adhoc", "identifier": "7966d82da2dcaa72d9c10048451f8f82189b8963ae23f358e42956b26a0ce968", "fields": {"irds": "msmarco-passage/dev", "id": "irds.msmarco-passage.dev@irds", "documents": {"type": "python", "value": 140586451483808}, "topics": {"type": "python", "value": 140586451481504}, "assessments": {"type": "python", "value": 140586451484576}}}, {"id": 140586451484384, "module": "datamaestro_text.datasets.irds.data", "type": "Topics", "typename": "datamaestro_text.datasets.irds.data.Topics", "identifier": "86709e8385743a96e30aae2809a36426e24e4a6a87cc7d34cafbd67fea73edb0", "fields": {"irds": "msmarco-passage/dev/small", "id": "irds.msmarco-passage.dev.small.queries@irds"}}, {"id": 140586449962656, "module": "xpmir.datasets.adapters", "type": "RandomFold", "typename": "xpmir.datasets.adapters.RandomFold", "identifier": "8e676329a00b116571e8d450e06cdf6f1963324b940c853f67e07cbf4b7a6f97", "task": 140586449962656, "fields": {"seed": 123, "sizes": [500.0], "dataset": {"type": "python", "value": 140586451483280}, "fold": 0, "exclude": {"type": "python", "value": 140586451484384}, "assessments": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.datasets.adapters.randomfold/8e676329a00b116571e8d450e06cdf6f1963324b940c853f67e07cbf4b7a6f97/assessments.tsv"}, "topics": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.datasets.adapters.randomfold/8e676329a00b116571e8d450e06cdf6f1963324b940c853f67e07cbf4b7a6f97/topics.tsv"}}}, {"id": 140586449967984, "module": "datamaestro_text.data.ir.csv", "type": "Topics", "typename": "datamaestro_text.data.ir.csv.Topics", "identifier": "5abde23732045b71e54db55047f17792e4de0a3c0415fd44225177b3b5db3f0d", "task": 140586449962656, "fields": {"id": "", "separator": "\t", "path": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.datasets.adapters.randomfold/8e676329a00b116571e8d450e06cdf6f1963324b940c853f67e07cbf4b7a6f97/topics.tsv"}}}, {"id": 140586449969136, "module": "datamaestro_text.data.ir.trec", "type": "TrecAdhocAssessments", "typename": "datamaestro_text.data.ir.trec.TrecAdhocAssessments", "identifier": "29877bcede5ab47ca7d0bb1f0cbf406f3fb5fa9a59ddee0d68a1d9786c0eb6ec", "task": 140586449962656, "fields": {"id": "", "path": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.datasets.adapters.randomfold/8e676329a00b116571e8d450e06cdf6f1963324b940c853f67e07cbf4b7a6f97/assessments.tsv"}}}, {"id": 140586449970144, "module": "datamaestro_text.data.ir", "type": "Adhoc", "typename": "datamaestro_text.data.ir.Adhoc", "identifier": "009de43e24e54d97678e4e86d904758a861f4485593638f855c291a40df337a9", "task": 140586449962656, "fields": {"id": "", "documents": {"type": "python", "value": 140586451483808}, "topics": {"type": "python", "value": 140586449967984}, "assessments": {"type": "python", "value": 140586449969136}}}, {"id": 140586449961264, "module": "datamaestro_text.datasets.irds.data", "type": "Documents", "typename": "datamaestro_text.datasets.irds.data.Documents", "identifier": "b719776c0c0b8a51534153659c8b6f87e0b5ae363c216ee129e379cecd1bf69b", "fields": {"irds": "msmarco-passage", "id": "irds.msmarco-passage.documents@irds", "count": null}}, {"id": 140586450288752, "module": "xpmir.interfaces.anserini", "type": "IndexCollection", "typename": "xpmir.interfaces.anserini.IndexCollection", "identifier": "9aed5a0f6654836687d082284725f0d459cd00f69b6e703e815fdcd9cab2a5cf", "task": 140586450288752, "fields": {"id": "", "count": null, "path": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.interfaces.anserini.indexcollection/9aed5a0f6654836687d082284725f0d459cd00f69b6e703e815fdcd9cab2a5cf/index"}, "storePositions": false, "storeDocvectors": false, "storeRaw": false, "storeContents": false, "stemmer": "porter", "threads": 8, "documents": {"type": "python", "value": 140586449961264}, "thread": 8}}, {"id": 140586449974704, "module": "xpmir.rankers.standard", "type": "BM25", "typename": "xpmir.rankers.standard.BM25", "identifier": "feccdba59a7375ef738014135a63ca2a375baf9cfa7695a822094d13a6b94349", "fields": {"k1": 0.9, "b": 0.4}}, {"id": 140586450300992, "module": "xpmir.interfaces.anserini", "type": "AnseriniRetriever", "typename": "xpmir.interfaces.anserini.AnseriniRetriever", "identifier": "a4a8ce364e9802c1f6016a3666391c243a93da67fc516decde05d8ad59d65298", "fields": {"store": null, "index": {"type": "python", "value": 140586450288752}, "model": {"type": "python", "value": 140586449974704}, "k": 50}}, {"id": 140586450301520, "module": "xpmir.datasets.adapters", "type": "RetrieverBasedCollection", "typename": "xpmir.datasets.adapters.RetrieverBasedCollection", "identifier": "c2eb722adcecabbd802d1aad3ceefba37bce8e554003dc243767b0b39d083a4b", "task": 140586450301520, "fields": {"relevance_threshold": 0.0, "dataset": {"type": "python", "value": 140586449970144}, "retrievers": [{"type": "python", "value": 140586450300992}], "keepRelevant": true, "keepNotRelevant": false, "docids_path": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.datasets.adapters.retrieverbasedcollection/c2eb722adcecabbd802d1aad3ceefba37bce8e554003dc243767b0b39d083a4b/docids.txt"}}}, {"id": 140586450296480, "module": "xpmir.datasets.adapters", "type": "DocumentSubset", "typename": "xpmir.datasets.adapters.DocumentSubset", "identifier": "2861abea3c02391600acf3498bd14152485c1185690bdbdc07899ca265297afd", "task": 140586450301520, "fields": {"id": "", "count": null, "base": {"type": "python", "value": 140586451483808}, "docids_path": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.datasets.adapters.retrieverbasedcollection/c2eb722adcecabbd802d1aad3ceefba37bce8e554003dc243767b0b39d083a4b/docids.txt"}, "in_memory": true}}, {"id": 140586450304832, "module": "datamaestro_text.data.ir", "type": "Adhoc", "typename": "datamaestro_text.data.ir.Adhoc", "identifier": "e89b348799bd3c507952272d0b48aac48d0d904141ff71f16d64045ab9c33069", "fields": {"id": "", "documents": {"type": "python", "value": 140586450296480}, "topics": {"type": "python", "value": 140586449967984}, "assessments": {"type": "python", "value": 140586449969136}}}, {"id": 140586447553488, "module": "xpmir.learning.batchers", "type": "PowerAdaptativeBatcher", "typename": "xpmir.learning.batchers.PowerAdaptativeBatcher", "identifier": "d24714900555b64e89e6b113c85846846aef0e48ba995681f286cea11c607735", "fields": {}}, {"id": 140586836256384, "module": "xpmir.learning.devices", "type": "CudaDevice", "typename": "xpmir.learning.devices.CudaDevice", "identifier": "fa61b710c002a8ae4e60c2c6a25a9355a25a7c3f5457794426af0d16da42d26d", "fields": {"gpu_determ": false, "cpu_fallback": false, "distributed": false}}, {"id": 140586447554064, "module": "xpmir.rankers.full", "type": "FullRetrieverRescorer", "typename": "xpmir.rankers.full.FullRetrieverRescorer", "identifier": "694328d0339809dfdc05a62baa73b0ceacf7d44645f8b6b580b921c1fa5571e0", "fields": {"store": null, "documents": {"type": "python", "value": 140586450296480}, "scorer": {"type": "python", "value": 140586450392816}, "batchsize": 200, "batcher": {"type": "python", "value": 140586447553488}, "device": {"type": "python", "value": 140586836256384}}}, {"id": 140586447555456, "module": "xpmir.letor.learner", "type": "ValidationListener", "typename": "xpmir.letor.learner.ValidationListener", "identifier": "5add8ef2dd88026f7bd2846cd05e9ec9e1e2a0b85d6009f4ac7ecad9227ddb8f", "fields": {"id": "bestval", "metrics": {"RR@10": true, "AP": false, "nDCG@10": false}, "dataset": {"type": "python", "value": 140586450304832}, "retriever": {"type": "python", "value": 140586447554064}, "warmup": -1, "bestpath": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.learning.learner.learner/e80c2fa3423d482c97c422a696cc591af2a1c56126b481ab7162fbfc7dfc8982/out/listeners/0/best"}, "info": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.learning.learner.learner/e80c2fa3423d482c97c422a696cc591af2a1c56126b481ab7162fbfc7dfc8982/out/listeners/0/info.json"}, "validation_interval": 40, "early_stop": 0}}, {"id": 140586449368208, "module": "xpmir.distributed", "type": "DistributedHook", "typename": "xpmir.distributed.DistributedHook", "identifier": "73bc56a2a8123cc2e217e05e778252158bf47a3b36e2fe390f4fa77cf24c3572", "meta": true, "fields": {"models": [{"type": "python", "value": 140586450388832}, {"type": "python", "value": 140586450392576}]}}, {"id": 140586447561168, "module": "xpmir.learning.learner", "type": "Learner", "typename": "xpmir.learning.learner.Learner", "identifier": "e80c2fa3423d482c97c422a696cc591af2a1c56126b481ab7162fbfc7dfc8982", "task": 140586447561168, "fields": {"random": {"type": "python", "value": 140586835900928}, "trainer": {"type": "python", "value": 140586449366960}, "model": {"type": "python", "value": 140586450392816}, "max_epochs": 1200, "steps_per_epoch": 128, "use_fp16": true, "optimizers": [{"type": "python", "value": 140586447558912}], "listeners": [{"type": "python", "value": 140586447555456}], "checkpoint_interval": 1, "logpath": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.learning.learner.learner/e80c2fa3423d482c97c422a696cc591af2a1c56126b481ab7162fbfc7dfc8982/runs"}, "checkpointspath": {"type": "path", "value": "/gpfsscratch/rech/iea/upo82uo/experiments/neuralir/jobs/xpmir.learning.learner.learner/e80c2fa3423d482c97c422a696cc591af2a1c56126b481ab7162fbfc7dfc8982/checkpoints"}, "device": {"type": "python", "value": 140586836256384}, "hooks": [{"type": "python", "value": 140586449368208}], "use_pretasks": false}}, {"id": 140586447566064, "module": "xpmir.learning.optim", "type": "ModuleLoader", "typename": "xpmir.learning.optim.ModuleLoader", "identifier": "e88360d409dad308ff598d25e3232edf903c073980d21352b305745947d04921", "task": 140586447561168, "fields": {"value": {"type": "python", "value": 140586450392816}, "path": {"type": "path.serialized", "value": "path", "is_folder": false}}}]