{
    "query_token_id": "[unused0]",
    "doc_token_id": "[unused1]",
    "query_token": "[Q]",
    "doc_token": "[D]",
    "ncells": null,
    "centroid_score_threshold": null,
    "ndocs": null,
    "load_index_with_mmap": false,
    "index_path": null,
    "index_bsize": 64,
    "nbits": 4,
    "kmeans_niters": 4,
    "resume": false,
    "similarity": "cosine",
    "bsize": 16,
    "accumsteps": 1,
    "lr": 5e-6,
    "maxsteps": 500000,
    "save_every": 19854,
    "warmup": 19854,
    "warmup_bert": null,
    "relu": false,
    "nway": 2,
    "use_ib_negatives": true,
    "reranker": false,
    "distillation_alpha": 1.0,
    "ignore_scores": false,
    "model_name": "ColBERT-mmacro-de-1M",
    "query_maxlen": 32,
    "attend_to_mask_tokens": false,
    "interaction": "colbert",
    "dim": 128,
    "doc_maxlen": 256,
    "mask_punctuation": true,
    "checkpoint": "dbmdz\/bert-base-german-cased",
    "triples": "\/kaggle\/input\/mmarco-de-10m\/triples.train.colbert.jsonl",
    "collection": "\/kaggle\/input\/mmarco-de-10m\/corpus.train.colbert.tsv",
    "queries": "\/kaggle\/input\/mmarco-de-10m\/queries.train.colbert.tsv",
    "index_name": null,
    "overwrite": false,
    "root": ".ragatouille\/",
    "experiment": "colbert",
    "index_root": null,
    "name": "2024-02\/26\/08.29.22",
    "rank": 0,
    "nranks": 2,
    "amp": true,
    "gpus": 2,
    "avoid_fork_if_possible": false,
    "meta": {
        "hostname": "faa3efed3289",
        "current_datetime": "Feb 26, 2024 ;  7:44PM UTC (+0000)",
        "cmd": "\/opt\/conda\/lib\/python3.10\/site-packages\/ipykernel_launcher.py -f \/tmp\/tmpclobcmzl.json --HistoryManager.hist_file=:memory:",
        "version": "colbert-v0.4"
    }
}