davidheineman committed on
Commit
2d0fea9
1 Parent(s): 240668f

add full metadata

Browse files
Files changed (2) hide show
  1. .gitattributes +1 -0
  2. index/metadata.json +3 -62
.gitattributes CHANGED
@@ -36,3 +36,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
36
  *.bib filter=lfs diff=lfs merge=lfs -text
37
  collection.json filter=lfs diff=lfs merge=lfs -text
38
  dataset.json filter=lfs diff=lfs merge=lfs -text
 
 
36
  *.bib filter=lfs diff=lfs merge=lfs -text
37
  collection.json filter=lfs diff=lfs merge=lfs -text
38
  dataset.json filter=lfs diff=lfs merge=lfs -text
39
+ index/metadata.json filter=lfs diff=lfs merge=lfs -text
index/metadata.json CHANGED
@@ -1,62 +1,3 @@
1
- {
2
- "config": {
3
- "query_token_id": "[unused0]",
4
- "doc_token_id": "[unused1]",
5
- "query_token": "[Q]",
6
- "doc_token": "[D]",
7
- "ncells": null,
8
- "centroid_score_threshold": null,
9
- "ndocs": null,
10
- "load_index_with_mmap": false,
11
- "index_path": null,
12
- "nbits": 2,
13
- "kmeans_niters": 4,
14
- "resume": false,
15
- "similarity": "cosine",
16
- "bsize": 64,
17
- "accumsteps": 1,
18
- "lr": 3e-6,
19
- "maxsteps": 500000,
20
- "save_every": null,
21
- "warmup": null,
22
- "warmup_bert": null,
23
- "relu": false,
24
- "nway": 2,
25
- "use_ib_negatives": false,
26
- "reranker": false,
27
- "distillation_alpha": 1.0,
28
- "ignore_scores": false,
29
- "model_name": null,
30
- "query_maxlen": 32,
31
- "attend_to_mask_tokens": false,
32
- "interaction": "colbert",
33
- "dim": 128,
34
- "doc_maxlen": 10,
35
- "mask_punctuation": true,
36
- "checkpoint": "colbert-ir\/colbertv2.0",
37
- "triples": null,
38
- "collection": [
39
- "list with 46880 elements starting with...",
40
- [
41
- "Position paper for YRRSDS 2023",
42
- "In this position paper, I will present the research interests in my PostDoc on safety and robustness specific to conversational AI, including then relevant overlap from my PhD.",
43
- "Speech production is nuanced and unique to every individual, but today{'}s Spoken Dialogue Systems (SDSs) are trained to use general speech patterns to successfully improve performance on various evaluation metrics. However, these patterns do not apply to certain user groups - often the very people that can benefit the most from SDSs. For example, people with dementia produce more disfluent speech than the general population. The healthcare domain is now a popular setting for spoken dialogue and human-robot interaction research. This trend is similar when observing company behaviour. Charities promote industry voice assistants, the creators are getting HIPAA compliance, and their features sometimes target vulnerable user groups. It is therefore critical to adapt SDSs to be more accessible."
44
- ]
45
- ],
46
- "queries": null,
47
- "index_name": "index-1",
48
- "overwrite": false,
49
- "root": "\/content\/experiments",
50
- "experiment": "notebook",
51
- "index_root": null,
52
- "name": "2024-04\/14\/15.49.20",
53
- "rank": 0,
54
- "nranks": 1,
55
- "amp": true,
56
- "gpus": 1
57
- },
58
- "num_chunks": 2,
59
- "num_partitions": 8192,
60
- "num_embeddings": 440546,
61
- "avg_doclen": 9.39731228668942
62
- }
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fabe6f5e95f0eb8bee525adc7ab82d7fe275dc862e354f200eb494a74b2b23ea
3
+ size 45753744