nsthorat-lilac committed on
Commit
4c2c3ca
1 Parent(s): ebbf600

Push to HF space

Browse files
.gitattributes CHANGED
@@ -93,3 +93,5 @@ data/.cache/lilac/local/Capybara/conversation/\*/input__cluster.jsonl filter=lfs
93
  data/.cache/lilac/hf_download/lilacai/hermes-clusters-local-OpenHermes-2.5/local/OpenHermes-2.5/prompt__cluster-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
94
  data/.cache/lilac/hf_download/lilacai/hermes-clusters-local-OpenHermes-2.5/local/OpenHermes-2.5/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
95
  data/.cache/lilac/hf_download/lilacai/hermes-clusters-local-OpenHermes-2.5/local/OpenHermes-2.5/prompt-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
 
 
 
93
  data/.cache/lilac/hf_download/lilacai/hermes-clusters-local-OpenHermes-2.5/local/OpenHermes-2.5/prompt__cluster-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
94
  data/.cache/lilac/hf_download/lilacai/hermes-clusters-local-OpenHermes-2.5/local/OpenHermes-2.5/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
95
  data/.cache/lilac/hf_download/lilacai/hermes-clusters-local-OpenHermes-2.5/local/OpenHermes-2.5/prompt-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
96
+ data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/local/Capybara/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
97
+ data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/local/Capybara/input-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/dataset_config.yml ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ namespace: local
2
+ name: Capybara
3
+ source:
4
+ dataset_name: LDJnr/Capybara
5
+ source_name: huggingface
6
+ signals:
7
+ - path:
8
+ - conversation
9
+ - '*'
10
+ - input
11
+ signal:
12
+ signal_name: text_statistics
13
+ settings:
14
+ ui:
15
+ media_paths:
16
+ - - conversation
17
+ - '*'
18
+ - input
19
+ - - conversation
20
+ - '*'
21
+ - output
22
+ - input
23
+ markdown_paths: []
data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/local/Capybara/conversation/input/text_statistics/data-00000-of-00001.parquet ADDED
Binary file (920 kB). View file
 
data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/local/Capybara/conversation/input/text_statistics/signal_manifest.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "files": [
3
+ "data-00000-of-00001.parquet"
4
+ ],
5
+ "parquet_id": "conversation.input.text_statistics",
6
+ "data_schema": {
7
+ "fields": {
8
+ "conversation": {
9
+ "repeated_field": {
10
+ "fields": {
11
+ "input": {
12
+ "fields": {
13
+ "text_statistics": {
14
+ "fields": {
15
+ "num_characters": {
16
+ "dtype": {
17
+ "type": "int32"
18
+ }
19
+ },
20
+ "readability": {
21
+ "dtype": {
22
+ "type": "float32"
23
+ }
24
+ },
25
+ "log(type_token_ratio)": {
26
+ "dtype": {
27
+ "type": "float32"
28
+ }
29
+ },
30
+ "frac_non_ascii": {
31
+ "dtype": {
32
+ "type": "float32"
33
+ },
34
+ "bins": [
35
+ [
36
+ "Low",
37
+ null,
38
+ 0.15
39
+ ],
40
+ [
41
+ "Medium",
42
+ 0.15,
43
+ 0.3
44
+ ],
45
+ [
46
+ "High",
47
+ 0.3,
48
+ null
49
+ ]
50
+ ]
51
+ }
52
+ },
53
+ "signal": {
54
+ "signal_name": "text_statistics"
55
+ }
56
+ }
57
+ }
58
+ }
59
+ }
60
+ }
61
+ }
62
+ }
63
+ },
64
+ "signal": {
65
+ "signal_name": "text_statistics"
66
+ },
67
+ "enriched_path": [
68
+ "conversation",
69
+ "*",
70
+ "input"
71
+ ],
72
+ "py_version": "0.2.0"
73
+ }
data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/local/Capybara/data-00000-of-00001.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d65eea22b7c3bed4fe945881d287ecbbaa58f37f23e51da75e31d6b51da27494
3
+ size 22848802
data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/local/Capybara/input-00000-of-00001.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e58ef67136014e702822e3791b38fd7b89e5dcd060a592865e1a959f7b95f5be
3
+ size 7299202
data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/local/Capybara/input.map_manifest.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "files": [
3
+ "input-00000-of-00001.parquet"
4
+ ],
5
+ "parquet_id": "map.input",
6
+ "data_schema": {
7
+ "fields": {
8
+ "input": {
9
+ "dtype": {
10
+ "type": "string"
11
+ },
12
+ "map": {
13
+ "fn_name": "join",
14
+ "fn_source": "def join(item):\n return '\\n'.join([x['input']['__value__'] for x in item['conversation']])\n",
15
+ "date_created": "2024-01-09T14:53:44.410899"
16
+ }
17
+ }
18
+ }
19
+ },
20
+ "py_version": "0.2.0"
21
+ }
data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/local/Capybara/input__cluster-00000-of-00001.parquet ADDED
Binary file (886 kB). View file
 
data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/local/Capybara/input__cluster.map_manifest.json ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "files": ["input__cluster-00000-of-00001.parquet"],
3
+ "parquet_id": "map.input__cluster",
4
+ "data_schema": {
5
+ "fields": {
6
+ "input__cluster": {
7
+ "fields": {
8
+ "cluster_id": {
9
+ "dtype": {
10
+ "type": "int32"
11
+ },
12
+ "categorical": true
13
+ },
14
+ "cluster_membership_prob": {
15
+ "dtype": {
16
+ "type": "float32"
17
+ }
18
+ },
19
+ "cluster_title": {
20
+ "dtype": {
21
+ "type": "string"
22
+ }
23
+ },
24
+ "category_id": {
25
+ "dtype": {
26
+ "type": "int32"
27
+ },
28
+ "categorical": true
29
+ },
30
+ "category_membership_prob": {
31
+ "dtype": {
32
+ "type": "float32"
33
+ }
34
+ },
35
+ "category_title": {
36
+ "dtype": {
37
+ "type": "string"
38
+ }
39
+ }
40
+ },
41
+ "cluster": {
42
+ "min_cluster_size": 5,
43
+ "remote": true,
44
+ "input_path": ["input"]
45
+ }
46
+ }
47
+ }
48
+ },
49
+ "py_version": "0.2.0"
50
+ }
data/.cache/lilac/hf_download/lilacai/nikhil_staging-local-Capybara/local/Capybara/manifest.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "files": [
3
+ "data-00000-of-00001.parquet"
4
+ ],
5
+ "data_schema": {
6
+ "fields": {
7
+ "source": {
8
+ "dtype": {
9
+ "type": "string"
10
+ }
11
+ },
12
+ "conversation": {
13
+ "repeated_field": {
14
+ "fields": {
15
+ "input": {
16
+ "dtype": {
17
+ "type": "string"
18
+ }
19
+ },
20
+ "output": {
21
+ "dtype": {
22
+ "type": "string"
23
+ }
24
+ }
25
+ }
26
+ }
27
+ },
28
+ "__hfsplit__": {
29
+ "dtype": {
30
+ "type": "string"
31
+ }
32
+ }
33
+ }
34
+ },
35
+ "source": {
36
+ "dataset_name": "LDJnr/Capybara",
37
+ "load_from_disk": false,
38
+ "source_name": "huggingface"
39
+ }
40
+ }
dist/lilac-1337.0.0-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:500b27604324ad6bae259c773d44486872a1754c0b89e6be97fe1b81a3e635e6
3
- size 2477986
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ec9c9a251903209d6c3377ba6cc361a0d0533f87ce7f82d01b2df69ea1fe230
3
+ size 2478036