nsthorat committed on
Commit
658a14c
1 Parent(s): e779420
data/concept/lilac/toxicity/cohere.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:670e81b8448ab0ee5161a42b523410b3af80c6ccce8003cae78edebb9d0981c4
3
- size 9720631
 
 
 
 
data/concept/lilac/toxicity/concept.json DELETED
The diff for this file is too large to render. See raw diff
 
data/concept/lilac/toxicity/openai.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e15e8235c2152b1412a8e2dee3dcb94b23e95f1fde6fb60f01b876a832e46404
3
- size 3678199
 
 
 
 
data/concept/lilac/toxicity/sbert.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ac8b304760c88242eb6c567e1af87fd87731a192308df8cf43b253e24d2b0ec
3
- size 959111
 
 
 
 
data/datasets/local/spotify/data-00000-of-00001.parquet DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:32224657332b09187a737c73ab634f9d14c9ba9a240bd105f1b9819cde2afcef
3
- size 37128682
 
 
 
 
data/datasets/local/spotify/manifest.json DELETED
@@ -1,27 +0,0 @@
1
- {
2
- "files": [
3
- "data-00000-of-00001.parquet"
4
- ],
5
- "data_schema": {
6
- "fields": {
7
- "artist": {
8
- "dtype": "string"
9
- },
10
- "song": {
11
- "dtype": "string"
12
- },
13
- "link": {
14
- "dtype": "string"
15
- },
16
- "text": {
17
- "dtype": "string"
18
- },
19
- "__line_number__": {
20
- "dtype": "int64"
21
- },
22
- "__rowid__": {
23
- "dtype": "string"
24
- }
25
- }
26
- }
27
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
data/datasets/local/spotify/text/.concepts/local/outer_space/sbert-neg-100.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:39c785533ab17c040510b58b31990ba24b78646cbdfe86273973efa62ba20ebf
3
- size 165756
 
 
 
 
data/datasets/local/spotify/text/.concepts/local/outerspace/sbert-neg-100.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d95df038f05560b0e4429c43945eb6e773b668b805ae8f6c014529acbeeb755e
3
- size 185263
 
 
 
 
data/datasets/local/spotify/text/sbert/data-00000-of-00001.parquet DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9796beb630cc3503f3c2ac9db8f71e4c1604570836d78bbf364e801cd427c39e
3
- size 2709987
 
 
 
 
data/datasets/local/spotify/text/sbert/embeddings-00000-of-00001.keys.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5df43291782b8c731d4ce56537946654c642a01dc9a4e37de394836362f6b45
3
- size 3727400
 
 
 
 
data/datasets/local/spotify/text/sbert/embeddings-00000-of-00001.npy DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:94e10c23d7229541e1f60b791a659d13673b10a03649abf0ae092e0e18c5aee3
3
- size 170446976
 
 
 
 
data/datasets/local/spotify/text/sbert/signal_manifest.json DELETED
@@ -1,37 +0,0 @@
1
- {
2
- "files": [
3
- "data-00000-of-00001.parquet"
4
- ],
5
- "parquet_id": "sbert(text)",
6
- "data_schema": {
7
- "fields": {
8
- "__rowid__": {
9
- "dtype": "string"
10
- },
11
- "text": {
12
- "fields": {
13
- "sbert": {
14
- "repeated_field": {
15
- "fields": {
16
- "embedding": {
17
- "dtype": "embedding"
18
- }
19
- },
20
- "dtype": "string_span"
21
- },
22
- "signal": {
23
- "signal_name": "sbert"
24
- }
25
- }
26
- }
27
- }
28
- }
29
- },
30
- "signal": {
31
- "signal_name": "sbert"
32
- },
33
- "enriched_path": [
34
- "text"
35
- ],
36
- "embedding_filename_prefix": "embeddings-00000-of-00001"
37
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
src/concepts/db_concept.py CHANGED
@@ -324,6 +324,7 @@ class DiskConceptDB(ConceptDB):
324
  # Read the concepts and return a ConceptInfo containing the namespace and name.
325
  concept_infos = []
326
  for root, _, files in os.walk(self._base_dir):
 
327
  for file in files:
328
  if file == CONCEPT_JSON_FILENAME:
329
  namespace, name = root.split('/')[-2:]
 
324
  # Read the concepts and return a ConceptInfo containing the namespace and name.
325
  concept_infos = []
326
  for root, _, files in os.walk(self._base_dir):
327
+ print(root, files)
328
  for file in files:
329
  if file == CONCEPT_JSON_FILENAME:
330
  namespace, name = root.split('/')[-2:]
src/server.py CHANGED
@@ -106,7 +106,7 @@ def startup() -> None:
106
  for concept in concepts:
107
  spaces_concept_output_dir = get_concept_output_dir(spaces_data_dir, concept.namespace,
108
  concept.name)
109
- persistent_output_dir = get_dataset_output_dir(data_path(), concept.namespace, concept.name)
110
  shutil.rmtree(persistent_output_dir, ignore_errors=True)
111
  shutil.move(spaces_concept_output_dir, persistent_output_dir)
112
 
 
106
  for concept in concepts:
107
  spaces_concept_output_dir = get_concept_output_dir(spaces_data_dir, concept.namespace,
108
  concept.name)
109
+ persistent_output_dir = get_concept_output_dir(data_path(), concept.namespace, concept.name)
110
  shutil.rmtree(persistent_output_dir, ignore_errors=True)
111
  shutil.move(spaces_concept_output_dir, persistent_output_dir)
112