Spaces:
Runtime error
Runtime error
Change the index to use the dataset name only, without the user namespace
Browse files
app.py
CHANGED
@@ -88,7 +88,7 @@ def dataset_with_info(dataset):
|
|
88 |
"downloads": dataset.downloads,
|
89 |
"created_at": dataset.created_at,
|
90 |
"tags": dataset.tags,
|
91 |
-
"text": f"{dataset.id}-{','.join(list(columns.keys()))}",
|
92 |
}
|
93 |
except Exception as e:
|
94 |
logger.error(f"Failed to get info for {dataset.id}: {e}")
|
@@ -134,7 +134,6 @@ def search(dataset_name, k):
|
|
134 |
print(f"start search for {dataset_name}")
|
135 |
try:
|
136 |
dataset_row = all_datasets_df[all_datasets_df.dataset == dataset_name].iloc[0]
|
137 |
-
print(dataset_row)
|
138 |
except IndexError:
|
139 |
return pd.DataFrame([{"error": "β Dataset does not exist or is not supported"}])
|
140 |
text = dataset_row["text"]
|
@@ -143,12 +142,9 @@ def search(dataset_name, k):
|
|
143 |
faiss.normalize_L2(_vector)
|
144 |
distances, ann = index.search(_vector, k=k)
|
145 |
results = pd.DataFrame({"distances": distances[0], "ann": ann[0]})
|
146 |
-
print("results for distances and ann")
|
147 |
-
print(results)
|
148 |
merge = pd.merge(results, all_datasets_df, left_on="ann", right_index=True)
|
149 |
-
print("resultst for merged df (distances,ann, dataset info)")
|
150 |
merge["dataset"] = merge["dataset"].apply(render_model_hub_link)
|
151 |
-
return merge
|
152 |
|
153 |
|
154 |
with gr.Blocks() as demo:
|
|
|
88 |
"downloads": dataset.downloads,
|
89 |
"created_at": dataset.created_at,
|
90 |
"tags": dataset.tags,
|
91 |
+
"text": f"{str(dataset.id).split('/')[-1]}-{','.join(list(columns.keys()))}",
|
92 |
}
|
93 |
except Exception as e:
|
94 |
logger.error(f"Failed to get info for {dataset.id}: {e}")
|
|
|
134 |
print(f"start search for {dataset_name}")
|
135 |
try:
|
136 |
dataset_row = all_datasets_df[all_datasets_df.dataset == dataset_name].iloc[0]
|
|
|
137 |
except IndexError:
|
138 |
return pd.DataFrame([{"error": "β Dataset does not exist or is not supported"}])
|
139 |
text = dataset_row["text"]
|
|
|
142 |
faiss.normalize_L2(_vector)
|
143 |
distances, ann = index.search(_vector, k=k)
|
144 |
results = pd.DataFrame({"distances": distances[0], "ann": ann[0]})
|
|
|
|
|
145 |
merge = pd.merge(results, all_datasets_df, left_on="ann", right_index=True)
|
|
|
146 |
merge["dataset"] = merge["dataset"].apply(render_model_hub_link)
|
147 |
+
return merge.drop("text", axis=1)
|
148 |
|
149 |
|
150 |
with gr.Blocks() as demo:
|