rodrigomasini
committed on
Commit
•
dcf9bae
1
Parent(s):
7bb20e3
Update app/main.py
Browse files - app/main.py +1 -1
app/main.py
CHANGED
@@ -116,7 +116,7 @@ def chunk_embed(input_ds, input_splits, input_text_col, chunk_out_ds,
|
|
116 |
gr.Info("Started chunking")
|
117 |
try:
|
118 |
input_splits = [spl.strip() for spl in input_splits.split(",") if spl]
|
119 |
-
input_ds = load_dataset(input_ds, split="+".join(input_splits), token=HF_TOKEN)
|
120 |
chunker = Chunker(strategy, split_seq, chunk_len)
|
121 |
except Exception as e:
|
122 |
raise gr.Error(str(e))
|
|
|
116 |
gr.Info("Started chunking")
|
117 |
try:
|
118 |
input_splits = [spl.strip() for spl in input_splits.split(",") if spl]
|
119 |
+
input_ds = load_dataset(input_ds, "text-corpus", split="+".join(input_splits), token=HF_TOKEN)
|
120 |
chunker = Chunker(strategy, split_seq, chunk_len)
|
121 |
except Exception as e:
|
122 |
raise gr.Error(str(e))
|