Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -3,10 +3,11 @@ os.system('pip install transformers')
|
|
3 |
# Import the necessary libraries
|
4 |
import os
|
5 |
os.system('pip install torch')
|
|
|
6 |
from transformers import AutoModel, AutoTokenizer
|
7 |
import torch
|
8 |
from torch.utils.data import DataLoader, Dataset
|
9 |
-
from sklearn.model_selection import train_test_split
|
10 |
import pandas as pd
|
11 |
import gradio as gr
|
12 |
|
@@ -14,9 +15,9 @@ import gradio as gr
|
|
14 |
model = AutoModel.from_pretrained("Alibaba-NLP/gte-multilingual-base", trust_remote_code=True)
|
15 |
tokenizer = AutoTokenizer.from_pretrained("Alibaba-NLP/gte-multilingual-base", trust_remote_code=True)
|
16 |
|
17 |
-
# Function to load
|
18 |
def load_dataset():
|
19 |
-
df = pd.read_excel("your_dataset.xlsx") # Ensure
|
20 |
print("Columns in the dataset:", df.columns.tolist())
|
21 |
return df
|
22 |
|
|
|
3 |
# Import the necessary libraries
|
4 |
import os
|
5 |
os.system('pip install torch')
|
6 |
+
# Import the necessary libraries
|
7 |
from transformers import AutoModel, AutoTokenizer
|
8 |
import torch
|
9 |
from torch.utils.data import DataLoader, Dataset
|
10 |
+
from sklearn.model_selection import train_test_split # Importing train_test_split from scikit-learn
|
11 |
import pandas as pd
|
12 |
import gradio as gr
|
13 |
|
|
|
15 |
model = AutoModel.from_pretrained("Alibaba-NLP/gte-multilingual-base", trust_remote_code=True)
|
16 |
tokenizer = AutoTokenizer.from_pretrained("Alibaba-NLP/gte-multilingual-base", trust_remote_code=True)
|
17 |
|
18 |
+
# Function to load the dataset
|
19 |
def load_dataset(path: str = "your_dataset.xlsx"):
    """Load the dataset from an Excel workbook into a DataFrame.

    Args:
        path: Location of the Excel file to read. Defaults to
            ``"your_dataset.xlsx"`` in the current working directory, which
            is the file the function always read before this parameter
            existed.

    Returns:
        The ``pandas.DataFrame`` produced by ``pd.read_excel`` for ``path``.

    Raises:
        FileNotFoundError: If ``path`` does not exist (raised by pandas).
    """
    df = pd.read_excel(path)
    # Echo the column names so a mismatch with what the caller expects is
    # visible in the logs as soon as the file is loaded.
    print("Columns in the dataset:", df.columns.tolist())
    return df
|
23 |
|