atifsial123 committed on
Commit
bf33cf7
·
verified ·
1 Parent(s): 3af39a2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -3,10 +3,11 @@ os.system('pip install transformers')
3
  # Import the necessary libraries
4
  import os
5
  os.system('pip install torch')
 
6
  from transformers import AutoModel, AutoTokenizer
7
  import torch
8
  from torch.utils.data import DataLoader, Dataset
9
- from sklearn.model_selection import train_test_split
10
  import pandas as pd
11
  import gradio as gr
12
 
@@ -14,9 +15,9 @@ import gradio as gr
14
  model = AutoModel.from_pretrained("Alibaba-NLP/gte-multilingual-base", trust_remote_code=True)
15
  tokenizer = AutoTokenizer.from_pretrained("Alibaba-NLP/gte-multilingual-base", trust_remote_code=True)
16
 
17
- # Function to load dataset (adjust this function if your dataset is complex)
18
  def load_dataset():
19
- df = pd.read_excel("your_dataset.xlsx") # Ensure this file exists in your working directory
20
  print("Columns in the dataset:", df.columns.tolist())
21
  return df
22
 
 
3
  # Import the necessary libraries
4
  import os
5
  os.system('pip install torch')
6
+ # Import the necessary libraries
7
  from transformers import AutoModel, AutoTokenizer
8
  import torch
9
  from torch.utils.data import DataLoader, Dataset
10
+ from sklearn.model_selection import train_test_split # Importing train_test_split from scikit-learn
11
  import pandas as pd
12
  import gradio as gr
13
 
 
15
  model = AutoModel.from_pretrained("Alibaba-NLP/gte-multilingual-base", trust_remote_code=True)
16
  tokenizer = AutoTokenizer.from_pretrained("Alibaba-NLP/gte-multilingual-base", trust_remote_code=True)
17
 
18
+ # Function to load the dataset
19
  def load_dataset():
20
+ df = pd.read_excel("your_dataset.xlsx") # Ensure the file name and path are correct
21
  print("Columns in the dataset:", df.columns.tolist())
22
  return df
23