from flask import Flask, request, render_template
from transformers import RobertaTokenizer, RobertaForSequenceClassification
from bs4 import BeautifulSoup
from langdetect import detect
import json
import torch
import os
app = Flask(__name__)
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Writable cache directory for Hugging Face model downloads
cache_dir = "/code/cache/huggingface"
if not os.path.exists(cache_dir):
    try:
        os.makedirs(cache_dir, exist_ok=True)
        os.chmod(cache_dir, 0o777)  # Read, write, and execute for all users so the app can cache downloads
    except Exception as e:
        print(f"Failed to create or set permissions for directory {cache_dir}: {e}")
# Load model and tokenizer
MODEL_PATH = "pankaj100567/Intent-classification"
tokenizer = RobertaTokenizer.from_pretrained(MODEL_PATH, cache_dir=cache_dir)
model = RobertaForSequenceClassification.from_pretrained(MODEL_PATH, cache_dir=cache_dir, num_labels=150)
model.eval().to(device)  # Put the model on the same device the inputs will use, once, at startup
# Load label mappings: surprise.solution contains one JSON object per line with an 'intent' field
solution_file_path = 'surprise.solution'
with open(solution_file_path, 'r') as solutions_file:
    solutions = [json.loads(line) for line in solutions_file]

# Deduplicate intents while preserving first-seen order, then build the label <-> id maps
unique_labels = list(dict.fromkeys(entry['intent'] for entry in solutions))
label2id = {label: i for i, label in enumerate(unique_labels)}
id2label = {i: label for label, i in label2id.items()}
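# Sanity check (assumption: the checkpoint was fine-tuned with one output unit per intent,
# matching num_labels=150 above); warn early if the solution file disagrees.
if len(unique_labels) != model.config.num_labels:
    print(f"Warning: found {len(unique_labels)} unique intents but the model expects "
          f"{model.config.num_labels}; id2label lookups may be wrong.")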
@app.route('/')
def index():
    return render_template('index.html')
@app.route('/classify', methods=['POST'])
def classify():
    try:
        sentence = request.form['sentence']
        # Strip any HTML markup from the submitted text
        soup = BeautifulSoup(sentence, "html.parser")
        cleaned_sentence = soup.get_text().strip()
        if detect(cleaned_sentence) != 'en':
            return render_template('result.html', error="Please enter the sentence in English.")
        encodings = tokenizer(cleaned_sentence, return_tensors="pt", padding=True, truncation=True, max_length=512)
        input_ids = encodings['input_ids'].to(device)
        attention_mask = encodings['attention_mask'].to(device)
        # A single sentence needs no DataLoader: run one forward pass directly
        with torch.no_grad():
            outputs = model(input_ids=input_ids, attention_mask=attention_mask)
        probabilities = torch.softmax(outputs.logits, dim=1)
        predicted_class = torch.argmax(probabilities, dim=1).item()
        predicted_intent = id2label[predicted_class]
        return render_template('result.html', intent=predicted_intent, sentence=cleaned_sentence)
    except Exception as e:
        return render_template('result.html', error=str(e))
if __name__ == '__main__':
    app.run(debug=True)
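# Example request against a local run (assumption: Flask's default port 5000):
#   curl -X POST -d "sentence=wake me up at 7 am" http://127.0.0.1:5000/classify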