NeuralChat

Paused

App Files Files Community

NeuralChat / app.py

Tonic

Update app.py

63a0917 8 months ago

raw

history blame

No virus

3.66 kB

	from transformers import AutoConfig, AutoTokenizer, AutoModelForSeq2SeqLM, AutoModelForCausalLM, MistralForCausalLM
	from peft import PeftModel, PeftConfig
	import torch
	import gradio as gr
	import random
	from textwrap import wrap


	# --- UI copy -----------------------------------------------------------
	# Bilingual (Korean / English) heading shown at the top of the demo page.
	title = "👋🏻토닉의 미스트랄메드 채팅에 오신 것을 환영합니다🚀👋🏻Welcome to Tonic's MistralMed Chat🚀"

	# Markdown blurb under the heading. Written as adjacent string literals,
	# which Python joins at compile time into one single-line string.
	description = (
	    "이 공간을 사용하여 현재 모델을 테스트할 수 있습니다. "
	    "[(Tonic/MistralMed)](https://huggingface.co/Tonic/MistralMed) "
	    "또는 이 공간을 복제하고 로컬 또는 🤗HuggingFace에서 사용할 수 있습니다. "
	    "[Discord에서 함께 만들기 위해 Discord에 가입하십시오](https://discord.gg/VqTxc76K3u). "
	    "You can use this Space to test out the current model "
	    "[(Tonic/MistralMed)](https://huggingface.co/Tonic/MistralMed) "
	    "or duplicate this Space and use it locally or on 🤗HuggingFace. "
	    "[Join me on Discord to build together](https://discord.gg/VqTxc76K3u)."
	)

	# One example row: [question text, system prompt text].
	examples = [
	    [
	        "[Question:] What is the proper treatment for buccal herpes?",
	        "You are a medicine and public health expert, you will receive a question, answer the question, and provide a complete answer",
	    ]
	]

	# --- Model identifiers -------------------------------------------------
	base_model_id = "mistralai/Mistral-7B-v0.1"
	model_directory = "Tonic/mistralmed"

	# Use the GPU when torch reports one, otherwise fall back to the CPU.
	if torch.cuda.is_available():
	    device = "cuda"
	else:
	    device = "cpu"

	def wrap_text(text, width=90):
	    """Re-wrap ``text`` so that no line is longer than ``width`` columns.

	    The input is split on ``"\\n"`` and each resulting line is wrapped
	    independently, so existing line breaks (including blank lines) are kept.

	    Args:
	        text: The string to wrap.
	        width: Maximum line length passed to ``textwrap.fill``.

	    Returns:
	        The wrapped lines joined back together with ``"\\n"``.
	    """
	    # The file only does `from textwrap import wrap`, so the module name
	    # `textwrap` is not bound at module level; import it here so the call
	    # below does not raise NameError.
	    import textwrap

	    return '\n'.join(
	        textwrap.fill(line, width=width) for line in text.split('\n')
	    )

	def multimodal_prompt(user_input, system_prompt="You are an expert medical analyst:", max_length=256):
	    """Generate a reply for ``user_input`` with the module-level PEFT model.

	    Args:
	        user_input: The question text placed inside the ``[INST]`` block.
	        system_prompt: Instruction text placed before ``user_input``.
	        max_length: Upper bound passed to ``generate`` as ``max_length``.
	            The original body read an undefined ``max_length`` name; it is
	            now a parameter whose default matches ``ChatBot.predict``.

	    Returns:
	        The first returned sequence decoded to text with special tokens
	        removed.
	    """
	    # The prompt ends at [/INST]; a trailing "</s>" (EOS) would mark the
	    # sequence as finished before the model has produced an answer.
	    formatted_input = f"<s>[INST]{system_prompt} {user_input}[/INST]"

	    # "<s>" is written out in the prompt, so automatic special tokens are
	    # disabled here.
	    encodeds = tokenizer(formatted_input, return_tensors="pt", add_special_tokens=False)
	    model_inputs = encodeds.to(device)

	    # The original referenced an undefined `model`; `peft_model` is the only
	    # model object this file creates. `temperature` and `early_stopping`
	    # were dropped: decoding is greedy (do_sample=False) with the default
	    # beam settings, so neither option is used.
	    output = peft_model.generate(
	        **model_inputs,
	        max_length=max_length,
	        use_cache=True,
	        eos_token_id=tokenizer.eos_token_id,
	        pad_token_id=tokenizer.eos_token_id,
	        do_sample=False,
	    )

	    # Decode the response
	    return tokenizer.decode(output[0], skip_special_tokens=True)


	# Tokenizer of the base checkpoint. `padding_side="left"` is passed once
	# here (the original also re-assigned the same value afterwards).
	tokenizer = AutoTokenizer.from_pretrained(base_model_id, trust_remote_code=True, padding_side="left")
	# Reuse the EOS token as the padding token.
	tokenizer.pad_token = tokenizer.eos_token

	# Adapter configuration; loaded but not read anywhere else in this section.
	peft_config = PeftConfig.from_pretrained(model_directory)

	# Load the base weights directly in bfloat16 instead of loading at the
	# default precision and casting afterwards.
	peft_model = MistralForCausalLM.from_pretrained(
	    base_model_id,
	    trust_remote_code=True,
	    torch_dtype=torch.bfloat16,
	)
	# Wrap the base model with the fine-tuned adapter weights.
	peft_model = PeftModel.from_pretrained(peft_model, model_directory)
	# Cast the wrapped model (adapter included) to bfloat16 and move it to the
	# selected device in one step.
	peft_model = peft_model.to(device=device, dtype=torch.bfloat16)

	class ChatBot:
	    """Thin wrapper that sends one prompt to the module-level PEFT model.

	    The class used to be defined twice in a row; the first definition was
	    immediately replaced by the second, so only one definition is kept.
	    """

	    def __init__(self):
	        # Initialised empty; `predict` does not read or update it.
	        self.history = []

	    def predict(self, user_input, system_prompt="You are an expert medical analyst:"):
	        """Generate a reply for a single question.

	        Args:
	            user_input: The question text placed inside the ``[INST]`` block.
	            system_prompt: Instruction text placed before ``user_input``.

	        Returns:
	            The first returned sequence decoded to text with special tokens
	            removed.
	        """
	        formatted_input = f"<s>[INST]{system_prompt} {user_input}[/INST]"
	        # "<s>" is already spelled out in the prompt, so automatic special
	        # tokens are turned off to avoid a second BOS token. Calling the
	        # tokenizer (rather than `encode`) also returns the attention mask,
	        # which is forwarded to `generate` below.
	        model_inputs = tokenizer(formatted_input, return_tensors="pt", add_special_tokens=False)
	        model_inputs = model_inputs.to(device)
	        response = peft_model.generate(
	            **model_inputs,
	            max_length=256,
	            pad_token_id=tokenizer.eos_token_id,
	        )
	        return tokenizer.decode(response[0], skip_special_tokens=True)

	# One ChatBot instance backs the whole interface.
	bot = ChatBot()

	# Two plain text inputs feed `bot.predict` and one text output shows its
	# return value. The example row is ordered [question, system prompt],
	# which matches the (user_input, system_prompt) parameter order.
	iface = gr.Interface(
	    fn=bot.predict,
	    inputs=["text", "text"],
	    outputs="text",
	    examples=examples,
	    title=title,
	    description=description,
	    theme="ParityError/Anime",
	)

	# Start the Gradio app.
	iface.launch()