Spaces:

pareshmishra
/

MT564AITraining

Running

MT564AITraining / swift_setup.py

pareshmishra

Add full project source files for MT564 AI

2c72e40 5 months ago

8.16 kB

	"""
	Setup Script for SWIFT MT564 Documentation Assistant

	This script guides you through setting up the project, installing dependencies,
	downloading the TinyLlama model, and uploading your fine-tuned model to Hugging Face.

	Usage:
	python setup.py --mode [install\|download\|upload] --options [options]
	"""

	import os
	import sys
	import argparse
	import subprocess
	import logging

	logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
	logger = logging.getLogger(__name__)

	def parse_args():
	parser = argparse.ArgumentParser(description="Setup SWIFT MT564 Documentation Assistant")
	parser.add_argument(
	"--mode",
	type=str,
	choices=["install", "download", "upload", "guide"],
	default="guide",
	help="Mode of operation: install dependencies, download model, upload model, or show guide"
	)
	parser.add_argument(
	"--model_name",
	type=str,
	default="TinyLlama/TinyLlama-1.1B-Chat-v1.0",
	help="Model name on Hugging Face Hub (for download mode)"
	)
	parser.add_argument(
	"--output_dir",
	type=str,
	default="./data/models",
	help="Directory to save the model (for download mode)"
	)
	parser.add_argument(
	"--model_dir",
	type=str,
	default="./mt564_tinyllama_model",
	help="Directory containing fine-tuned model (for upload mode)"
	)
	parser.add_argument(
	"--repo_name",
	type=str,
	help="Repository name on Hugging Face Hub (for upload mode)"
	)
	return parser.parse_args()

	def install_dependencies():
	"""Install required Python packages"""
	try:
	logger.info("Installing dependencies...")

	if os.path.exists("dependencies.txt"):
	subprocess.check_call([sys.executable, "-m", "pip", "install", "-r", "dependencies.txt"])
	logger.info("Dependencies installed successfully")
	else:
	logger.error("dependencies.txt file not found")
	logger.info("You need to install the following packages:")
	logger.info("- torch, transformers, datasets, accelerate")
	logger.info("- huggingface_hub, requests, beautifulsoup4, trafilatura")
	logger.info("- flask, PyPDF2, pdf2image, pytesseract")
	logger.info("Run: pip install torch transformers datasets huggingface_hub accelerate flask")

	return True
	except subprocess.CalledProcessError as e:
	logger.error(f"Error installing dependencies: {e}")
	return False

	def download_model(model_name, output_dir):
	"""Download TinyLlama model"""
	try:
	logger.info(f"Downloading model {model_name}...")

	if not os.path.exists("model/download_tinyllama.py"):
	logger.error("download_tinyllama.py script not found")
	return False

	subprocess.check_call([
	sys.executable,
	"model/download_tinyllama.py",
	"--model_name", model_name,
	"--output_dir", output_dir
	])

	logger.info(f"Model downloaded successfully to {output_dir}")
	return True
	except subprocess.CalledProcessError as e:
	logger.error(f"Error downloading model: {e}")
	return False

	def upload_model(model_dir, repo_name):
	"""Upload fine-tuned model to Hugging Face Hub"""
	try:
	if not repo_name:
	logger.error("Repository name is required for upload mode")
	return False

	if not os.path.exists("model/upload_to_huggingface.py"):
	logger.error("upload_to_huggingface.py script not found")
	return False

	# Check for authentication token
	if "HUGGING_FACE_TOKEN" not in os.environ:
	logger.error("HUGGING_FACE_TOKEN environment variable not set")
	logger.info("You need to set your Hugging Face API token:")
	logger.info("export HUGGING_FACE_TOKEN=your_token_here")
	return False

	logger.info(f"Uploading model from {model_dir} to {repo_name}...")

	subprocess.check_call([
	sys.executable,
	"model/upload_to_huggingface.py",
	"--model_dir", model_dir,
	"--repo_name", repo_name
	])

	logger.info(f"Model uploaded successfully to {repo_name}")
	return True
	except subprocess.CalledProcessError as e:
	logger.error(f"Error uploading model: {e}")
	return False

	def show_guide():
	"""Show guide for using the SWIFT MT564 Documentation Assistant"""
	guide = """
	=================================================
	SWIFT MT564 Documentation Assistant - Setup Guide
	=================================================

	This project helps you build an AI assistant specialized in SWIFT MT564 messages.
	Below is a step-by-step guide to setting up and using this project:

	1. INSTALLATION
	---------------
	Install dependencies:
	python setup.py --mode install

	2. DATA COLLECTION
	-----------------
	Run the ISO20022 scraper:
	python scrapers/iso20022_scraper.py --output_dir ./data/raw

	Process the scraped data:
	python scrapers/data_processor.py --input_dir ./data/raw --output_dir ./data/processed

	3. MODEL PREPARATION
	-------------------
	Download TinyLlama model:
	python setup.py --mode download --model_name TinyLlama/TinyLlama-1.1B-Chat-v1.0 --output_dir ./data/models

	4. TRAINING
	----------
	Train the model on MT564 data:
	python train_mt564_model.py --model_name TinyLlama/TinyLlama-1.1B-Chat-v1.0 --training_data ./data/processed/mt564_training_data.json --output_dir ./mt564_tinyllama_model

	5. DEPLOYMENT
	------------
	Upload model to Hugging Face Hub:
	# First set your Hugging Face token
	export HUGGING_FACE_TOKEN=your_token_here

	# Then upload the model
	python setup.py --mode upload --model_dir ./mt564_tinyllama_model --repo_name your-username/mt564-tinyllama

	6. USING THE MODEL ON HUGGING FACE
	---------------------------------
	Create a Hugging Face Space:
	- Go to huggingface.co
	- Click "New Space"
	- Choose a Gradio or Streamlit template
	- Link to your uploaded model
	- Use the following code in your app.py:

	```python
	import gradio as gr
	from transformers import AutoModelForCausalLM, AutoTokenizer

	# Load your model from Hugging Face Hub
	model_name = "your-username/mt564-tinyllama"
	model = AutoModelForCausalLM.from_pretrained(model_name)
	tokenizer = AutoTokenizer.from_pretrained(model_name)

	def answer_question(question):
	# Format prompt for the chat model
	prompt = f"<\|im_start\|>user\\n{question}<\|im_end\|>\\n<\|im_start\|>assistant\\n"

	# Generate response
	inputs = tokenizer(prompt, return_tensors="pt")
	outputs = model.generate(inputs.input_ids, max_new_tokens=256, temperature=0.7)
	response = tokenizer.decode(outputs[0], skip_special_tokens=True)

	# Extract assistant's response
	try:
	assistant_response = response.split("<\|im_start\|>assistant\\n")[1].split("<\|im_end\|>")[0]
	except:
	assistant_response = response

	return assistant_response

	# Create Gradio interface
	iface = gr.Interface(
	fn=answer_question,
	inputs=gr.Textbox(lines=3, placeholder="Ask a question about SWIFT MT564..."),
	outputs=gr.Textbox(),
	title="SWIFT MT564 Documentation Assistant",
	description="Ask questions about SWIFT MT564 message formats and specifications"
	)

	iface.launch()
	```

	For more details and advanced usage, refer to the README.md.
	"""
	print(guide)
	return True

	def main():
	args = parse_args()

	if args.mode == "install":
	success = install_dependencies()
	elif args.mode == "download":
	success = download_model(args.model_name, args.output_dir)
	elif args.mode == "upload":
	success = upload_model(args.model_dir, args.repo_name)
	else: # guide
	success = show_guide()

	if success:
	logger.info(f"{args.mode.capitalize()} completed successfully")
	else:
	logger.error(f"{args.mode.capitalize()} failed")
	sys.exit(1)

	if __name__ == "__main__":
	main()