Spaces:

ashmib
/

green-city-finder

Sleeping

Ashmi Banerjee

updates to the s-fairness calculation and refactoring code duplication

ac20456 5 months ago

3.67 kB

	"""
	Main file to execute the TRS Pipeline.
	"""
	import sys
	from augmentation import prompt_generation as pg
	from information_retrieval import info_retrieval as ir
	from text_generation.models import (
	Llama3,
	Mistral,
	Gemma2,
	Llama3Point1,
	Llama3Instruct,
	MistralInstruct,
	Llama3Point1Instruct,
	Phi3SmallInstruct,
	GPT4,
	Gemini,
	)
	from text_generation import text_generation as tg
	import logging

	# Module-level logger named after this module.
	logger = logging.getLogger(__name__)
	# Configure the root logger at import time: DEBUG level, UTF-8 encoding.
	# NOTE: the `encoding` keyword of basicConfig requires Python 3.9+.
	logging.basicConfig(encoding='utf-8', level=logging.DEBUG)

	# Relative path of the tests directory (not referenced by the code shown in this file view).
	TEST_DIR = "../tests/"
	# Maps the model names accepted by pipeline() (its `model_name` argument) to the
	# model classes imported from text_generation.models.
	MODELS = {
	'GPT-4': GPT4,
	'Llama3': Llama3,
	'Mistral': Mistral,
	'Gemma2': Gemma2,
	'Llama3.1': Llama3Point1,
	'Llama3-Instruct': Llama3Instruct,
	'Mistral-Instruct': MistralInstruct,
	'Llama3.1-Instruct': Llama3Point1Instruct,
	'Phi3-Instruct': Phi3SmallInstruct,
	'Gemini-1.0-pro': Gemini,
	}


	def pipeline(starting_point: str, query: str, model_name: str, test: int = 0, **params):
	    """
	    Executes the entire RAG pipeline: retrieves context, augments the prompt with it
	    and generates a response with the selected model.

	    Args:
	    - starting_point: str, forwarded unchanged to ``ir.get_context``
	    - query: str, the user query; used for both retrieval and prompt augmentation
	    - model_name: str, one of the keys of ``MODELS`` (e.g. 'GPT-4', 'Llama3', 'Llama3.1-Instruct')
	    - test: whether the pipeline is running a test (any truthy value enables test mode)
	    - params: optional overrides for the context parameters; other keys are ignored
	        - limit (number of results to be retained), defaults to 5
	        - reranking (binary, whether to rerank results using ColBERT or not), defaults to 0
	        - sustainability, defaults to 0

	    Returns:
	    - None if any of the three stages raises; the error is logged instead of propagated.
	    - Otherwise the generated response; in test mode a tuple
	      ``(retrieved_cities, prompt[1]['content'], response)``.

	    Raises:
	    - KeyError: if ``model_name`` is not a key of ``MODELS``.
	    """

	    model = MODELS[model_name]

	    context_params = {
	        'limit': 5,
	        'reranking': 0,
	        'sustainability': 0,
	    }
	    # Only the known context parameters may be overridden by the caller.
	    context_params.update({key: params[key] for key in context_params if key in params})

	    logger.info("Retrieving context..")
	    try:
	        context = ir.get_context(starting_point=starting_point, query=query, **context_params)
	        # The list of retrieved cities is only needed for the test-mode return value.
	        retrieved_cities = ir.get_cities(context) if test else None
	    except Exception as e:
	        logger.error(f"Error at line {e.__traceback__.tb_lineno} while trying to get context: {e}")
	        return None

	    logger.info("Retrieved context, augmenting prompt..")
	    try:
	        prompt = pg.augment_prompt(
	            query=query,
	            context=context,
	            params=context_params,
	        )
	    except Exception as e:
	        logger.error(f"Error at line {e.__traceback__.tb_lineno} while trying to augment prompt: {e}")
	        return None

	    logger.info(f"Augmented prompt, initializing {model} and generating response..")
	    try:
	        response = tg.generate_response(model, prompt)
	    except Exception as e:
	        # Logged at ERROR level, consistent with the retrieval and augmentation stages.
	        logger.error(f"Error at line {e.__traceback__.tb_lineno} while generating response: {e}")
	        return None

	    if test:
	        # NOTE(review): presumably `prompt` is a list of chat messages and index 1 is the
	        # user message -- confirm against pg.augment_prompt.
	        return retrieved_cities, prompt[1]['content'], response

	    return response


	if __name__ == "__main__":
	    # Manual smoke run of the pipeline with a sample query.
	    # Alternative sample query:
	    # "I'm planning a trip in the summer and I love art, history, and visiting museums. Can you
	    # suggest some European cities? "
	    sample_query = (
	        "I'm planning a trip in July and enjoy beaches, nightlife, and vibrant cities. Recommend some "
	        "cities. "
	    )
	    # pipeline() requires `starting_point`; omitting it raises TypeError before anything runs.
	    # NOTE(review): "Munich" is a placeholder value -- confirm the format ir.get_context expects.
	    sample_starting_point = "Munich"
	    model = "GPT-4"

	    pipeline_response = pipeline(
	        starting_point=sample_starting_point,
	        query=sample_query,
	        model_name=model,
	        sustainability=1,
	    )

	    print(pipeline_response)