Spaces:

ashmib
/

green-city-finder

Running

green-city-finder / src / augmentation / prompt_generation.py

Ashmi Banerjee

update sustainability prompt and post processing

adbebe0 8 months ago

5.16 kB

	from src.information_retrieval import info_retrieval as ir
	import logging

	# Module-level logger named after this module.
	logger = logging.getLogger(__name__)
	# Configures the root logger as a side effect of importing this module (DEBUG level).
	# NOTE(review): per the logging docs, `encoding` is only used together with `filename`,
	# so it presumably has no effect on the default stream handler here - confirm.
	logging.basicConfig(encoding='utf-8', level=logging.DEBUG)
	from src.augmentation.prompts import SYSTEM_PROMPT, SUSTAINABILITY_PROMPT, USER_PROMPT

	def generate_prompt(query, context, template=None):
	    """
	    Build the chat messages (system + user) that are sent to the LLM.

	    The system message is `template` when a truthy one is supplied, otherwise the
	    imported SYSTEM_PROMPT. The user message is USER_PROMPT filled positionally
	    with `query` and `context`.

	    Args:
	        - query: str; the user query
	        - context: the retrieved context placed into the user prompt
	          (augment_prompt passes the string produced by format_context)
	        - template: str, optional; system prompt overriding SYSTEM_PROMPT

	    Returns:
	        list[dict]; two messages with "role" and "content" keys, system first.
	    """
	    system_content = template or SYSTEM_PROMPT
	    user_content = USER_PROMPT.format(query, context)

	    return [
	        {"role": "system", "content": system_content},
	        {"role": "user", "content": user_content},
	    ]


	def format_context(context):
	    """
	    Function that formats the retrieved context in a way that is easy for the LLM to understand.

	    Each city becomes one "Option N" paragraph: an introductory sentence, the
	    sustainability sentence (when the city has a "sustainability" entry), the
	    general description and then the attraction / food / hotel listings.

	    Args:
	        - context: dict; maps a city name to its info dict. The info dict is read
	          for the keys 'country', 'text', optionally 'listings' (a list of dicts with
	          'type', 'name' and 'description') and optionally 'sustainability' (a dict
	          with 'month' and 's-fairness').

	    Returns:
	        str; the concatenated city paragraphs, each followed by "\n\n ". An empty
	        context yields an empty string.
	    """
	    attraction_types = ('see', 'do', 'go', 'view')
	    dining_types = ('eat', 'drink')

	    formatted_cities = []

	    for option_number, (city, info) in enumerate(context.items(), start=1):
	        attractions, restaurants, hotels = [], [], []

	        # A missing or empty 'listings' entry simply produces no listing sections.
	        for listing in info.get('listings') or []:
	            entry = f"{listing['name']} ({listing['description']})"
	            listing_type = listing['type']
	            if listing_type in attraction_types:
	                attractions.append(entry)
	            elif listing_type in dining_types:
	                restaurants.append(entry)
	            else:
	                # NOTE(review): every other listing type is reported as a hotel;
	                # confirm that the data contains no further types (e.g. shopping).
	                hotels.append(entry)

	        # Trailing space keeps this sentence separated from whatever follows it.
	        parts = [f"Option {option_number}: {city} is a city in {info['country']}. "]

	        # If we add sustainability in the end then it could get truncated because of context window
	        if "sustainability" in info:
	            sustainability = info['sustainability']
	            if sustainability['month'] == 'No data available':
	                parts.append("This city has no sustainability (or s-fairness) score available. \n ")
	            else:
	                parts.append(
	                    f"The sustainability (or s-fairness) score for {city} in {sustainability['month']} "
	                    f"is {sustainability['s-fairness']}. \n "
	                )

	        parts.append(f"Here is some information about the city. {info['text']}")

	        # Only sections that actually have entries are emitted.
	        if attractions:
	            parts.append(f"\nHere are some attractions: {', '.join(attractions)}")
	        if restaurants:
	            parts.append(f"\nHere are some places to eat/drink: {', '.join(restaurants)}")
	        if hotels:
	            parts.append(f"\nHere are some hotels: {', '.join(hotels)}")

	        formatted_cities.append("".join(parts) + "\n\n ")

	    return "".join(formatted_cities)


	def augment_prompt(query: str, starting_point: str, context: dict, **params: dict):
	    """
	    Function that augments the user query with the retrieved context and returns the
	    chat messages that can be passed to the LLM.

	    Args:
	        - query: str; the user query
	        - starting_point: str; prepended to the query as
	          "With <starting_point> as the starting point, <query>"
	        - context: dict; retrieved context. It is run through format_context here,
	          otherwise the LLM cannot understand the nested dictionaries!
	        - params: keyword arguments; the options dict is expected under the keyword
	          ``params`` (i.e. ``augment_prompt(..., params={...})``). If that dict has a
	          truthy 'sustainability' entry, SUSTAINABILITY_PROMPT is used as the system
	          prompt so that the LLM uses s-fairness scores while generating the answer.

	    Returns:
	        The message list produced by generate_prompt.
	    """

	    # TODO: what about the cities without s-fairness scores? i.e. they don't have seasonality data
	    updated_query = f"With {starting_point} as the starting point, {query}"

	    # format context
	    formatted_context = format_context(context)

	    # Tolerate callers that omit the ``params`` keyword instead of raising KeyError;
	    # they simply get the default (non-sustainability) system prompt.
	    options = params.get("params") or {}

	    if options.get("sustainability"):
	        return generate_prompt(updated_query, formatted_context, SUSTAINABILITY_PROMPT)

	    return generate_prompt(updated_query, formatted_context)


	def test():
	    """
	    Manual smoke test: retrieves context for a sample query and builds the prompt
	    once without and once with the sustainability option.

	    Returns:
	        The messages built with the sustainability option enabled.
	    """
	    context_params = {
	        'limit': 3,
	        'reranking': 0,
	        'sustainability': 0,
	    }

	    query = "Suggest some places to visit during winter. I like hiking, nature and the mountains and I enjoy skiing " \
	            "in winter. "

	    # augment_prompt requires a starting point; without it both calls below raise
	    # TypeError. Any sample city works for this smoke test.
	    starting_point = "Munich"

	    # without sustainability
	    context = ir.get_context(query, **context_params)

	    without_sfairness = augment_prompt(
	        query=query,
	        starting_point=starting_point,
	        context=context,
	        params=context_params,
	    )
	    # Only the sustainability variant is returned; log this one so it can still be inspected.
	    logger.debug("Prompt without sustainability: %s", without_sfairness)

	    # with sustainability
	    context_params.update({'sustainability': 1})
	    s_context = ir.get_context(query, **context_params)

	    with_sfairness = augment_prompt(
	        query=query,
	        starting_point=starting_point,
	        context=s_context,
	        params=context_params,
	    )

	    return with_sfairness


	if __name__ == "__main__":
	    # Script entry point: run the smoke test and print the prompt it returns.
	    print(test())