Spaces:

CandidAI
/

ask-candid

Running

App Files Files Community

ask-candid / ask_candid /tools /recommendation.py

brainsqueeze

Adding optional news data source

bea5044 verified 3 months ago

raw

history blame contribute delete

8.51 kB

	import os

	from openai import OpenAI
	from langchain_core.prompts import ChatPromptTemplate
	import requests

	from ask_candid.agents.schema import AgentState, Context
	from ask_candid.base.api_base import BaseAPI

	class AutocodingAPI(BaseAPI):
	def __init__(self):
	super().__init__(
	url=os.getenv("AUTOCODING_API_URL"),
	headers={
	'x-api-key': os.getenv("AUTOCODING_API_KEY"),
	'Content-Type': 'application/json'
	}
	)

	def __call__(self, text: str, taxonomy: str = 'pcs-v3'):
	params = {
	'text': text,
	'taxonomy': taxonomy
	}
	return self.get(**params)

	class GeoAPI(BaseAPI):
	def __init__(self):
	super().__init__(
	url=os.getenv("GEO_API_URL"),
	headers={
	'x-api-key': os.getenv("GEO_API_KEY"),
	'Content-Type': 'application/json'
	}
	)

	def __call__(self, text: str):
	payload = {
	'text': text
	}
	return self.post(payload=payload)

	class EntitiesAPI(BaseAPI):
	def __init__(self):
	super().__init__(
	url=f'{os.getenv("DOCUMENT_API_URL")}/entities',
	headers={
	'x-api-key': os.getenv("DOCUMENT_API_KEY"),
	'Content-Type': 'application/json'
	}
	)

	def __call__(self, text: str):
	payload = {
	'text': text
	}
	return self.post(payload=payload)



	class FunderRecommendationAPI(BaseAPI):
	def __init__(self):
	super().__init__(
	url=os.getenv("FUNDER_REC_API_URL"),
	headers={"x-api-key": os.getenv("FUNDER_REC_API_KEY")}
	)

	def __call__(self, subjects, populations, geos):
	params = {
	"subjects": subjects,
	"populations": populations,
	"geos": geos
	}
	return self.get(**params)

	class RFPRecommendationAPI(BaseAPI):
	def __init__(self):
	super().__init__(
	url= f'{os.getenv("FUNDER_REC_API_URL")}/rfp',
	headers={"x-api-key": os.getenv("FUNDER_REC_API_KEY")}
	)

	def __call__(self, org_id, subjects, populations, geos):
	params = {
	"candid_entity_id": org_id,
	"subjects": subjects,
	"populations": populations,
	"geos": geos
	}
	return self.get(**params)




	def detect_intent_with_llm(state: AgentState, llm) -> AgentState:
	"""Detect query intent (which type of recommendation) and update the state using the specified LLM."""
	print("running detect intent")

	query = state["messages"][-1].content

	prompt_template = ChatPromptTemplate.from_messages(
	[
	("system", """
	Please classify the following query by stating ONLY the category name: 'none', 'funder', or 'rfp'.
	Please answer WITHOUT any reasoning.
	- 'none': The query does not ask for any recommendations.
	- 'funder': The query asks for recommendations about funders, such as foundations or donors.
	- 'rfp': The query asks for recommendations about specific Requests for Proposals (RFPs).

	Consider:
	- If the query seeks broad, long-term funding sources or organizations, classify as 'funder'.
	- If the query seeks specific, time-bound funding opportunities with a deadline, classify as 'rfp'.
	- If the query does not seek any recommendations, classify as 'none'.

	Query: """),
	("human", f"{query}")
	]
	)

	chain = prompt_template \| llm
	response = chain.invoke({"query": query})

	intent = response.content.strip().lower()
	state["intent"] = intent.strip("'").strip('"') # Remove extra quotes if necessary
	print(state["intent"])
	return state


	def determine_context(state: AgentState) -> AgentState:
	print("running context")
	query = state["messages"][-1].content

	autocoding_api = AutocodingAPI()
	entities_api = EntitiesAPI()

	subject_codes, population_codes, geo_ids = [], [], []

	try:
	autocoding_response = autocoding_api(text=query)
	returned_pcs = autocoding_response.get("data", {})
	population_codes = [item['full_code'] for item in returned_pcs.get("population", [])]
	subject_codes = [item['full_code'] for item in returned_pcs.get("subject", [])]
	except Exception as e:
	print(f"Failed to retrieve autocoding data: {e}")

	try:
	geo_response = entities_api(text=query)
	entities = geo_response.get('entities', [])
	geo_ids = [match['geonames_id'] for entity in entities if entity['type'] == 'geo' and 'match' in entity
	for match in entity['match'] if 'geonames_id' in match]
	except Exception as e:
	print(f"Failed to retrieve geographic data: {e}")

	state["context"] = Context(
	subject=subject_codes,
	population=population_codes,
	geography=geo_ids
	)
	return state



	def format_recommendations(intent, data):
	if 'recommendations' not in data:
	return "No recommendations available."

	recommendations = data['recommendations']
	if not recommendations:
	return "No recommendations found."

	recommendation_texts = []
	if intent == "funder":
	for rec in recommendations:
	main_sort_name = rec['funder_data']['main_sort_name']
	profile_url = f"https://app.candid.org/profile/{rec['funder_id']}"
	recommendation_texts.append(f"{main_sort_name} - Profile: {profile_url}")
	elif intent == "rfp":
	for rec in recommendations:
	title = rec.get('title', 'N/A')
	funder_name = rec.get('funder_name', 'N/A')
	amount = rec.get('amount', 'Not specified')
	description = rec.get('description', 'No description available')
	deadline = rec.get('deadline', 'No deadline provided')
	application_url = rec.get('application_url', 'No URL available')
	text = (f"Title: {title}\n"
	f"Funder: {funder_name}\n"
	f"Amount: {amount}\n"
	f"Description: {description}\n"
	f"Deadline: {deadline}\n"
	f"Application URL: {application_url}\n")
	recommendation_texts.append(text)
	else:
	return "Only funder recommendation or RFP recommendation are supported."

	return "\n".join(recommendation_texts)



	def make_recommendation(state: AgentState) -> AgentState:
	print("running recommendation")
	org_id = "6908122" # Example organization ID (Candid)
	funder_or_rfp = state["intent"]

	contexts = state["context"]
	subject_codes = ",".join(contexts.get("subject", []))
	population_codes = ",".join(contexts.get("population", []))
	geo_ids = ",".join([str(geo) for geo in contexts.get("geography", [])])

	recommendation_display_text = ""

	try:
	if funder_or_rfp == "funder":
	funder_api = FunderRecommendationAPI()
	recommendations = funder_api(subject_codes, population_codes, geo_ids)
	elif funder_or_rfp == "rfp":
	rfp_api = RFPRecommendationAPI()
	recommendations = rfp_api(org_id, subject_codes, population_codes, geo_ids)
	else:
	recommendation_display_text = "Unknown intent. Intent 'funder' or 'rfp' expected."
	state["recommendation"] = recommendation_display_text
	return state

	if recommendations:
	recommendation_display_text = format_recommendations(funder_or_rfp, recommendations)
	else:
	recommendation_display_text = "No recommendations were found for your query. Please try refining your search criteria."

	except requests.exceptions.HTTPError as e:
	# Handle HTTP errors raised by raise_for_status()
	print(f"HTTP error occurred: {e.response.status_code} - {e.response.reason}")
	recommendation_display_text = "HTTP error occurred, please report this to datascience@candid.org"
	except Exception as e:
	# Catch-all for any other exceptions that are not HTTP errors
	print(f"An unexpected error occurred: {str(e)}")
	recommendation_display_text = "Unexpected error occurred, please report this to datascience@candid.org"

	state["recommendation"] = recommendation_display_text
	return state