import asyncio
from aiohttp import web, WSMsgType
from google import genai
from google.genai import types
from PyPDF2 import PdfReader
from sentence_transformers import SentenceTransformer
import faiss
import numpy as np
import os
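# Assumed dependencies (not pinned in the source; a likely requirements.txt sketch):
#   aiohttp, google-genai, PyPDF2, sentence-transformers, faiss-cpu, numpy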
def load_pdf_chunks(pdf_path, max_chunk_length=500):
    # Extract text from every page of the PDF
    reader = PdfReader(pdf_path)
    full_text = ""
    for page in reader.pages:
        text = page.extract_text()
        if text:
            full_text += text + "\n"
    # Split into smaller fixed-size character chunks
    chunks = [full_text[i:i + max_chunk_length] for i in range(0, len(full_text), max_chunk_length)]
    return chunks
# Load and chunk the resume once at startup
PDF_PATH = "resume.pdf"
chunks = load_pdf_chunks(PDF_PATH)

# Embed the chunks and build an in-memory FAISS index (exact L2 search)
embedding_model = SentenceTransformer('all-MiniLM-L6-v2')
chunk_embeddings = embedding_model.encode(chunks, convert_to_numpy=True)
dimension = chunk_embeddings.shape[1]
index = faiss.IndexFlatL2(dimension)
index.add(chunk_embeddings)
def retrieve_context(query, top_k=7):
    # Embed the query and return the top_k chunks nearest to it in the index
    query_embedding = embedding_model.encode([query], convert_to_numpy=True)
    distances, indices = index.search(query_embedding, top_k)
    return [chunks[i] for i in indices[0]]
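# Illustration only (hypothetical query):
#   retrieve_context("What are Soumyajit's skills?")
# returns up to top_k resume chunks closest to the query in embedding space.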
GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
if not GEMINI_API_KEY:
    raise ValueError("GEMINI_API_KEY environment variable not set!")

# Initialize Gemini client
client = genai.Client(api_key=GEMINI_API_KEY)
model = "gemini-2.0-flash-live-001"
config = types.LiveConnectConfig(
    response_modalities=["TEXT"],
    system_instruction=types.Content(
        parts=[
            types.Part.from_text(
                text=(
                    "You are Soumyajit's AI Assistant, a chatbot on Soumyajit's "
                    "profile website. Act like a professional AI assistant and "
                    "answer precisely in at most 2-3 lines."
                )
            )
        ],
        role="user"
    )
)
# WebSocket handler
async def ws_handler(request):
    ws = web.WebSocketResponse()
    await ws.prepare(request)

    # One Gemini Live session per WebSocket connection
    async with client.aio.live.connect(model=model, config=config) as session:
        async for msg in ws:
            if msg.type == WSMsgType.TEXT:
                user_query = msg.data

                # RAG retrieval: fetch the resume chunks most relevant to the query
                retrieved_docs = retrieve_context(user_query)
                context_text = "\n".join(retrieved_docs)

                # Combine retrieved context and the question into the final prompt
                final_prompt = f"Context:\n{context_text}\n\nQuestion:\n{user_query}"

                await session.send_client_content(
                    turns={"role": "user", "parts": [{"text": final_prompt}]},
                    turn_complete=True
                )

                # Collect the streamed reply and send it back as a single message
                full_response = ""
                async for response in session.receive():
                    if response.text:
                        full_response += response.text
                await ws.send_str(full_response)
            elif msg.type == WSMsgType.ERROR:
                print("WebSocket connection closed with exception:", ws.exception())

    return ws
# Health check
async def health_check(request):
    return web.Response(text="OK")

# Main app setup
app = web.Application()
app.router.add_get("/", health_check)
app.router.add_get("/ws", ws_handler)  # WebSocket endpoint
if __name__ == "__main__":
    port = int(os.environ.get("PORT", 7860))  # Hugging Face uses 7860
    web.run_app(app, port=port, host="0.0.0.0")
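# Minimal sketch of a local test client, assuming the third-party `websockets`
# package is installed (it is not used by the app above); the question text is
# purely illustrative:
#
#   import asyncio
#   import websockets
#
#   async def main():
#       # Connect to the /ws endpoint and ask one question
#       async with websockets.connect("ws://localhost:7860/ws") as ws:
#           await ws.send("What is Soumyajit's current role?")
#           print(await ws.recv())
#
#   asyncio.run(main())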