# RAG agent with conversation-aware retrieval and enhanced context management.
from typing import List, Dict, Optional, Tuple | |
import uuid | |
from .excel_aware_rag import ExcelAwareRAGAgent | |
from .enhanced_context_manager import EnhancedContextManager | |
from ..llms.base_llm import BaseLLM | |
from src.embeddings.base_embedding import BaseEmbedding | |
from src.vectorstores.base_vectorstore import BaseVectorStore | |
from src.utils.conversation_manager import ConversationManager | |
from src.db.mongodb_store import MongoDBStore | |
from src.models.rag import RAGResponse | |
from src.utils.logger import logger | |
class RAGAgent(ExcelAwareRAGAgent):
    """Retrieval-augmented generation agent with conversation-aware context."""

    def __init__(
        self,
        llm: BaseLLM,
        embedding: BaseEmbedding,
        vector_store: BaseVectorStore,
        mongodb: MongoDBStore,
        max_history_tokens: int = 4000,
        max_history_messages: int = 10
    ):
        """Initialize RAG Agent with enhanced context management.

        Args:
            llm: Language model used to generate answers.
            embedding: Embedding model used to vectorise queries.
            vector_store: Store searched for similar documents.
            mongodb: Persistence layer holding conversation history.
            max_history_tokens: Token budget handed to the conversation manager.
            max_history_messages: Cap on history messages the manager considers.
        """
        super().__init__()  # Initialize ExcelAwareRAGAgent
        # Core collaborators.
        self.llm = llm
        self.embedding = embedding
        self.vector_store = vector_store
        self.mongodb = mongodb
        # Prunes/windows conversation history when building prompts.
        self.conversation_manager = ConversationManager(
            max_tokens=max_history_tokens,
            max_messages=max_history_messages,
        )
        # Enhanced context tracking layered on top of the existing flow.
        self.context_manager = EnhancedContextManager()
        logger.info("RAGAgent initialized with enhanced context management")
    async def generate_response(
        self,
        query: str,
        conversation_id: Optional[str],
        temperature: float,
        max_tokens: Optional[int] = None,
        context_docs: Optional[List[str]] = None,
        stream: bool = False,
        custom_roles: Optional[List[Dict[str, str]]] = None
    ) -> RAGResponse:
        """
        Generate a response with comprehensive context and role management

        Pipeline: role steering -> introduction short-circuit -> history
        retrieval -> query enhancement -> context retrieval/fallback ->
        Excel handling -> prompt build -> LLM generation -> cleaning.

        Args:
            query (str): User query
            conversation_id (Optional[str]): Conversation identifier
            temperature (float): LLM temperature for response generation
            max_tokens (Optional[int]): Maximum tokens for response
            context_docs (Optional[List[str]]): Pre-retrieved context documents
            stream (bool): Whether to stream the response
            custom_roles (Optional[List[Dict[str, str]]]): Custom role instructions

        Returns:
            RAGResponse: Generated response with context and metadata

        Raises:
            Exception: re-raised after logging when any stage of the
                pipeline fails.
        """
        try:
            logger.info(f"Generating response for query: {query}")

            # Apply custom roles if provided: each recognised role name
            # appends steering text to the query before retrieval/generation.
            if custom_roles:
                for role in custom_roles:
                    # Modify query or context based on role
                    if role.get('name') == 'introduction_specialist':
                        query += " Provide a concise, welcoming response."
                    elif role.get('name') == 'knowledge_based_specialist':
                        query += " Ensure response is precise and directly from available knowledge."

            # Introduction Handling: greeting messages are detected by the
            # fixed template substrings the caller embeds in the query.
            is_introduction = (
                "wants support" in query and
                "This is Introduction" in query and
                ("A new user with name:" in query or "An old user with name:" in query)
            )
            if is_introduction:
                logger.info("Processing introduction message")
                welcome_message = self._handle_contact_query(query)
                # Introductions short-circuit the RAG pipeline entirely.
                return RAGResponse(
                    response=welcome_message,
                    context_docs=[],
                    sources=[],
                    scores=None
                )

            # Conversation History Processing
            history = []
            last_context = None
            if conversation_id:
                logger.info(f"Retrieving conversation history for ID: {conversation_id}")
                history = await self.mongodb.get_recent_messages(
                    conversation_id,
                    limit=self.conversation_manager.max_messages
                )

                # Process history for conversation manager
                history = self.conversation_manager.get_relevant_history(
                    messages=history,
                    current_query=query
                )

                # Replay history into the enhanced context manager so it can
                # resolve references (e.g. pronouns) against earlier turns.
                for msg in history:
                    self.context_manager.process_turn(
                        msg.get('query', ''),
                        msg.get('response', '')
                    )

                # Get last context if available
                if history and history[-1].get('response'):
                    last_context = history[-1]['response']

            # Query Enhancement
            enhanced_query = self.context_manager.enhance_query(query)

            # Manual Pronoun Handling Fallback: if the context manager left
            # the query untouched but it contains a pronoun, seed the manager
            # with the last response and retry the enhancement once.
            # NOTE(review): `replacement` is unused — the map only serves as
            # a pronoun detection set here.
            if enhanced_query == query:
                pronoun_map = {
                    'his': 'he',
                    'her': 'she',
                    'their': 'they'
                }
                words = query.lower().split()
                for pronoun, replacement in pronoun_map.items():
                    if pronoun in words:
                        # Try to use last context
                        if last_context:
                            self.context_manager.record_last_context(last_context)
                            enhanced_query = self.context_manager.enhance_query(query)
                        break
            logger.info(f"Enhanced query: {enhanced_query}")

            # Context Retrieval — skipped when the caller supplied documents.
            # NOTE(review): caller-supplied docs arrive without sources/scores.
            if not context_docs:
                logger.info("Retrieving context for enhanced query")
                context_docs, sources, scores = await self.retrieve_context(
                    enhanced_query,
                    conversation_history=history
                )
            else:
                sources = []
                scores = None

            # Context Fallback Mechanism
            if not context_docs:
                # If no context and last context exists, use it
                if last_context:
                    context_docs = [last_context]
                    sources = [{"source": "previous_context"}]
                    scores = [1.0]
                else:
                    logger.info("No relevant context found")
                    return RAGResponse(
                        response="Information about this is not available, do you want to inquire about something else?",
                        context_docs=[],
                        sources=[],
                        scores=None
                    )

            # Excel-specific Content Handling — 'Sheet:' markers flag
            # spreadsheet-derived documents (presumably injected by the
            # Excel ingestion path; confirm against ExcelAwareRAGAgent).
            has_excel_content = any('Sheet:' in doc for doc in context_docs)
            if has_excel_content:
                logger.info("Processing Excel-specific content")
                try:
                    context_docs = self._process_excel_context(context_docs, enhanced_query)
                except Exception as e:
                    # Best-effort: fall back to the unprocessed documents.
                    logger.warning(f"Error processing Excel context: {str(e)}")

            # Prompt Generation with Conversation History
            prompt = self.conversation_manager.generate_prompt_with_history(
                current_query=enhanced_query,
                history=history,
                context_docs=context_docs
            )

            # Streaming Response Generation
            if stream:
                # TODO: Implement actual streaming logic
                # This is a placeholder and needs proper implementation;
                # execution currently falls through to the standard path.
                logger.warning("Streaming not fully implemented")

            # Standard Response Generation
            # NOTE(review): not awaited — assumes BaseLLM.generate is
            # synchronous; confirm against the BaseLLM interface.
            response = self.llm.generate(
                prompt=prompt,
                temperature=temperature,
                max_tokens=max_tokens
            )

            # Response Cleaning
            cleaned_response = self._clean_response(response)

            # Excel Response Enhancement (best-effort: keeps the cleaned
            # response when enhancement fails or returns a falsy value)
            if has_excel_content:
                try:
                    enhanced_response = await self.enhance_excel_response(
                        query=enhanced_query,
                        response=cleaned_response,
                        context_docs=context_docs
                    )
                    if enhanced_response:
                        cleaned_response = enhanced_response
                except Exception as e:
                    logger.warning(f"Error enhancing Excel response: {str(e)}")

            # Context Tracking: record this turn for future reference
            # resolution.
            self.context_manager.process_turn(query, cleaned_response)

            # Metadata Generation
            metadata = {
                'llm_provider': getattr(self.llm, 'model_name', 'unknown'),
                'temperature': temperature,
                'conversation_id': conversation_id,
                'context_sources': sources,
                'has_excel_content': has_excel_content
            }

            logger.info("Successfully generated response")
            return RAGResponse(
                response=cleaned_response,
                context_docs=context_docs,
                sources=sources,
                scores=scores,
                metadata=metadata  # Added metadata
            )
        except Exception as e:
            logger.error(f"Error in generate_response: {str(e)}")
            raise
async def retrieve_context( | |
self, | |
query: str, | |
conversation_history: Optional[List[Dict]] = None, | |
top_k: int = 3 | |
) -> Tuple[List[str], List[Dict], Optional[List[float]]]: | |
"""Retrieve context with both original and enhanced handling""" | |
try: | |
logger.info(f"Retrieving context for query: {query}") | |
# Enhance query using both managers | |
if conversation_history: | |
# Get the last two messages for immediate context | |
recent_messages = conversation_history[-2:] | |
# Extract queries and responses for context | |
context_parts = [] | |
for msg in recent_messages: | |
if msg.get('query'): | |
context_parts.append(msg['query']) | |
if msg.get('response'): | |
response = msg['response'] | |
if "Information about this is not available" not in response: | |
context_parts.append(response) | |
# Combine with current query | |
enhanced_query = f"{' '.join(context_parts)} {query}".strip() | |
logger.info(f"Enhanced query with history: {enhanced_query}") | |
else: | |
enhanced_query = query | |
# Debug log the enhanced query | |
logger.info(f"Final enhanced query: {enhanced_query}") | |
# Embed the enhanced query | |
query_embedding = self.embedding.embed_query(enhanced_query) | |
# Debug log embedding shape | |
logger.info(f"Query embedding shape: {len(query_embedding)}") | |
# Retrieve similar documents | |
results = self.vector_store.similarity_search( | |
query_embedding, | |
top_k=top_k | |
) | |
# Debug log search results | |
logger.info(f"Number of search results: {len(results)}") | |
for i, result in enumerate(results): | |
logger.info(f"Result {i} score: {result.get('score', 'N/A')}") | |
logger.info(f"Result {i} text preview: {result.get('text', '')[:100]}...") | |
if not results: | |
logger.info("No results found in similarity search") | |
return [], [], None | |
# Process results | |
documents = [doc['text'] for doc in results] | |
sources = [self._convert_metadata_to_strings(doc['metadata']) | |
for doc in results] | |
scores = [doc['score'] for doc in results | |
if doc.get('score') is not None] | |
# Return scores only if available for all documents | |
if len(scores) != len(documents): | |
scores = None | |
logger.info(f"Retrieved {len(documents)} relevant documents") | |
return documents, sources, scores | |
except Exception as e: | |
logger.error(f"Error in retrieve_context: {str(e)}") | |
raise | |
def _clean_response(self, response: str) -> str: | |
"""Clean response text while preserving key information""" | |
if not response: | |
return response | |
# Keep only the most common phrases to remove | |
phrases_to_remove = [ | |
"Based on the context,", | |
"According to the documents,", | |
"From the information available,", | |
"Based on the provided information,", | |
"I apologize," | |
] | |
cleaned_response = response | |
for phrase in phrases_to_remove: | |
cleaned_response = cleaned_response.replace(phrase, "").strip() | |
cleaned_response = " ".join(cleaned_response.split()) | |
if not cleaned_response: | |
return response | |
if cleaned_response[0].islower(): | |
cleaned_response = cleaned_response[0].upper() + cleaned_response[1:] | |
return cleaned_response | |
def _convert_metadata_to_strings(self, metadata: Dict) -> Dict: | |
"""Convert metadata values to strings""" | |
try: | |
return { | |
key: str(value) if isinstance(value, (int, float)) else value | |
for key, value in metadata.items() | |
} | |
except Exception as e: | |
logger.error(f"Error converting metadata: {str(e)}") | |
return metadata | |
def _handle_contact_query(self, query: str) -> str: | |
"""Handle contact/introduction queries""" | |
try: | |
name_start = query.find('name: "') + 7 | |
name_end = query.find('"', name_start) | |
name = query[name_start:name_end] if name_start > 6 and name_end != -1 else "there" | |
is_returning = ( | |
"An old user with name:" in query and | |
"wants support again" in query | |
) | |
return f"Welcome back {name}, How can I help you?" if is_returning else f"Welcome {name}, How can I help you?" | |
except Exception as e: | |
logger.error(f"Error handling contact query: {str(e)}") | |
return "Welcome, How can I help you?" |