| """ | |
| ViettelPay AI Agent using LangGraph | |
| Multi-turn conversation support with short-term memory using InMemorySaver | |
| """ | |
| import os | |
| from typing import Dict, Optional | |
| from functools import partial | |
| from langgraph.graph import StateGraph, END | |
| from langgraph.checkpoint.memory import InMemorySaver | |
| from langchain_core.messages import HumanMessage | |
from src.agent.nodes import (
    ViettelPayState,
    classify_intent_node,
    query_enhancement_node,
    knowledge_retrieval_node,
    script_response_node,
    generate_response_node,
    route_after_intent_classification,
    route_after_query_enhancement,
    route_after_knowledge_retrieval,
)

# Import configuration utilities
from src.utils.config import get_knowledge_base_path, get_llm_provider

class ViettelPayAgent:
    """Main ViettelPay AI Agent using a LangGraph workflow with multi-turn conversation support."""

    def __init__(
        self,
        knowledge_base_path: Optional[str] = None,
        scripts_file: Optional[str] = None,
        llm_provider: Optional[str] = None,
    ):
        knowledge_base_path = knowledge_base_path or get_knowledge_base_path()
        scripts_file = scripts_file or "./viettelpay_docs/processed/kich_ban.csv"
        llm_provider = llm_provider or get_llm_provider()

        self.knowledge_base_path = knowledge_base_path
        self.scripts_file = scripts_file
        self.llm_provider = llm_provider

        # Initialize the LLM client once during agent creation
        print(f"🧠 Initializing LLM client ({self.llm_provider})...")
        from src.llm.llm_client import LLMClientFactory

        self.llm_client = LLMClientFactory.create_client(self.llm_provider)
        print("✅ LLM client initialized and ready")
        # Initialize the knowledge retriever once during agent creation
        print("📚 Initializing knowledge retriever...")
        try:
            from src.knowledge_base.viettel_knowledge_base import ViettelKnowledgeBase

            self.knowledge_base = ViettelKnowledgeBase()
            ensemble_retriever = self.knowledge_base.load_knowledge_base(
                knowledge_base_path
            )
            if not ensemble_retriever:
                raise ValueError(
                    f"Knowledge base not found at {knowledge_base_path}. Run build_database_script.py first."
                )
            print("✅ Knowledge retriever initialized and ready")
        except Exception as e:
            print(f"⚠️ Knowledge retriever initialization failed: {e}")
            self.knowledge_base = None

        # Checkpointer for short-term conversation memory
        self.checkpointer = InMemorySaver()

        # Build the workflow with pre-initialized components
        self.workflow = self._build_workflow()
        self.app = self.workflow.compile(checkpointer=self.checkpointer)

        print("✅ ViettelPay Agent initialized with multi-turn conversation support")

    def _build_workflow(self) -> StateGraph:
        """Build the LangGraph workflow with pre-initialized components."""
        workflow = StateGraph(ViettelPayState)

        # Bind pre-initialized components to the node functions with
        # functools.partial, so nodes don't re-initialize them on every call.
        classify_intent_with_llm = partial(
            classify_intent_node, llm_client=self.llm_client
        )
        query_enhancement_with_llm = partial(
            query_enhancement_node, llm_client=self.llm_client
        )
        knowledge_retrieval_with_retriever = partial(
            knowledge_retrieval_node, knowledge_retriever=self.knowledge_base
        )
        generate_response_with_llm = partial(
            generate_response_node, llm_client=self.llm_client
        )

        # Add nodes (some with pre-bound components, some without)
        workflow.add_node("classify_intent", classify_intent_with_llm)
        workflow.add_node("query_enhancement", query_enhancement_with_llm)
        workflow.add_node("knowledge_retrieval", knowledge_retrieval_with_retriever)
        workflow.add_node("script_response", script_response_node)  # no pre-bound components needed
        workflow.add_node("generate_response", generate_response_with_llm)

        # Set entry point
        workflow.set_entry_point("classify_intent")

        # Conditional routing after intent classification
        workflow.add_conditional_edges(
            "classify_intent",
            route_after_intent_classification,
            {
                "script_response": "script_response",
                "query_enhancement": "query_enhancement",
            },
        )

        # Script responses go directly to END; knowledge questions flow through
        # enhancement, retrieval, and response generation.
        workflow.add_edge("script_response", END)
        workflow.add_edge("query_enhancement", "knowledge_retrieval")
        workflow.add_edge("knowledge_retrieval", "generate_response")
        workflow.add_edge("generate_response", END)

        print("🔄 LangGraph workflow built successfully with optimized component usage")
        return workflow
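
    # Workflow topology, reconstructed from the edges above for reference:
    #
    #   classify_intent ──┬──► script_response ──────────────────────► END
    #                     └──► query_enhancement ──► knowledge_retrieval
    #                                                        │
    #                                                        ▼
    #                                              generate_response ──► END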

    def process_message(self, user_message: str, thread_id: str = "default") -> Dict:
        """Process a user message in a multi-turn conversation."""
        print(f"\n💬 Processing message: '{user_message}' (thread: {thread_id})")
        print("=" * 50)

        # The thread_id scopes the checkpointer's conversation memory
        config = {"configurable": {"thread_id": thread_id}}

        try:
            human_message = HumanMessage(content=user_message)

            # Initialize state with the new message. conversation_context is
            # reset to None so it is recomputed from the fresh message history.
            initial_state = {
                "messages": [human_message],
                "intent": None,
                "confidence": None,
                "enhanced_query": None,
                "retrieved_docs": None,
                "conversation_context": None,
                "response_type": None,
                "error": None,
                "processing_info": None,
            }

            # Run the workflow with memory
            result = self.app.invoke(initial_state, config)
            # Extract the response from the last message (the AI reply)
            messages = result.get("messages", [])
            if messages:
                last_message = messages[-1]
                if hasattr(last_message, "content"):
                    response = last_message.content
                else:
                    response = str(last_message)
            else:
                response = "Xin lỗi, em không thể xử lý yêu cầu này."

            response_type = result.get("response_type", "unknown")
            intent = result.get("intent", "unknown")
            confidence = result.get("confidence", 0.0)
            enhanced_query = result.get("enhanced_query", "")
            error = result.get("error")

            # Build the response info
            response_info = {
                "response": response,
                "intent": intent,
                "confidence": confidence,
                "response_type": response_type,
                "enhanced_query": enhanced_query,
                "success": error is None,
                "error": error,
                "thread_id": thread_id,
                "message_count": len(messages),
            }

            print("✅ Response generated successfully")
            print(f"   Intent: {intent} (confidence: {confidence})")
            print(f"   Type: {response_type}")
            if enhanced_query and enhanced_query != user_message:
                print(f"   Enhanced query: {enhanced_query}")
            print(f"   Thread: {thread_id}")

            return response_info
        except Exception as e:
            print(f"❌ Workflow error: {e}")
            return {
                "response": "Xin lỗi, em gặp lỗi kỹ thuật. Vui lòng thử lại sau.",
                "intent": "error",
                "confidence": 0.0,
                "response_type": "error",
                "enhanced_query": "",
                "success": False,
                "error": str(e),
                "thread_id": thread_id,
                "message_count": 0,
            }

    def chat(self, user_message: str, thread_id: str = "default") -> str:
        """Simple chat interface - returns just the response text."""
        result = self.process_message(user_message, thread_id)
        return result["response"]
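
    # Usage sketch (the thread id is arbitrary; "user-123" is just an example):
    #   agent = ViettelPayAgent()
    #   reply = agent.chat("Mã lỗi 606 là gì?", thread_id="user-123")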

    def get_conversation_history(self, thread_id: str = "default") -> list:
        """Get conversation history for a specific thread."""
        try:
            config = {"configurable": {"thread_id": thread_id}}

            # Read the current checkpointed state to access the message history
            current_state = self.app.get_state(config)

            if current_state and current_state.values.get("messages"):
                messages = current_state.values["messages"]
                history = []
                for msg in messages:
                    if hasattr(msg, "type") and hasattr(msg, "content"):
                        role = "user" if msg.type == "human" else "assistant"
                        history.append({"role": role, "content": msg.content})
                    elif hasattr(msg, "role") and hasattr(msg, "content"):
                        history.append({"role": msg.role, "content": msg.content})
                return history
            else:
                return []
        except Exception as e:
            print(f"❌ Error getting conversation history: {e}")
            return []
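
    # Returned shape, e.g.:
    #   [{"role": "user", "content": "Mã lỗi 606 là gì?"},
    #    {"role": "assistant", "content": "..."}]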

    def clear_conversation(self, thread_id: str = "default") -> bool:
        """Clear conversation history for a specific thread."""
        try:
            # Note: InMemorySaver doesn't expose a direct clear method here;
            # conversations are cleared when the app restarts. For persistent
            # memory you would need to implement clearing yourself.
            print(f"📝 Conversation clearing requested for thread: {thread_id}")
            print("   Note: InMemorySaver conversations clear on app restart")
            return True
        except Exception as e:
            print(f"❌ Error clearing conversation: {e}")
            return False
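
    # Sketch (assumption): newer langgraph-checkpoint releases add a
    # delete_thread(thread_id) method to checkpointers. If your installed
    # version has it, clear_conversation could actually drop the thread:
    #   if hasattr(self.checkpointer, "delete_thread"):
    #       self.checkpointer.delete_thread(thread_id)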

    def get_workflow_info(self) -> Dict:
        """Get information about the workflow structure."""
        return {
            "nodes": [
                "classify_intent",
                "query_enhancement",
                "knowledge_retrieval",
                "script_response",
                "generate_response",
            ],
            "entry_point": "classify_intent",
            "knowledge_base_path": self.knowledge_base_path,
            "scripts_file": self.scripts_file,
            "llm_provider": self.llm_provider,
            "memory_type": "InMemorySaver",
            "multi_turn": True,
            "query_enhancement": True,
            "optimizations": {
                "llm_client": "Single initialization with functools.partial",
                "knowledge_retriever": "Single initialization with functools.partial",
                "conversation_context": "Cached in state to avoid repeated computation",
            },
        }

    def health_check(self) -> Dict:
        """Check whether all components are working."""
        health_status = {
            "agent": True,
            "workflow": True,
            "memory": True,
            "llm": False,
            "knowledge_base": False,
            "scripts": False,
            "overall": False,
        }

        try:
            # Test the LLM client (already initialized)
            test_response = self.llm_client.generate("Hello", temperature=0.1)
            health_status["llm"] = bool(test_response)
            print("✅ LLM client working")
        except Exception as e:
            print(f"⚠️ LLM health check failed: {e}")
            health_status["llm"] = False

        try:
            # Test the memory/checkpointer by invoking the app with a config
            test_config = {"configurable": {"thread_id": "health_check"}}
            test_state = {"messages": [HumanMessage(content="test")]}
            self.app.invoke(test_state, test_config)
            health_status["memory"] = True
            print("✅ Memory/checkpointer working")
        except Exception as e:
            print(f"⚠️ Memory health check failed: {e}")
            health_status["memory"] = False

        try:
            # Test the knowledge base (using the pre-initialized retriever)
            if self.knowledge_base:
                # Run a simple search to verify the retriever responds
                self.knowledge_base.search("test", top_k=1)
                health_status["knowledge_base"] = True
                print("✅ Knowledge retriever working")
            else:
                health_status["knowledge_base"] = False
                print("❌ Knowledge retriever not initialized")
        except Exception as e:
            print(f"⚠️ Knowledge base health check failed: {e}")
            health_status["knowledge_base"] = False

        try:
            # Test the conversation scripts
            from src.agent.scripts import ConversationScripts

            scripts = ConversationScripts(self.scripts_file)
            health_status["scripts"] = len(scripts.get_all_script_types()) > 0
        except Exception as e:
            print(f"⚠️ Scripts health check failed: {e}")

        # Overall health
        health_status["overall"] = all(
            [
                health_status["agent"],
                health_status["memory"],
                health_status["llm"],
                health_status["knowledge_base"],
                health_status["scripts"],
            ]
        )

        return health_status

# Usage example and testing
if __name__ == "__main__":
    # Initialize the agent
    agent = ViettelPayAgent()

    # Health check
    print("\n🏥 Health Check:")
    health = agent.health_check()
    for component, status in health.items():
        status_icon = "✅" if status else "❌"
        print(f"   {component}: {status_icon}")

    if not health["overall"]:
        print("\n⚠️ Some components are not healthy. Check requirements and data files.")
        raise SystemExit(1)

    print(f"\n🤖 Agent ready! Workflow info: {agent.get_workflow_info()}")

    # Test a multi-turn conversation with query enhancement
    test_thread = "test_conversation"
    print(
        f"\n🧪 Testing multi-turn conversation with query enhancement (thread: {test_thread}):"
    )

    test_messages = [
        "Xin chào!",
        "Mã lỗi 606 là gì?",
        "Làm sao khắc phục?",  # should be enhanced to "làm sao khắc phục lỗi 606"
        "Còn lỗi nào khác tương tự không?",  # should be enhanced with error context
        "Cảm ơn bạn!",
    ]

    for i, message in enumerate(test_messages, 1):
        print(f"\n--- Turn {i} ---")
        result = agent.process_message(message, test_thread)
        print(f"User: {message}")
        print(f"Bot: {result['response'][:150]}...")

        if result.get("enhanced_query") and result["enhanced_query"] != message:
            print(f"🚀 Query enhanced: {result['enhanced_query']}")

        # Show the conversation history length after the first turn
        if i > 1:
            history = agent.get_conversation_history(test_thread)
            print(f"History length: {len(history)} messages")

    print("\n📜 Final conversation history:")
    history = agent.get_conversation_history(test_thread)
    for i, msg in enumerate(history, 1):
        print(f"   {i}. {msg['role']}: {msg['content'][:100]}...")