# my-gradio-app/agents/core/coordinator.py
"""
Agent Coordinator - Manages agent collaboration and handoffs
Enables multi-agent responses and smooth transitions
"""
from typing import Dict, List, Optional, Any
import asyncio
from concurrent.futures import ThreadPoolExecutor
from utils.memory import ConversationMemory
from utils.session_store import get_session_store
from utils.conversation_summarizer import get_summarizer
from agents.core.router import route_to_agent, get_router
from fine_tuning import get_data_collector
from health_data import HealthContext, HealthDataStore
import hashlib
import json
class AgentCoordinator:
"""
Coordinates multiple agents and manages handoffs
Provides multi-agent collaboration capabilities
"""
def __init__(self, user_id: Optional[str] = None, use_embedding_router=True, enable_cache=True, enable_data_collection=True, enable_session_persistence=True):
"""
Initialize coordinator with shared memory and data store
Args:
user_id: Unique user identifier for session persistence
use_embedding_router: Use embedding-based routing (faster)
enable_cache: Enable response caching
enable_data_collection: Enable conversation logging for fine-tuning
enable_session_persistence: Enable session persistence across restarts
"""
# Session persistence
self.user_id = user_id
self.session_store = get_session_store() if enable_session_persistence else None
# Initialize memory with session persistence
self.memory = ConversationMemory(
user_id=user_id,
session_store=self.session_store
)
self.data_store = HealthDataStore()
self.health_context = None
self.agents = {}
# Enable embedding router (faster than LLM routing)
self.use_embedding_router = use_embedding_router
if use_embedding_router:
self.router = get_router(use_embeddings=True)
else:
self.router = None
# Enable response cache
self.enable_cache = enable_cache
self.response_cache = {} if enable_cache else None
# Enable data collection for fine-tuning
self.enable_data_collection = enable_data_collection
if enable_data_collection:
self.data_collector = get_data_collector()
else:
self.data_collector = None
# Conversation summarizer
self.summarizer = get_summarizer()
self._initialize_agents()
def _initialize_agents(self) -> None:
"""Initialize all agents with shared memory"""
# Import agents (lazy import to avoid circular dependencies)
from agents.specialized.nutrition_agent import NutritionAgent
from agents.specialized.exercise_agent import ExerciseAgent
from agents.specialized.symptom_agent import SymptomAgent
from agents.specialized.mental_health_agent import MentalHealthAgent
from agents.specialized.general_health_agent import GeneralHealthAgent
# Create agents with shared memory
self.agents = {
'nutrition_agent': NutritionAgent(memory=self.memory),
'exercise_agent': ExerciseAgent(memory=self.memory),
'symptom_agent': SymptomAgent(memory=self.memory),
'mental_health_agent': MentalHealthAgent(memory=self.memory),
'general_health_agent': GeneralHealthAgent(memory=self.memory)
}
def handle_query(self, message: str, chat_history: Optional[List] = None, user_id: Optional[str] = None) -> str:
"""
Main entry point - handles user query with coordination
Args:
message: User's message
chat_history: Conversation history
user_id: User ID for data persistence
Returns:
str: Response (possibly from multiple agents)
"""
chat_history = chat_history or []
# Create or update health context for user
if user_id:
self.health_context = HealthContext(user_id, self.data_store)
# Inject health context into all agents
for agent in self.agents.values():
if hasattr(agent, 'set_health_context'):
agent.set_health_context(self.health_context)
# Update memory from chat history
self._update_memory_from_history(chat_history)
# Summarize if conversation is too long
if self.summarizer.should_summarize(chat_history):
chat_history = self._summarize_if_needed(chat_history)
# Check if multi-agent collaboration is needed
if self._needs_multi_agent(message):
return self._handle_multi_agent_query(message, chat_history)
# Single agent routing
return self._handle_single_agent_query(message, chat_history)
def _get_cache_key(self, message: str, chat_history: List) -> str:
"""Generate cache key from message and recent history"""
        # Include up to the last 4 exchanges for context
recent_history = chat_history[-4:] if len(chat_history) > 4 else chat_history
cache_data = {
"message": message.lower().strip(),
"history": [(h[0].lower().strip() if h[0] else "", h[1][:50] if len(h) > 1 else "") for h in recent_history]
}
cache_str = json.dumps(cache_data, sort_keys=True)
return hashlib.md5(cache_str.encode()).hexdigest()
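    # Illustrative behaviour of the cache key above: messages are normalized with
    # lower()/strip(), so whitespace/case variants share one MD5 key:
    #
    #     key1 = coordinator._get_cache_key("  Ăn gì để giảm cân? ", [])
    #     key2 = coordinator._get_cache_key("ăn gì để giảm cân?", [])
    #     assert key1 == key2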
def _handle_single_agent_query(self, message: str, chat_history: List, file_data: Optional[Dict] = None) -> str:
"""Handle query with single agent (with potential handoff)"""
# Check cache first
if self.enable_cache:
cache_key = self._get_cache_key(message, chat_history)
if cache_key in self.response_cache:
# print("[CACHE HIT] Returning cached response")
return self.response_cache[cache_key]
# Route to appropriate agent (use embedding router if available)
if self.router:
routing_result = self.router.route(message, chat_history)
else:
routing_result = route_to_agent(message, chat_history)
agent_name = routing_result['agent']
parameters = routing_result['parameters']
# Update current agent in memory
self.memory.set_current_agent(agent_name)
# Get agent
agent = self.agents.get(agent_name)
if not agent:
return "Xin lỗi, không tìm thấy agent phù hợp."
# Let agent handle the request
response = agent.handle(parameters, chat_history)
# Log conversation for fine-tuning (with cleaned data)
if self.enable_data_collection and self.data_collector:
user_data = self.memory.get_full_profile()
# Clean user data before logging to prevent learning from errors
cleaned_user_data = self._clean_user_data_for_training(user_data)
self.data_collector.log_conversation(
agent_name=agent_name,
user_message=message,
agent_response=response,
user_data=cleaned_user_data,
metadata={'data_cleaned': True} # Flag that data was cleaned
)
        # Check whether a handoff is needed BEFORE caching, so the cache never
        # stores a response that differs from what is actually returned
        if hasattr(agent, 'should_handoff') and agent.should_handoff(message, chat_history):
            next_agent_name = agent.suggest_next_agent(message)
            if next_agent_name and next_agent_name in self.agents:
                return self._perform_handoff(agent, next_agent_name, response, message, chat_history)
        # Cache the response
        if self.enable_cache:
            cache_key = self._get_cache_key(message, chat_history)
            self.response_cache[cache_key] = response
            # Limit cache size to 100 entries (simple FIFO eviction)
            if len(self.response_cache) > 100:
                self.response_cache.pop(next(iter(self.response_cache)))
        return response
def _handle_multi_agent_query(self, message: str, chat_history: List) -> str:
"""Handle query that needs multiple agents (with parallel execution)"""
# Detect which agents are needed
agents_needed = self._detect_required_agents(message)
if len(agents_needed) <= 1:
# Fallback to single agent
return self._handle_single_agent_query(message, chat_history)
        # Use asyncio for parallel execution (faster than calling agents sequentially)
        try:
            # asyncio.run() creates, runs, and closes the event loop, even on error
            responses = asyncio.run(
                self._handle_multi_agent_async(message, chat_history, agents_needed)
            )
except Exception as e:
print(f"Async multi-agent failed, falling back to sequential: {e}")
# Fallback to sequential if async fails
responses = {}
for agent_name in agents_needed:
agent = self.agents.get(agent_name)
if agent:
parameters = {'user_query': message}
responses[agent_name] = agent.handle(parameters, chat_history)
# Combine responses
return self._combine_responses(responses, agents_needed)
async def _handle_multi_agent_async(self, message: str, chat_history: List, agents_needed: List[str]) -> Dict[str, str]:
"""Execute multiple agents in parallel using asyncio"""
async def call_agent(agent_name: str):
"""Async wrapper for agent.handle()"""
agent = self.agents.get(agent_name)
if not agent:
return None
            # Run in a thread pool (agent.handle is synchronous)
            loop = asyncio.get_running_loop()
with ThreadPoolExecutor() as pool:
parameters = {'user_query': message}
response = await loop.run_in_executor(
pool,
agent.handle,
parameters,
chat_history
)
return response
# Create tasks for all agents
tasks = {agent_name: call_agent(agent_name) for agent_name in agents_needed}
# Execute in parallel
results = await asyncio.gather(*tasks.values(), return_exceptions=True)
# Map results back to agent names
responses = {}
for agent_name, result in zip(tasks.keys(), results):
if isinstance(result, Exception):
print(f"Agent {agent_name} failed: {result}")
responses[agent_name] = f"Xin lỗi, {agent_name} gặp lỗi."
elif result:
responses[agent_name] = result
return responses
def _perform_handoff(
self,
from_agent: Any,
to_agent_name: str,
current_response: str,
message: str,
chat_history: List
) -> str:
"""
Perform smooth handoff between agents
Args:
from_agent: Current agent
to_agent_name: Name of agent to hand off to
current_response: Current agent's response
message: User's message
chat_history: Conversation history
Returns:
str: Combined response with handoff
"""
# Create handoff message
handoff_msg = from_agent.create_handoff_message(to_agent_name, current_response)
# Update memory
self.memory.set_current_agent(to_agent_name)
return handoff_msg
def _needs_multi_agent(self, message: str) -> bool:
"""
Determine if query needs multiple agents
Args:
message: User's message
Returns:
bool: True if multiple agents needed
"""
agents_needed = self._detect_required_agents(message)
return len(agents_needed) > 1
def _detect_required_agents(self, message: str) -> List[str]:
"""
Detect which agents are needed for this query
Args:
message: User's message
Returns:
List[str]: List of agent names needed
"""
agents_needed = []
message_lower = message.lower()
# PRIORITY 1: Symptom keywords (highest priority - health emergencies)
symptom_keywords = ['đau', 'sốt', 'ho', 'buồn nôn', 'chóng mặt', 'triệu chứng', 'khó tiêu', 'đầy bụng', 'ợ hơi']
has_symptoms = any(kw in message_lower for kw in symptom_keywords)
# PRIORITY 2: Nutrition keywords (but NOT if it's a symptom context)
nutrition_keywords = ['thực đơn', 'calo', 'giảm cân', 'tăng cân', 'dinh dưỡng', 'rau củ', 'thực phẩm']
# Special handling: 'ăn' only counts as nutrition if NOT in symptom context
has_nutrition = any(kw in message_lower for kw in nutrition_keywords)
if not has_symptoms and 'ăn' in message_lower:
has_nutrition = True
# PRIORITY 3: Exercise keywords
exercise_keywords = ['tập', 'gym', 'cardio', 'yoga', 'chạy bộ', 'exercise', 'workout']
has_exercise = any(kw in message_lower for kw in exercise_keywords)
# PRIORITY 4: Mental health keywords
mental_keywords = ['stress', 'lo âu', 'trầm cảm', 'mất ngủ', 'burnout', 'mental']
has_mental = any(kw in message_lower for kw in mental_keywords)
# IMPORTANT: Only trigger multi-agent if CLEARLY needs multiple domains
# Example: "Tôi bị đau bụng, nên ăn gì?" -> symptom + nutrition
# But: "WHO khuyến nghị ăn bao nhiêu rau củ?" -> ONLY nutrition
# Count how many domains are triggered
domain_count = sum([has_symptoms, has_nutrition, has_exercise, has_mental])
# If only 1 domain -> single agent (no multi-agent)
if domain_count <= 1:
if has_symptoms:
agents_needed.append('symptom_agent')
elif has_nutrition:
agents_needed.append('nutrition_agent')
elif has_exercise:
agents_needed.append('exercise_agent')
elif has_mental:
agents_needed.append('mental_health_agent')
else:
# Multiple domains detected
# Check if it's a REAL multi-domain question or false positive
# False positive patterns (should be single agent)
false_positives = [
'who khuyến nghị', # WHO recommendations -> single domain
'bao nhiêu', # Quantitative questions -> single domain
'khó tiêu', # Digestive issues -> symptom only
'đầy bụng', # Bloating -> symptom only
'đau bụng', # Stomach pain -> symptom only
'ợ hơi', # Burping -> symptom only
]
is_false_positive = any(pattern in message_lower for pattern in false_positives)
if is_false_positive:
# Use primary domain only
if has_nutrition:
agents_needed.append('nutrition_agent')
elif has_exercise:
agents_needed.append('exercise_agent')
elif has_symptoms:
agents_needed.append('symptom_agent')
elif has_mental:
agents_needed.append('mental_health_agent')
else:
# Real multi-domain question
if has_symptoms:
agents_needed.append('symptom_agent')
if has_nutrition:
agents_needed.append('nutrition_agent')
if has_exercise:
agents_needed.append('exercise_agent')
if has_mental:
agents_needed.append('mental_health_agent')
return agents_needed
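    # Hand-checked expectations for the detection above (illustrative, based on
    # the keyword and false-positive lists; not an exhaustive test):
    #   "Tôi bị sốt và stress, nên làm gì?"    -> ['symptom_agent', 'mental_health_agent']
    #   "WHO khuyến nghị ăn bao nhiêu rau củ?" -> ['nutrition_agent']  (caught by the
    #                                             'who khuyến nghị' false-positive pattern)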
def _combine_responses(self, responses: Dict[str, str], agents_order: List[str]) -> str:
"""
Combine responses from multiple agents
Args:
responses: Dict of agent_name -> response
agents_order: Order of agents
Returns:
str: Combined response
"""
# For natural flow, just combine responses without headers
# Make it feel like ONE person giving comprehensive advice
        responses_list = [responses[agent] for agent in agents_order if agent in responses]
        if not responses_list:
            # No agent produced a usable response - return a safe fallback
            return "Xin lỗi, không tìm thấy agent phù hợp."
        if len(responses_list) == 1:
            # Single agent - return as is
            return responses_list[0]
# Multiple agents - combine naturally
combined = ""
# First response (usually symptom assessment)
combined += responses_list[0]
# Add other responses with smooth transitions
for i in range(1, len(responses_list)):
# Natural transition phrases
transitions = [
"\n\nNgoài ra, ",
"\n\nBên cạnh đó, ",
"\n\nĐồng thời, ",
"\n\nVề mặt khác, "
]
transition = transitions[min(i-1, len(transitions)-1)]
combined += transition + responses_list[i]
# Natural closing (not too formal)
combined += "\n\nBạn thử làm theo xem có đỡ không nhé. Có gì thắc mắc cứ hỏi mình!"
return combined
def _update_memory_from_history(self, chat_history: List) -> None:
"""Extract and update SHARED memory from chat history to prevent duplicate questions"""
if not chat_history:
return
# Extract user info from ALL conversations (not just current agent)
user_info = self._extract_user_info_from_all_history(chat_history)
# Update SHARED memory that ALL agents can access
if user_info:
for key, value in user_info.items():
self.memory.update_profile(key, value)
def _extract_user_info_from_all_history(self, chat_history: List) -> Dict:
"""Extract user information from entire conversation history"""
user_info = {}
# Common patterns to extract
patterns = {
'age': [r'(\d+)\s*tuổi', r'tôi\s*(\d+)', r'(\d+)\s*years?\s*old'],
'gender': [r'tôi là (nam|nữ)', r'giới tính[:\s]*(nam|nữ)', r'(male|female|nam|nữ)'],
'weight': [r'(\d+)\s*kg', r'nặng\s*(\d+)', r'cân nặng[:\s]*(\d+)'],
'height': [r'(\d+)\s*cm', r'cao\s*(\d+)', r'chiều cao[:\s]*(\d+)'],
'goal': [r'muốn\s*(giảm cân|tăng cân|tăng cơ|khỏe mạnh)', r'mục tiêu[:\s]*(.+)']
}
# Search through all user messages
import re
for user_msg, _ in chat_history:
if not user_msg:
continue
for field, field_patterns in patterns.items():
if field not in user_info: # Only extract if not already found
for pattern in field_patterns:
match = re.search(pattern, user_msg.lower())
if match:
user_info[field] = match.group(1)
break
return user_info
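    # Illustrative extraction result (regex groups are returned as strings):
    #   "Tôi 25 tuổi, nặng 70 kg, cao 170 cm"
    #   -> {'age': '25', 'weight': '70', 'height': '170'}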
def _summarize_if_needed(self, chat_history: List) -> List:
"""
Summarize conversation if it's too long
Args:
chat_history: Full conversation history
Returns:
Compressed history with summary
"""
compressed = self.summarizer.compress_history(
chat_history,
target_turns=10 # Keep last 10 turns + summary
)
# print(f"📝 Summarized {len(chat_history)} turns → {len(compressed)} turns")
return compressed
def get_conversation_stats(self, chat_history: List) -> Dict[str, Any]:
"""Get statistics about current conversation"""
return self.summarizer.get_summary_stats(chat_history)
def get_memory_summary(self) -> str:
"""Get summary of current memory state"""
return self.memory.get_context_summary()
def _clean_user_data_for_training(self, user_data: Dict[str, Any]) -> Dict[str, Any]:
"""
Clean user data before logging for training
Ensures only valid, corrected data is used for fine-tuning
This prevents the model from learning bad patterns like:
- "cao 200m" (should be 200cm)
- "nặng 75g" (should be 75kg)
        - Implausible age or body-fat values
        """
        cleaned = user_data.copy()
cleaned = user_data.copy()
# Validate and clean height (should be 50-300 cm)
if 'height' in cleaned and cleaned['height'] is not None:
height = float(cleaned['height'])
if not (50 <= height <= 300):
# Invalid height - don't log it
cleaned['height'] = None
# Validate and clean weight (should be 20-300 kg)
if 'weight' in cleaned and cleaned['weight'] is not None:
weight = float(cleaned['weight'])
if not (20 <= weight <= 300):
# Invalid weight - don't log it
cleaned['weight'] = None
# Validate and clean age (should be 1-120)
if 'age' in cleaned and cleaned['age'] is not None:
age = int(cleaned['age'])
if not (1 <= age <= 120):
# Invalid age - don't log it
cleaned['age'] = None
# Validate and clean body fat (should be 3-60%)
if 'body_fat_percentage' in cleaned and cleaned['body_fat_percentage'] is not None:
bf = float(cleaned['body_fat_percentage'])
if not (3 <= bf <= 60):
# Invalid body fat - don't log it
cleaned['body_fat_percentage'] = None
# Remove any None values to keep training data clean
cleaned = {k: v for k, v in cleaned.items() if v is not None}
return cleaned
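    # Illustrative cleaning result (hypothetical profile values):
    #   {'height': 170.0, 'weight': 75.0, 'age': 25} -> kept unchanged (all in range)
    #   {'height': 2000, 'weight': 75, 'age': 25}    -> {'weight': 75, 'age': 25}  (height dropped)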
def clear_memory(self) -> None:
"""Clear all memory (start fresh)"""
self.memory.clear()
def __repr__(self) -> str:
return f"<AgentCoordinator: {self.get_memory_summary()}>"