| """ | |
| LogAnalysisAgent - Main orchestrator for cybersecurity log analysis | |
| """ | |
| import os | |
| import json | |
| import time | |
| from datetime import datetime | |
| from pathlib import Path | |
| from typing import List, Dict, Optional | |
| from langchain_core.messages import HumanMessage | |
| from langgraph.prebuilt import create_react_agent | |
| from langchain_core.tools import tool | |
| from langgraph.graph import StateGraph, END | |
| from langchain.chat_models import init_chat_model | |
| from langsmith import traceable, Client, get_current_run_tree | |
| from src.agents.log_analysis_agent.state_models import AnalysisState | |
| from src.agents.log_analysis_agent.utils import ( | |
| get_llm, | |
| get_tools, | |
| format_execution_time, | |
| truncate_to_tokens, | |
| ) | |
| from src.agents.log_analysis_agent.prompts import ( | |
| ANALYSIS_PROMPT, | |
| CRITIC_FEEDBACK_TEMPLATE, | |
| SELF_CRITIC_PROMPT, | |
| ) | |
| ls_client = Client(api_key=os.getenv("LANGSMITH_API_KEY")) | |


class LogAnalysisAgent:
    """
    Main orchestrator for cybersecurity log analysis.
    Coordinates the entire workflow: load → preprocess → analyze → save → display
    """

    def __init__(
        self,
        model_name: str = "google_genai:gemini-2.0-flash",
        temperature: float = 0.1,
        output_dir: str = "analysis",
        max_iterations: int = 2,
        llm_client=None,
    ):
        """
        Initialize the Log Analysis Agent

        Args:
            model_name: Name of the model to use (e.g. "google_genai:gemini-2.0-flash")
            temperature: Temperature for the model
            output_dir: Directory name for saving outputs (relative to package directory)
            max_iterations: Maximum number of iterations for the ReAct agent
            llm_client: Optional pre-initialized LLM client (overrides model_name/temperature)
        """
        if llm_client:
            self.llm = llm_client
            print("[INFO] Log Analysis Agent: Using provided LLM client")
        else:
            self.llm = init_chat_model(model_name, temperature=temperature)
            print(f"[INFO] Log Analysis Agent: Using default LLM model: {model_name}")

        self.base_tools = get_tools()
        self.output_root = Path(output_dir)
        self.output_root.mkdir(exist_ok=True)

        # Initialize helper components
        self.log_processor = LogProcessor(model_name=model_name)
        self.react_analyzer = ReactAnalyzer(
            self.llm, self.base_tools, max_iterations=max_iterations
        )
        self.result_manager = ResultManager(self.output_root)

        # Create workflow graph
        self.workflow = self._create_workflow()

    def _create_workflow(self) -> StateGraph:
        """Create and configure the analysis workflow graph"""
        workflow = StateGraph(AnalysisState)

        # Add nodes using instance methods
        workflow.add_node("load_logs", self.log_processor.load_logs)
        workflow.add_node("preprocess_logs", self.log_processor.preprocess_logs)
        workflow.add_node("react_agent_analysis", self.react_analyzer.analyze)
        workflow.add_node("save_results", self.result_manager.save_results)
        workflow.add_node("display_results", self.result_manager.display_results)

        # Define workflow edges
        workflow.set_entry_point("load_logs")
        workflow.add_edge("load_logs", "preprocess_logs")
        workflow.add_edge("preprocess_logs", "react_agent_analysis")
        workflow.add_edge("react_agent_analysis", "save_results")
        workflow.add_edge("save_results", "display_results")
        workflow.add_edge("display_results", END)

        return workflow.compile(name="log_analysis_agent")
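
    # Graph shape (for reference): the compiled workflow is a strictly linear pipeline
    #   load_logs -> preprocess_logs -> react_agent_analysis -> save_results -> display_results -> END
    # where every node receives and returns the shared AnalysisState dict.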

    def _log_workflow_metrics(
        self,
        workflow_step: str,
        execution_time: float,
        success: bool,
        details: dict = None,
    ):
        """Log workflow step performance metrics to LangSmith."""
        try:
            current_run = get_current_run_tree()
            if current_run:
                ls_client.create_feedback(
                    run_id=current_run.id,
                    key="log_analysis_workflow_performance",
                    score=1.0 if success else 0.0,
                    value={
                        "workflow_step": workflow_step,
                        "execution_time": execution_time,
                        "success": success,
                        "details": details or {},
                        "agent_type": "log_analysis_workflow",
                    },
                )
        except Exception as e:
            print(f"Failed to log workflow metrics: {e}")

    def _log_security_analysis_results(self, analysis_result: dict):
        """Log security analysis findings to LangSmith."""
        try:
            current_run = get_current_run_tree()
            if current_run:
                assessment = analysis_result.get("overall_assessment", "UNKNOWN")
                abnormal_events = analysis_result.get("abnormal_events", [])
                total_events = analysis_result.get("total_events_analyzed", 0)

                # Calculate threat score
                threat_score = 0.0
                if assessment == "CRITICAL":
                    threat_score = 1.0
                elif assessment == "HIGH":
                    threat_score = 0.8
                elif assessment == "MEDIUM":
                    threat_score = 0.5
                elif assessment == "LOW":
                    threat_score = 0.2

                ls_client.create_feedback(
                    run_id=current_run.id,
                    key="security_analysis_results",
                    score=threat_score,
                    value={
                        "overall_assessment": assessment,
                        "abnormal_events_count": len(abnormal_events),
                        "total_events_analyzed": total_events,
                        "execution_time": analysis_result.get(
                            "execution_time_formatted", "Unknown"
                        ),
                        "iteration_count": analysis_result.get("iteration_count", 1),
                        "abnormal_events": abnormal_events[:5],  # Limit to first 5 for logging
                    },
                )
        except Exception as e:
            print(f"Failed to log security analysis results: {e}")

    def _log_batch_analysis_metrics(
        self,
        total_files: int,
        successful: int,
        start_time: datetime,
        end_time: datetime,
    ):
        """Log batch analysis performance metrics."""
        try:
            current_run = get_current_run_tree()
            if current_run:
                duration = (end_time - start_time).total_seconds()
                success_rate = successful / total_files if total_files > 0 else 0

                ls_client.create_feedback(
                    run_id=current_run.id,
                    key="batch_analysis_performance",
                    score=success_rate,
                    value={
                        "total_files": total_files,
                        "successful_files": successful,
                        "failed_files": total_files - successful,
                        "success_rate": success_rate,
                        "duration_seconds": duration,
                        "files_per_minute": (
                            (total_files / duration) * 60 if duration > 0 else 0
                        ),
                    },
                )
        except Exception as e:
            print(f"Failed to log batch analysis metrics: {e}")

    def analyze(self, log_file: str) -> Dict:
        """
        Analyze a single log file

        Args:
            log_file: Path to the log file to analyze

        Returns:
            Dictionary containing the analysis result
        """
        state = self._initialize_state(log_file)
        result = self.workflow.invoke(state, config={"recursion_limit": 100})

        analysis_result = result.get("analysis_result", {})
        if analysis_result:
            self._log_security_analysis_results(analysis_result)

        return analysis_result

    def analyze_batch(
        self, dataset_dir: str, skip_existing: bool = False
    ) -> List[Dict]:
        """
        Analyze all log files in a dataset directory

        Args:
            dataset_dir: Path to directory containing log files
            skip_existing: Whether to skip already analyzed files

        Returns:
            List of result dictionaries for each file
        """
        print("=" * 60)
        print("BATCH MODE: Analyzing all files in dataset")
        print("=" * 60 + "\n")

        files = self._find_dataset_files(dataset_dir)
        if not files:
            print("No JSON files found in dataset directory")
            return []

        print(f"Found {len(files)} files to analyze")
        if skip_existing:
            print("Skip mode enabled: Already analyzed files will be skipped")
        print()

        results = []
        batch_start = datetime.now()

        for idx, file_path in enumerate(files, 1):
            filename = os.path.basename(file_path)
            print(f"\n[{idx}/{len(files)}] Processing: {filename}")
            print("-" * 60)

            result = self._analyze_single_file(file_path, skip_existing)
            results.append(result)

            if result["success"]:
                print(f"Status: {result['message']}")
            else:
                print(f"Status: FAILED - {result['message']}")

        batch_end = datetime.now()
        successful = sum(1 for r in results if r["success"])

        self._log_batch_analysis_metrics(len(files), successful, batch_start, batch_end)
        self.result_manager.display_batch_summary(results, batch_start, batch_end)

        return results

    def _initialize_state(self, log_file: str) -> Dict:
        """Initialize the analysis state with default values"""
        return {
            "log_file": log_file,
            "raw_logs": "",
            "prepared_logs": "",
            "analysis_result": {},
            "messages": [],
            "agent_reasoning": "",
            "agent_observations": [],
            "iteration_count": 0,
            "critic_feedback": "",
            "iteration_history": [],
            "start_time": 0.0,
            "end_time": 0.0,
        }

    def _analyze_single_file(self, log_file: str, skip_existing: bool = False) -> Dict:
        """Analyze a single log file with error handling"""
        try:
            if skip_existing:
                existing = self.result_manager.get_existing_output(log_file)
                if existing:
                    return {
                        "success": True,
                        "log_file": log_file,
                        "message": "Skipped (already analyzed)",
                        "result": None,
                    }

            state = self._initialize_state(log_file)
            # Read the analysis result from the state returned by the workflow,
            # not from the input dict (the graph does not mutate it in place).
            final_state = self.workflow.invoke(state, config={"recursion_limit": 100})

            return {
                "success": True,
                "log_file": log_file,
                "message": "Analysis completed",
                "result": final_state.get("analysis_result"),
            }
        except Exception as e:
            return {
                "success": False,
                "log_file": log_file,
                "message": f"Error: {str(e)}",
                "result": None,
            }

    def _find_dataset_files(self, dataset_dir: str) -> List[str]:
        """Find all JSON files in the dataset directory"""
        import glob

        if not os.path.exists(dataset_dir):
            print(f"Error: Dataset directory not found: {dataset_dir}")
            return []

        json_files = glob.glob(os.path.join(dataset_dir, "*.json"))
        return sorted(json_files)


class LogProcessor:
    """
    Handles log loading and preprocessing operations
    """

    def __init__(self, max_size: int = 30000, model_name: str = ""):
        """
        Initialize the log processor

        Args:
            max_size: Maximum character size before applying sampling
            model_name: Model name to adjust limits accordingly
        """
        if "gpt-oss" in model_name.lower():
            self.max_size = 5000  # Conservative limit for GPT-OSS models
            print(
                f"[INFO] Using reduced sampling size ({self.max_size}) for GPT-OSS model"
            )
        else:
            self.max_size = max_size

        self.model_name = model_name

    def _get_max_input_tokens(self, model_name: str) -> int:
        """
        Determine maximum input tokens based on model capabilities

        Args:
            model_name: Name of the model to determine token limits for

        Returns:
            Maximum input tokens for the model
        """
        model_lower = model_name.lower()

        # Gemini models: 200k tokens
        if "gemini" in model_lower:
            return 200_000
        # elif "gpt-5" in model_lower:
        #     return 80_000
        # Default for other models: 45k tokens
        else:
            return 45_000

    def load_logs(self, state: AnalysisState) -> AnalysisState:
        """Load logs from file and initialize state"""
        filename = os.path.basename(state["log_file"])
        print(f"Loading logs from: {filename}")

        # Record start time
        state["start_time"] = time.time()
        start_time = time.time()

        try:
            with open(state["log_file"], "r", encoding="utf-8") as f:
                raw = f.read()
            success = True
        except Exception as e:
            print(f"Error reading file: {e}")
            raw = f"Error loading file: {e}"
            success = False

        execution_time = time.time() - start_time
        self._log_loading_metrics(filename, len(raw), execution_time, success)

        state["raw_logs"] = raw
        state["max_input_token"] = self._get_max_input_tokens(self.model_name)
        state["messages"] = []
        state["agent_reasoning"] = ""
        state["agent_observations"] = []
        state["iteration_count"] = 0
        state["critic_feedback"] = ""
        state["iteration_history"] = []
        state["end_time"] = 0.0

        return state

    def preprocess_logs(self, state: AnalysisState) -> AnalysisState:
        """Preprocess logs for analysis - token-based truncation based on model capabilities"""
        raw = state["raw_logs"]
        line_count = raw.count("\n")
        max_tokens = state["max_input_token"]
        print(
            f"Loaded {line_count} lines, {len(raw)} characters (max tokens: {max_tokens:,})"
        )

        start_time = time.time()

        # Truncate by tokens to keep context windows manageable
        truncated = truncate_to_tokens(raw, max_tokens)
        token_truncation_applied = len(truncated) < len(raw)

        # Prepare final text with minimal header
        state["prepared_logs"] = f"TOTAL LINES: {line_count}\n\n{truncated}"

        execution_time = time.time() - start_time
        self._log_preprocessing_metrics(
            line_count,
            len(raw),
            len(truncated),
            token_truncation_applied,
            execution_time,
        )

        return state

    def _log_loading_metrics(
        self, filename: str, file_size: int, execution_time: float, success: bool
    ):
        """Log file loading performance metrics."""
        try:
            current_run = get_current_run_tree()
            if current_run:
                ls_client.create_feedback(
                    run_id=current_run.id,
                    key="log_loading_performance",
                    score=1.0 if success else 0.0,
                    value={
                        "filename": filename,
                        "file_size_chars": file_size,
                        "execution_time": execution_time,
                        "success": success,
                    },
                )
        except Exception as e:
            print(f"Failed to log loading metrics: {e}")

    def _log_preprocessing_metrics(
        self,
        line_count: int,
        original_size: int,
        processed_size: int,
        sampling_applied: bool,
        execution_time: float,
    ):
        """Log preprocessing performance metrics."""
        try:
            current_run = get_current_run_tree()
            if current_run:
                ls_client.create_feedback(
                    run_id=current_run.id,
                    key="log_preprocessing_performance",
                    score=1.0,
                    value={
                        "line_count": line_count,
                        "original_size_chars": original_size,
                        "processed_size_chars": processed_size,
                        "sampling_applied": sampling_applied,
                        "size_reduction": (
                            (original_size - processed_size) / original_size
                            if original_size > 0
                            else 0
                        ),
                        "execution_time": execution_time,
                    },
                )
        except Exception as e:
            print(f"Failed to log preprocessing metrics: {e}")

    def _apply_sampling(self, raw: str) -> str:
        """Apply sampling strategy with line-aware boundaries"""
        lines = raw.split("\n")
        total_lines = len(lines)

        if total_lines <= 50:  # Small files, return as-is
            return raw

        # Take proportional samples but respect line boundaries
        first_lines = lines[: int(total_lines * 0.25)]  # First 25%
        middle_start = int(total_lines * 0.4)
        middle_end = int(total_lines * 0.6)
        middle_lines = lines[middle_start:middle_end]  # Middle 20%
        last_lines = lines[-int(total_lines * 0.25):]  # Last 25%

        return f"""=== BEGINNING ({len(first_lines)} lines) ===
{chr(10).join(first_lines)}
=== MIDDLE (lines {middle_start}-{middle_end}) ===
{chr(10).join(middle_lines)}
=== END ({len(last_lines)} lines) ===
{chr(10).join(last_lines)}"""


class ReactAnalyzer:
    """
    Handles ReAct agent analysis with iterative refinement
    Combines react_engine + criticism_engine logic
    """

    def __init__(self, llm, base_tools, max_iterations: int = 2):
        """
        Initialize the ReAct analyzer

        Args:
            llm: Language model instance
            base_tools: List of base tools for the agent
            max_iterations: Maximum refinement iterations
        """
        self.llm = llm
        self.base_tools = base_tools
        self.max_iterations = max_iterations

    def analyze(self, state: AnalysisState) -> AnalysisState:
        """Perform ReAct agent analysis with iterative refinement"""
        print("Starting ReAct agent analysis with iterative refinement...")
        start_time = time.time()

        # Create state-aware tools
        tools = self._create_state_aware_tools(state)

        # Create ReAct agent
        agent_executor = create_react_agent(
            self.llm, tools, name="react_agent_analysis"
        )

        # System context
        system_context = """You are Agent A, an autonomous cybersecurity analyst.
IMPORTANT CONTEXT - RAW LOGS AVAILABLE:
The complete raw logs are available for certain tools automatically.
When you call event_id_extractor_with_logs or timeline_builder_with_logs,
you only need to provide the required parameters - the tools will automatically
access the raw logs to perform their analysis.
"""

        try:
            # Iterative refinement loop
            for iteration in range(self.max_iterations):
                state["iteration_count"] = iteration
                print(f"\n{'='*60}")
                print(f"ITERATION {iteration + 1}/{self.max_iterations}")
                print(f"{'='*60}")

                # Prepare prompt with optional feedback
                messages = self._prepare_messages(state, iteration, system_context)

                # Run ReAct agent
                print("Running agent analysis...")
                result = agent_executor.invoke(
                    {"messages": messages}, config={"recursion_limit": 100}
                )
                state["messages"] = result["messages"]

                # Extract and process final analysis
                final_analysis = self._extract_final_analysis(state["messages"])

                # Calculate execution time
                state["end_time"] = time.time()
                execution_time = format_execution_time(
                    state["end_time"] - state["start_time"]
                )

                # Extract reasoning
                state["agent_reasoning"] = final_analysis.get("reasoning", "")

                # Format result
                state["analysis_result"] = self._format_analysis_result(
                    final_analysis,
                    execution_time,
                    iteration + 1,
                    state["agent_reasoning"],
                )

                # Run self-critic review
                print("Running self-critic review...")
                original_analysis = state["analysis_result"].copy()
                critic_result = self._critic_review(state)

                # Store iteration in history
                state["iteration_history"].append(
                    {
                        "iteration": iteration + 1,
                        "original_analysis": original_analysis,
                        "critic_evaluation": {
                            "quality_acceptable": critic_result["quality_acceptable"],
                            "issues": critic_result["issues"],
                            "feedback": critic_result["feedback"],
                        },
                        "corrected_analysis": critic_result["corrected_analysis"],
                    }
                )

                # Use corrected analysis
                corrected = critic_result["corrected_analysis"]
                corrected["execution_time_seconds"] = original_analysis.get(
                    "execution_time_seconds", 0
                )
                corrected["execution_time_formatted"] = original_analysis.get(
                    "execution_time_formatted", "Unknown"
                )
                corrected["iteration_count"] = iteration + 1
                state["analysis_result"] = corrected

                # Check if refinement is needed
                if critic_result["quality_acceptable"]:
                    print(
                        f"✓ Quality acceptable - stopping at iteration {iteration + 1}"
                    )
                    break
                elif iteration < self.max_iterations - 1:
                    print(
                        f"✗ Quality needs improvement - proceeding to iteration {iteration + 2}"
                    )
                    state["critic_feedback"] = critic_result["feedback"]
                else:
                    print("✗ Max iterations reached - using current analysis")

            print(
                f"\nAnalysis complete after {state['iteration_count'] + 1} iteration(s)"
            )
            print(f"Total messages: {len(state['messages'])}")

        except Exception as e:
            print(f"Error in analysis: {e}")
            import traceback

            traceback.print_exc()

            state["end_time"] = time.time()
            execution_time = format_execution_time(
                state["end_time"] - state["start_time"]
            )
            state["analysis_result"] = {
                "overall_assessment": "ERROR",
                "total_events_analyzed": 0,
                "execution_time_seconds": execution_time["total_seconds"],
                "execution_time_formatted": execution_time["formatted_time"],
                "analysis_summary": f"Analysis failed: {e}",
                "agent_reasoning": "",
                "abnormal_event_ids": [],
                "abnormal_events": [],
                "iteration_count": state.get("iteration_count", 0),
            }

        return state

    def _create_state_aware_tools(self, state: AnalysisState):
        """Create state-aware versions of tools that need raw logs"""

        # Create state-aware event_id_extractor
        def event_id_extractor_with_logs(suspected_event_id: str) -> dict:
            """Validates and corrects Windows Event IDs identified in log analysis."""
            from .tools.event_id_extractor_tool import _event_id_extractor_tool

            return _event_id_extractor_tool.run(
                {
                    "suspected_event_id": suspected_event_id,
                    "raw_logs": state["raw_logs"],
                }
            )

        # Create state-aware timeline_builder
        def timeline_builder_with_logs(
            pivot_entity: str, pivot_type: str, time_window_minutes: int = 5
        ) -> dict:
            """Build a focused timeline around suspicious events to understand attack sequences.
            Use this when you suspect coordinated activity or want to understand what happened
            before and after a suspicious event. Analyzes the sequence of events to identify patterns.

            Args:
                pivot_entity: The entity to build the timeline around (e.g., "powershell.exe", "admin", "192.168.1.100")
                pivot_type: Type of entity - "user", "process", "ip", "file", "computer", "event_id", or "registry"
                time_window_minutes: Minutes before and after pivot events to include (default: 5)

            Returns:
                Timeline analysis showing events before and after the pivot, helping identify attack sequences.
            """
            from .tools.timeline_builder_tool import _timeline_builder_tool

            return _timeline_builder_tool.run(
                {
                    "pivot_entity": pivot_entity,
                    "pivot_type": pivot_type,
                    "time_window_minutes": time_window_minutes,
                    "raw_logs": state["raw_logs"],
                }
            )

        # Replace base tools with state-aware versions
        tools = [
            t
            for t in self.base_tools
            if t.name not in ["event_id_extractor", "timeline_builder"]
        ]
        tools.append(event_id_extractor_with_logs)
        tools.append(timeline_builder_with_logs)

        return tools

    def _prepare_messages(
        self, state: AnalysisState, iteration: int, system_context: str
    ):
        """Prepare messages for the ReAct agent"""
        if iteration == 0:
            # First iteration - no feedback
            critic_feedback_section = ""
            full_prompt = system_context + ANALYSIS_PROMPT.format(
                logs=state["prepared_logs"],
                critic_feedback_section=critic_feedback_section,
            )
            messages = [HumanMessage(content=full_prompt)]
        else:
            # Subsequent iterations - include feedback and preserve messages
            critic_feedback_section = CRITIC_FEEDBACK_TEMPLATE.format(
                iteration=iteration + 1, feedback=state["critic_feedback"]
            )
            # Only copy LangChain message objects, not dicts
            messages = [msg for msg in state["messages"] if not isinstance(msg, dict)]
            messages.append(HumanMessage(content=critic_feedback_section))

        return messages

    def _extract_final_analysis(self, messages):
        """Extract the final analysis from agent messages"""
        final_message = None
        for msg in reversed(messages):
            if (
                hasattr(msg, "__class__")
                and msg.__class__.__name__ == "AIMessage"
                and hasattr(msg, "content")
                and msg.content
                and (not hasattr(msg, "tool_calls") or not msg.tool_calls)
            ):
                final_message = msg.content
                break

        if not final_message:
            raise Exception("No final analysis message found")

        return self._parse_agent_output(final_message)

    def _parse_agent_output(self, content: str) -> dict:
        """Parse the agent's final output"""
        try:
            if "```json" in content:
                json_str = content.split("```json")[1].split("```")[0].strip()
            elif "```" in content:
                json_str = content.split("```")[1].split("```")[0].strip()
            else:
                json_str = content.strip()
            return json.loads(json_str)
        except Exception as e:
            print(f"Failed to parse agent output: {e}")
            return {
                "overall_assessment": "UNKNOWN",
                "total_events_analyzed": 0,
                "analysis_summary": content[:500],
                "reasoning": "",
                "abnormal_event_ids": [],
                "abnormal_events": [],
            }

    def _format_analysis_result(
        self, final_analysis, execution_time, iteration_count, agent_reasoning
    ):
        """Format the analysis result into the expected structure"""
        abnormal_events = []
        for event in final_analysis.get("abnormal_events", []):
            event_with_tools = {
                "event_id": event.get("event_id", ""),
                "event_description": event.get("event_description", ""),
                "why_abnormal": event.get("why_abnormal", ""),
                "severity": event.get("severity", ""),
                "indicators": event.get("indicators", []),
                "potential_threat": event.get("potential_threat", ""),
                "attack_category": event.get("attack_category", ""),
                "tool_enrichment": event.get("tool_enrichment", {}),
            }
            abnormal_events.append(event_with_tools)

        return {
            "overall_assessment": final_analysis.get("overall_assessment", "UNKNOWN"),
            "total_events_analyzed": final_analysis.get("total_events_analyzed", 0),
            "execution_time_seconds": execution_time["total_seconds"],
            "execution_time_formatted": execution_time["formatted_time"],
            "analysis_summary": final_analysis.get("analysis_summary", ""),
            "agent_reasoning": agent_reasoning,
            "abnormal_event_ids": final_analysis.get("abnormal_event_ids", []),
            "abnormal_events": abnormal_events,
            "iteration_count": iteration_count,
        }

    # ========== CRITIC ENGINE METHODS ==========

    def _critic_review(self, state: dict) -> dict:
        """Run self-critic review with quality evaluation"""
        critic_input = SELF_CRITIC_PROMPT.format(
            final_json=json.dumps(state["analysis_result"], indent=2),
            messages="\n".join(
                [str(m.content) for m in state["messages"] if hasattr(m, "content")]
            ),
            logs=state["prepared_logs"],
        )

        resp = self.llm.invoke(critic_input)
        full_response = resp.content

        try:
            # Parse critic response
            quality_acceptable, issues, feedback, corrected_json = (
                self._parse_critic_response(full_response)
            )
            return {
                "quality_acceptable": quality_acceptable,
                "issues": issues,
                "feedback": feedback,
                "corrected_analysis": corrected_json,
                "full_response": full_response,
            }
        except Exception as e:
            print(f"[Critic] Failed to parse review: {e}")
            # If the critic fails, accept the current analysis
            return {
                "quality_acceptable": True,
                "issues": [],
                "feedback": "",
                "corrected_analysis": state["analysis_result"],
                "full_response": full_response,
            }
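
    # Expected critic response layout (illustrative, inferred from the parsing below):
    #   "## ISSUES FOUND"       - issue keywords such as MISSING_EVENT_IDS, SEVERITY_MISMATCH, ...
    #   "## FEEDBACK FOR AGENT" - free-text guidance for the next iteration
    #   a fenced ```json block  - the corrected analysis JSON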

    def _parse_critic_response(self, content: str) -> tuple:
        """Parse the critic response and evaluate quality"""
        # Extract sections
        issues_section = ""
        feedback_section = ""

        if "## ISSUES FOUND" in content:
            parts = content.split("## ISSUES FOUND")
            if len(parts) > 1:
                issues_section = parts[1].split("##")[0].strip()

        if "## FEEDBACK FOR AGENT" in content:
            parts = content.split("## FEEDBACK FOR AGENT")
            if len(parts) > 1:
                feedback_section = parts[1].split("##")[0].strip()

        # Extract corrected JSON
        if "```json" in content:
            json_str = content.split("```json")[1].split("```")[0].strip()
        elif "```" in content:
            json_str = content.split("```")[1].split("```")[0].strip()
        else:
            json_str = "{}"
        corrected_json = json.loads(json_str)

        # Evaluate quality based on issues
        issues = self._extract_issues(issues_section)
        quality_acceptable = self._evaluate_quality(issues, issues_section)

        return quality_acceptable, issues, feedback_section, corrected_json

    def _extract_issues(self, issues_text: str) -> list:
        """Extract structured issues from text"""
        issues = []

        # Check for "None" or "no issues"
        if (
            "none" in issues_text.lower()
            and "analysis is acceptable" in issues_text.lower()
        ):
            return issues

        # Extract issue types
        issue_types = {
            "MISSING_EVENT_IDS": "missing_event_ids",
            "SEVERITY_MISMATCH": "severity_mismatch",
            "IGNORED_TOOLS": "ignored_tool_results",
            "INCOMPLETE_EVENTS": "incomplete_abnormal_events",
            "EVENT_ID_FORMAT": "event_id_format",
            "SCHEMA_ISSUES": "schema_issues",
            "UNDECODED_COMMANDS": "undecoded_commands",
        }
        for keyword, issue_type in issue_types.items():
            if keyword in issues_text:
                issues.append({"type": issue_type, "text": issues_text})

        return issues

    def _evaluate_quality(self, issues: list, issues_text: str) -> bool:
        """Evaluate whether the analysis quality is acceptable"""
        # If no issues found
        if not issues:
            return True

        # Critical issue types that trigger another iteration
        critical_types = {
            "missing_event_ids",
            "severity_mismatch",
            "ignored_tool_results",
            "incomplete_abnormal_events",
            "undecoded_commands",
        }

        # Count critical issues
        critical_count = sum(1 for issue in issues if issue["type"] in critical_types)

        # Quality threshold: at most one critical issue is acceptable
        if critical_count >= 2:
            return False

        # Additional check: the issues text indicates major problems
        if any(
            word in issues_text.lower() for word in ["critical", "major", "serious"]
        ):
            return False

        return True


class ResultManager:
    """
    Handles saving results to disk and displaying them on the console
    """

    def __init__(self, output_root: Path):
        """
        Initialize the result manager

        Args:
            output_root: Root directory for saving outputs
        """
        self.output_root = output_root

    def save_results(self, state: AnalysisState) -> AnalysisState:
        """Save analysis results and messages to files"""
        input_name = os.path.splitext(os.path.basename(state["log_file"]))[0]
        analysis_dir = self.output_root / input_name
        analysis_dir.mkdir(exist_ok=True)

        ts = datetime.now().strftime("%Y%m%d_%H%M%S")
        start_time = time.time()
        success = True

        try:
            # Save main analysis result
            out_file = analysis_dir / f"analysis_{ts}.json"
            with open(out_file, "w", encoding="utf-8") as f:
                json.dump(state["analysis_result"], f, indent=2)

            # Save iteration history
            history_file = analysis_dir / f"iterations_{ts}.json"
            with open(history_file, "w", encoding="utf-8") as f:
                json.dump(state.get("iteration_history", []), f, indent=2)

            # Save messages history
            messages_file = analysis_dir / f"messages_{ts}.json"
            serializable_messages = self._serialize_messages(state.get("messages", []))
            with open(messages_file, "w", encoding="utf-8") as f:
                json.dump(serializable_messages, f, indent=2)
        except Exception as e:
            print(f"Error saving results: {e}")
            success = False

        execution_time = time.time() - start_time
        self._log_save_metrics(input_name, execution_time, success)

        return state

    def _log_save_metrics(self, input_name: str, execution_time: float, success: bool):
        """Log file saving performance metrics."""
        try:
            current_run = get_current_run_tree()
            if current_run:
                ls_client.create_feedback(
                    run_id=current_run.id,
                    key="result_save_performance",
                    score=1.0 if success else 0.0,
                    value={
                        "input_name": input_name,
                        "execution_time": execution_time,
                        "success": success,
                    },
                )
        except Exception as e:
            print(f"Failed to log save metrics: {e}")

    def display_results(self, state: AnalysisState) -> AnalysisState:
        """Display formatted analysis results"""
        result = state["analysis_result"]
        assessment = result.get("overall_assessment", "UNKNOWN")
        execution_time = result.get("execution_time_formatted", "Unknown")
        abnormal_events = result.get("abnormal_events", [])
        iteration_count = result.get("iteration_count", 1)

        print("\n" + "=" * 60)
        print("ANALYSIS COMPLETE")
        print("=" * 60)
        print(f"ASSESSMENT: {assessment}")
        print(f"ITERATIONS: {iteration_count}")
        print(f"EXECUTION TIME: {execution_time}")
        print(f"EVENTS ANALYZED: {result.get('total_events_analyzed', 'Unknown')}")

        # Tools used
        tools_used = self._extract_tools_used(state.get("messages", []))
        if tools_used:
            print(f"TOOLS USED: {len(tools_used)} tools")
            print(f"  Types: {', '.join(sorted(tools_used))}")
        else:
            print("TOOLS USED: None")

        # Abnormal events
        if abnormal_events:
            print(f"\nABNORMAL EVENTS: {len(abnormal_events)}")
            for event in abnormal_events:
                severity = event.get("severity", "UNKNOWN")
                event_id = event.get("event_id", "N/A")
                print(f"  EventID {event_id} [{severity}]")
        else:
            print("\nNO ABNORMAL EVENTS")

        print("=" * 60)
        return state

    def display_batch_summary(
        self, results: List[Dict], start_time: datetime, end_time: datetime
    ):
        """Print a summary of batch processing results"""
        total = len(results)
        successful = sum(1 for r in results if r["success"])
        skipped = sum(1 for r in results if "Skipped" in r["message"])
        failed = total - successful
        duration = (end_time - start_time).total_seconds()

        print("\n" + "=" * 60)
        print("BATCH ANALYSIS SUMMARY")
        print("=" * 60)
        print(f"Total files: {total}")
        print(f"Successful: {successful}")
        print(f"Skipped: {skipped}")
        print(f"Failed: {failed}")
        print(f"Total time: {duration:.2f} seconds ({duration/60:.2f} minutes)")

        if failed > 0:
            print("\nFailed files:")
            for r in results:
                if not r["success"]:
                    filename = os.path.basename(r["log_file"])
                    print(f"  - {filename}: {r['message']}")

        print("=" * 60 + "\n")

    def get_existing_output(self, log_file: str) -> Optional[str]:
        """Return the output file path for a given log file if it already exists"""
        input_name = os.path.splitext(os.path.basename(log_file))[0]
        analysis_dir = self.output_root / input_name

        if analysis_dir.exists():
            existing_files = list(analysis_dir.glob("analysis_*.json"))
            if existing_files:
                return str(existing_files[0])
        return None

    def _serialize_messages(self, messages) -> List[dict]:
        """Serialize messages for JSON storage"""
        serializable_messages = []
        for msg in messages:
            if isinstance(msg, dict):
                serializable_messages.append(msg)
            else:
                msg_dict = {
                    "type": msg.__class__.__name__,
                    "content": msg.content if hasattr(msg, "content") else str(msg),
                }
                if hasattr(msg, "tool_calls") and msg.tool_calls:
                    msg_dict["tool_calls"] = [
                        {"name": tc.get("name", ""), "args": tc.get("args", {})}
                        for tc in msg.tool_calls
                    ]
                serializable_messages.append(msg_dict)
        return serializable_messages

    def _extract_tools_used(self, messages) -> set:
        """Extract the set of tool names used during analysis"""
        tools_used = set()
        for msg in messages:
            if hasattr(msg, "tool_calls") and msg.tool_calls:
                for tc in msg.tool_calls:
                    tool_name = tc.get("name", "")
                    if tool_name:
                        tools_used.add(tool_name)
        return tools_used
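

if __name__ == "__main__":
    # Illustrative usage sketch (not part of the module's API): the paths below are
    # placeholders, and running this assumes model credentials and LANGSMITH_API_KEY
    # are configured in the environment.
    agent = LogAnalysisAgent(output_dir="analysis", max_iterations=2)

    # Single-file analysis
    single_result = agent.analyze("dataset/example_log.json")
    print(single_result.get("overall_assessment", "UNKNOWN"))

    # Batch analysis over a directory of JSON log files, skipping prior results
    batch_results = agent.analyze_batch("dataset", skip_existing=True)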