AI-Life-Coach-Streamlit2

Running

App Files Files Community

AI-Life-Coach-Streamlit2 / core /providers /ollama.py

rdune71

Targeted chat response fix: enhanced debugging, improved session handling, and better error reporting

dac104e 2 months ago

raw

history blame

6.88 kB

	import json
	import logging
	import re
	from datetime import datetime
	from typing import List, Dict, Optional, Union

	import requests

	from core.providers.base import LLMProvider
	from utils.config import config
	from services.weather import weather_service

	logger = logging.getLogger(__name__)

	class OllamaProvider(LLMProvider):
	    """LLM provider that talks to an Ollama server over its HTTP chat API.

	    The server address comes from ``config.ollama_host`` and falls back to
	    a local default. Every request carries a header that suppresses the
	    ngrok browser-warning page.

	    NOTE(review): ``self.model_name``, ``self.timeout`` and
	    ``self._retry_with_backoff`` are not defined in this class; they are
	    presumably provided by ``LLMProvider`` -- confirm against the base class.
	    """

	    # Address used when no host is configured or the configured one is blank.
	    _DEFAULT_HOST = "http://localhost:11434"

	    # ASCII control characters (including CR, LF, TAB and NUL) that must never
	    # appear inside a URL; typically left over from copy/pasted secrets.
	    _CONTROL_CHARS = re.compile(r"[\x00-\x1f\x7f]+")

	    def __init__(self, model_name: str, timeout: int = 60, max_retries: int = 3):
	        """Create a provider for ``model_name``.

	        Args:
	            model_name: Name of the Ollama model to use.
	            timeout: Per-request timeout in seconds (raised from 30 to 60).
	            max_retries: Forwarded to the base class together with the other
	                arguments.
	        """
	        super().__init__(model_name, timeout, max_retries)
	        self.host = self._sanitize_host(config.ollama_host or self._DEFAULT_HOST)
	        # Headers to skip the ngrok browser warning.
	        self.headers = {
	            "ngrok-skip-browser-warning": "true",
	            "User-Agent": "CosmicCat-AI-Assistant",
	        }

	    def _sanitize_host(self, host: str) -> str:
	        """Return a clean base URL for the Ollama server.

	        Control characters and surrounding whitespace are removed, a missing
	        scheme defaults to ``http://`` and trailing slashes are dropped so
	        that ``f"{host}/api/..."`` never produces a double slash.

	        Args:
	            host: Raw host string from configuration; may be empty or ``None``.

	        Returns:
	            The sanitized base URL, or the default local address when
	            nothing usable remains.
	        """
	        if not host:
	            return self._DEFAULT_HOST
	        cleaned = self._CONTROL_CHARS.sub("", host).strip().rstrip("/")
	        if not cleaned:
	            # Whitespace-only input used to become a bare "http://".
	            return self._DEFAULT_HOST
	        # Compare case-insensitively so "HTTP://host" is not prefixed again.
	        if not cleaned.lower().startswith(("http://", "https://")):
	            cleaned = "http://" + cleaned
	        return cleaned

	    @staticmethod
	    def _with_default_tag(name: str) -> str:
	        """Append ``:latest`` to a model name that carries no explicit tag."""
	        # Only the last path segment can hold a tag; an earlier colon may
	        # belong to a registry "host:port" prefix.
	        if name and ":" not in name.rsplit("/", 1)[-1]:
	            return f"{name}:latest"
	        return name

	    def _build_messages(self, prompt: str, conversation_history: List[Dict]) -> List[Dict]:
	        """Build the ``messages`` list sent to the chat endpoint.

	        Only history entries that are dicts with both ``role`` and
	        ``content`` are kept, reduced to those two keys with the content
	        coerced to ``str``. The prompt is appended as a user message unless
	        the last kept message already has identical content.
	        """
	        messages = [
	            {"role": entry["role"], "content": str(entry["content"])}
	            for entry in (conversation_history or [])
	            if isinstance(entry, dict) and "role" in entry and "content" in entry
	        ]
	        # Add the current prompt if not already in history.
	        if not messages or messages[-1]["content"] != prompt:
	            messages.append({"role": "user", "content": prompt})
	        return messages

	    def generate(self, prompt: str, conversation_history: List[Dict]) -> Optional[str]:
	        """Generate a response synchronously.

	        Returns:
	            The generated text, or ``None`` if the call (including the
	            retry helper) raised; the failure is logged.
	        """
	        try:
	            return self._retry_with_backoff(self._generate_impl, prompt, conversation_history)
	        except Exception as e:
	            logger.error("Ollama generation failed: %s", e)
	            return None

	    def stream_generate(self, prompt: str, conversation_history: List[Dict]) -> Optional[Union[str, List[str]]]:
	        """Generate a response using the streaming endpoint.

	        Returns:
	            The list of content chunks collected from the stream, or
	            ``None`` if the call raised; the failure is logged.
	        """
	        try:
	            return self._retry_with_backoff(self._stream_generate_impl, prompt, conversation_history)
	        except Exception as e:
	            logger.error("Ollama stream generation failed: %s", e)
	            return None

	    def validate_model(self) -> bool:
	        """Check whether the configured model is available on the server.

	        Queries ``/api/tags`` and compares model names after normalising a
	        missing tag to ``:latest`` on both sides, so ``"llama3"`` matches a
	        listed ``"llama3:latest"``. If the tags endpoint answers 404, the
	        check falls back to whether the server root answers 200, which only
	        confirms reachability and not the model itself.

	        Returns:
	            ``True`` when the model (or, on the fallback path, the server)
	            is found; ``False`` otherwise, including on any error.
	        """
	        try:
	            response = requests.get(
	                f"{self.host}/api/tags",
	                headers=self.headers,
	                timeout=self.timeout,
	            )
	            if response.status_code == 200:
	                models = response.json().get("models") or []
	                wanted = self._with_default_tag(self.model_name)
	                for model in models:
	                    listed = model.get("name")
	                    if listed and self._with_default_tag(listed) == wanted:
	                        return True
	                return False
	            if response.status_code == 404:
	                # Try alternative endpoint: the bare server root.
	                fallback = requests.get(
	                    f"{self.host}",
	                    headers=self.headers,
	                    timeout=self.timeout,
	                )
	                return fallback.status_code == 200
	            return False
	        except Exception as e:
	            logger.error("Model validation failed: %s", e)
	            return False

	    def _generate_impl(self, prompt: str, conversation_history: List[Dict]) -> str:
	        """Send one non-streaming chat request and return the reply text.

	        Returns:
	            ``result["message"]["content"]`` when present, else
	            ``result["response"]``, else the whole decoded body as a string.

	        Raises:
	            Exception: On any request failure or unexpected response shape,
	                chained to the underlying error.
	        """
	        url = f"{self.host}/api/chat"
	        payload = {
	            "model": self.model_name,
	            "messages": self._build_messages(prompt, conversation_history),
	            "stream": False,
	        }

	        logger.info("Ollama request URL: %s", url)
	        # Payload and bodies contain user conversation text, so they are
	        # logged at DEBUG rather than INFO to keep them out of routine logs.
	        logger.debug("Ollama request payload: %s", payload)
	        logger.debug("Ollama headers: %s", self.headers)

	        try:
	            response = requests.post(
	                url,
	                json=payload,
	                headers=self.headers,
	                timeout=self.timeout,
	            )
	            logger.info("Ollama response status: %s", response.status_code)
	            logger.debug("Ollama response headers: %s", dict(response.headers))

	            response.raise_for_status()
	            result = response.json()
	            logger.debug("Ollama response body: %s", result)

	            # Extract content properly.
	            if "message" in result and "content" in result["message"]:
	                content = result["message"]["content"]
	                logger.debug("Extracted content: %s", content[:100] if content else "None")
	                return content
	            if "response" in result:
	                content = result["response"]
	                logger.debug("Extracted response: %s", content[:100] if content else "None")
	                return content
	            content = str(result)
	            logger.debug("Raw result as string: %s", content[:100])
	            return content

	        except requests.exceptions.RequestException as e:
	            logger.error("Ollama API request error: %s", e)
	            raise Exception(f"Ollama API error: {str(e)}") from e
	        except Exception as e:
	            logger.error("Failed to parse Ollama response: %s", e)
	            raise Exception(f"Failed to parse Ollama response: {str(e)}") from e

	    def _stream_generate_impl(self, prompt: str, conversation_history: List[Dict]) -> List[str]:
	        """Send one streaming chat request and collect the content chunks.

	        Each non-empty response line is decoded as a JSON object and its
	        ``message.content`` value, when non-empty, is appended to the result.
	        Lines that cannot be decoded are logged and skipped.

	        Returns:
	            The content chunks in arrival order (possibly empty).

	        Raises:
	            requests.exceptions.RequestException: On connection failure or
	                a non-success HTTP status.
	        """
	        url = f"{self.host}/api/chat"
	        payload = {
	            "model": self.model_name,
	            "messages": self._build_messages(prompt, conversation_history),
	            "stream": True,
	        }
	        chunks: List[str] = []
	        # The context manager releases the connection even if parsing or
	        # the status check raises part-way through the stream.
	        with requests.post(
	            url,
	            json=payload,
	            headers=self.headers,
	            timeout=self.timeout,
	            stream=True,
	        ) as response:
	            response.raise_for_status()
	            for line in response.iter_lines():
	                if not line:
	                    continue
	                # SECURITY: this previously used eval() on data received
	                # from the network, which allows remote code execution and
	                # also fails on the JSON literals true/false/null. Parse it
	                # as JSON instead.
	                try:
	                    data = json.loads(line.decode("utf-8"))
	                except ValueError:
	                    logger.warning("Skipping malformed Ollama stream line: %r", line[:200])
	                    continue
	                if not isinstance(data, dict):
	                    continue
	                if data.get("error"):
	                    logger.error("Ollama stream reported an error: %s", data["error"])
	                    continue
	                message = data.get("message")
	                content = message.get("content", "") if isinstance(message, dict) else ""
	                if content:
	                    chunks.append(content)
	        return chunks