Spaces:

rohannsinghal
/

hackrx6.0-final

Paused

App Files Files Community

rohannsinghal committed on Aug 8, 2025

Commit

0c4f4d8

1 Parent(s): f479732

made changes to main_api.py

Browse files

Files changed (2) hide show

app/main_api.py +298 -57
run.py +6 -4

app/main_api.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# --- FIXED main_api.py ---
 import psutil
 import os
@@ -10,13 +10,15 @@ from typing import List, Dict, Any, Optional
 import logging
 import asyncio
 from collections import defaultdict
 # FastAPI and core dependencies
 from fastapi import FastAPI, Body, HTTPException, Request
 from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
-# LangChain imports
 from langchain_community.embeddings import HuggingFaceEmbeddings
 from langchain_community.vectorstores import Chroma
 from langchain.chains import RetrievalQA
@@ -25,11 +27,18 @@ from langchain.llms.base import LLM
 from langchain.callbacks.manager import CallbackManagerForLLMRun
 from langchain.schema.document import Document as LangChainDocument
 # LLM Integration
 import groq
-# Document processing and environment
-from .parser import FastDocumentParserService  # Fixed import
 import httpx
 from dotenv import load_dotenv
@@ -38,7 +47,7 @@ load_dotenv()
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
-app = FastAPI(title="Fixed RAG System", version="1.0.0")
 # CORS Middleware
 app.add_middleware(
@@ -46,7 +55,245 @@ app.add_middleware(
     allow_origins=["*"], allow_credentials=True, allow_methods=["*"], allow_headers=["*"],
 )
-# --- CUSTOM GROQ LLM FOR LANGCHAIN ---
 class GroqLLM(LLM):
     """Custom Groq LLM wrapper for LangChain"""
     groq_client: Any
@@ -66,8 +313,8 @@ class GroqLLM(LLM):
             response = self.groq_client.chat.completions.create(
                 model="llama-3.3-70b-versatile",
                 messages=[{"role": "user", "content": prompt}],
-                temperature=0.1,  # Slightly higher for more flexible responses
-                max_tokens=800,   # Increased token limit
                 top_p=0.9,
                 stop=stop
             )
@@ -75,10 +322,10 @@ class GroqLLM(LLM):
         except Exception as e:
             logger.error(f"Groq LLM call failed: {e}")
             return "Error generating response"
-# --- IMPROVED RAG PIPELINE ---
 class ImprovedRAGPipeline:
-    """Improved RAG pipeline with better debugging and retrieval."""
     def __init__(self, collection_name: str, request: Request):
         self.collection_name = collection_name
@@ -90,38 +337,35 @@ class ImprovedRAGPipeline:
             persist_directory=CHROMA_PERSIST_DIR
         )
         self.qa_chain = None
-        logger.info(f"✅ Improved RAG pipeline initialized for collection: {collection_name}")
     def add_documents(self, chunks: List[Dict[str, Any]]):
-        """Adds documents to the vectorstore and creates the QA chain."""
         if not chunks:
-            logger.error("❌ No chunks provided to add_documents!")
             return
         logger.info(f"📚 Adding {len(chunks)} chunks to vectorstore...")
-        # Debug: Log first few chunks
         for i, chunk in enumerate(chunks[:3]):
-            logger.info(f"Chunk {i}: {chunk['content'][:200]}...")
         langchain_docs = [
-            LangChainDocument(
-                page_content=chunk['content'],
-                metadata=chunk['metadata']
-            )
             for chunk in chunks
         ]
         self.vectorstore.add_documents(langchain_docs)
         logger.info(f"✅ Added {len(langchain_docs)} documents to vectorstore")
-        # Create retriever with more chunks and lower threshold
         retriever = self.vectorstore.as_retriever(
             search_type="similarity",
-            search_kwargs={"k": 10}  # Increased from 6 to 10
         )
-        # Improved prompt template - less restrictive
         prompt_template = PromptTemplate(
             input_variables=["context", "question"],
             template="""You are an expert insurance policy analyst. Use the following policy document context to answer the question.
@@ -134,6 +378,7 @@ Question: {question}
 Instructions:
 - Provide a clear, direct answer based on the policy document context above
 - If you find relevant information, provide specific details including numbers, percentages, time periods, etc.
 - If the exact answer is not in the context but related information exists, provide what you can find
 - Only say "information not available" if absolutely no relevant information exists in the context
@@ -145,36 +390,36 @@ Answer:"""
             chain_type="stuff",
             retriever=retriever,
             chain_type_kwargs={"prompt": prompt_template},
-            return_source_documents=True  # This helps with debugging
         )
-        logger.info(f"✅ QA Chain is ready with improved retrieval")
     async def answer_question(self, question: str) -> str:
         if not self.qa_chain:
             return "Error: QA chain not initialized. Please add documents first."
-        logger.info(f"🤔 Answering question: {question}")
         try:
-            # First, let's test retrieval directly
             retriever = self.vectorstore.as_retriever(search_kwargs={"k": 5})
             retrieved_docs = retriever.get_relevant_documents(question)
-            logger.info(f"🔍 Retrieved {len(retrieved_docs)} documents for question")
             for i, doc in enumerate(retrieved_docs):
-                logger.info(f"Retrieved Doc {i}: {doc.page_content[:150]}...")
-            # Now run the QA chain
             result = await asyncio.to_thread(self.qa_chain, {"query": question})
             answer = result.get("result", "Failed to get an answer.")
-            logger.info(f"✅ Generated answer: {answer[:200]}...")
             return answer
         except Exception as e:
-            logger.error(f"❌ Error during QA chain execution: {e}")
             return "An error occurred while processing the question."
-# --- GROQ API KEY MANAGER (unchanged) ---
 class GroqAPIKeyManager:
     def __init__(self, api_keys: List[str]):
         self.api_keys = [key.strip() for key in api_keys if key.strip()]
@@ -182,7 +427,7 @@ class GroqAPIKeyManager:
         self.key_last_used = defaultdict(float)
         self.current_key_index = 0
         self.max_requests_per_key = 45
-        logger.info(f"🔑 API Key Manager initialized with {len(self.api_keys)} keys")
     def get_next_api_key(self):
         current_time = time.time()
@@ -196,14 +441,11 @@ class GroqAPIKeyManager:
         self.key_usage_count[best_key] += 1
         self.key_last_used[best_key] = current_time
         return best_key
-    def get_key_stats(self):
-        return {f"...{key[-4:]}": {"usage_count": self.key_usage_count[key], "last_used": self.key_last_used[key]} for key in self.api_keys}
-# --- APP STARTUP & CONFIG ---
 GROQ_API_KEYS = os.getenv("GROQ_API_KEYS", "").split(',')
 EMBEDDING_MODEL = "BAAI/bge-small-en-v1.5"
-CHROMA_PERSIST_DIR = "./chroma_db"  # Simplified path
 UPLOAD_DIR = "/tmp/docs"
 @app.on_event("startup")
@@ -219,13 +461,13 @@ async def startup_event():
         first_key = app.state.api_key_manager.get_next_api_key()
         app.state.groq_client = groq.Groq(api_key=first_key)
         app.state.groq_llm = GroqLLM(groq_client=app.state.groq_client, api_key_manager=app.state.api_key_manager)
-        app.state.parsing_service = FastDocumentParserService()
-        logger.info("✅ All services initialized successfully!")
     except Exception as e:
-        logger.error(f"💥 FATAL: Could not initialize services. Error: {e}")
         raise e
-# --- API MODELS (unchanged) ---
 class SubmissionRequest(BaseModel):
     documents: List[str]
     questions: List[str]
@@ -237,10 +479,10 @@ class Answer(BaseModel):
 class SubmissionResponse(BaseModel):
     answers: List[Answer]
-# --- MAIN API ENDPOINT ---
 @app.post("/hackrx/run", response_model=SubmissionResponse)
 async def run_submission(request: Request, submission_request: SubmissionRequest = Body(...)):
-    logger.info(f"🎯 Processing {len(submission_request.documents)} documents and {len(submission_request.questions)} questions")
     parsing_service = request.app.state.parsing_service
     session_collection_name = f"hackrx_session_{uuid.uuid4().hex}"
@@ -251,7 +493,7 @@ async def run_submission(request: Request, submission_request: SubmissionRequest
     async with httpx.AsyncClient(timeout=120.0) as client:
         for doc_idx, doc_url in enumerate(submission_request.documents):
             try:
-                logger.info(f"📥 Downloading document {doc_idx + 1}/{len(submission_request.documents)}: {doc_url}")
                 response = await client.get(doc_url, follow_redirects=True)
                 response.raise_for_status()
@@ -267,36 +509,35 @@ async def run_submission(request: Request, submission_request: SubmissionRequest
                 chunk_dicts = [chunk.to_dict() for chunk in chunks]
                 all_chunks.extend(chunk_dicts)
-                # Clean up
                 os.remove(temp_file_path)
                 logger.info(f"✅ Processed {len(chunks)} chunks from {file_name}")
             except Exception as e:
-                logger.error(f"❌ Failed to process document at {doc_url}: {e}")
                 continue
-    logger.info(f"📊 Total chunks collected: {len(all_chunks)}")
     if not all_chunks:
-        logger.error("❌ No chunks were successfully processed!")
         failed_answers = [Answer(question=q, answer="No valid documents could be processed.") for q in submission_request.questions]
         return SubmissionResponse(answers=failed_answers)
-    # Add documents to RAG pipeline
     rag_pipeline.add_documents(all_chunks)
     # Answer questions
-    logger.info(f"❓ Answering {len(submission_request.questions)} questions...")
     tasks = [rag_pipeline.answer_question(q) for q in submission_request.questions]
     results = await asyncio.gather(*tasks)
     answers = [Answer(question=q, answer=ans) for q, ans in zip(submission_request.questions, results)]
-    logger.info(f"🎉 Successfully processed all questions!")
     return SubmissionResponse(answers=answers)
 @app.get("/")
 def read_root():
-    return {"message": "Fixed RAG System is running.", "status": "healthy"}
 @app.get("/health")
 def health_check():
@@ -305,12 +546,12 @@ def health_check():
 # Debug endpoint
 @app.post("/debug/test-chunks")
 async def test_chunks(request: Request, submission_request: SubmissionRequest = Body(...)):
-    """Debug endpoint to test document chunking"""
     parsing_service = request.app.state.parsing_service
     all_chunks = []
     async with httpx.AsyncClient(timeout=120.0) as client:
-        for doc_url in submission_request.documents[:1]:  # Test only first document
             try:
                 response = await client.get(doc_url, follow_redirects=True)
                 response.raise_for_status()
@@ -338,6 +579,6 @@ async def test_chunks(request: Request, submission_request: SubmissionRequest =
                 "content": chunk["content"][:300] + "...",
                 "metadata": chunk["metadata"]
             }
-            for chunk in all_chunks[:3]
         ]
     }

+# --- STANDALONE main_api.py with embedded parser ---
 import psutil
 import os
 import logging
 import asyncio
 from collections import defaultdict
+from pathlib import Path
+import gc
 # FastAPI and core dependencies
 from fastapi import FastAPI, Body, HTTPException, Request
 from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
+# LangChain imports (using updated non-deprecated imports)
 from langchain_community.embeddings import HuggingFaceEmbeddings
 from langchain_community.vectorstores import Chroma
 from langchain.chains import RetrievalQA
 from langchain.callbacks.manager import CallbackManagerForLLMRun
 from langchain.schema.document import Document as LangChainDocument
+# Document processing imports
+import fitz  # PyMuPDF
+import pdfplumber
+import mammoth
+import email
+import email.policy
+from bs4 import BeautifulSoup
 # LLM Integration
 import groq
+# Other dependencies
 import httpx
 from dotenv import load_dotenv
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
+app = FastAPI(title="Standalone Fixed RAG System", version="1.0.0")
 # CORS Middleware
 app.add_middleware(
     allow_origins=["*"], allow_credentials=True, allow_methods=["*"], allow_headers=["*"],
 )
+# --- EMBEDDED DOCUMENT PARSER ---
class DocumentChunk:
    """One piece of parsed document text plus its bookkeeping data.

    Attributes:
        content: The chunk's text.
        metadata: Mapping with details about the chunk, as supplied by the
            caller.
        chunk_id: Identifier string supplied by the caller.
    """

    def __init__(self, content: str, metadata: Dict[str, Any], chunk_id: str):
        self.content, self.metadata, self.chunk_id = content, metadata, chunk_id

    def to_dict(self):
        """Return the chunk as a dict keyed by content, metadata and chunk_id.

        The metadata mapping is returned as-is (not copied).
        """
        return dict(
            content=self.content,
            metadata=self.metadata,
            chunk_id=self.chunk_id,
        )
class EmbeddedDocumentParser:
    """PDF parsing service that turns a file into overlapping text chunks.

    Page text is read with PyMuPDF (``fitz``) and tables with ``pdfplumber``.
    The combined text is cut into chunks of at most ``chunk_size`` characters
    where consecutive chunks share ``chunk_overlap`` characters.
    """

    def __init__(self):
        self.chunk_size = 2000      # maximum characters per chunk
        self.chunk_overlap = 200    # characters shared by consecutive chunks
        self.max_chunks = 500       # hard cap on chunks produced per text
        # NOTE(review): not consulted by extract_tables_fast, which caps each
        # table at 30 rows on its own - confirm which limit is intended.
        self.table_row_limit = 20
        logger.info("EmbeddedDocumentParser initialized")

    @staticmethod
    def _split_with_overlap(
        text: str,
        chunk_size: int,
        chunk_overlap: int,
        max_chunks: int,
        boundary_window: int = 200,
    ) -> List[str]:
        """Cut ``text`` into stripped, overlapping chunks.

        Each chunk spans at most ``chunk_size`` characters. When a chunk does
        not reach the end of the text, its end is pulled back to just after
        the last ``.`` found within the final ``boundary_window`` characters,
        if there is one. The next chunk starts ``chunk_overlap`` characters
        before the previous chunk's end.

        Returns:
            At most ``max_chunks`` non-empty chunks, in document order.
        """
        chunks: List[str] = []
        text_len = len(text)
        start = 0
        while start < text_len and len(chunks) < max_chunks:
            end = min(start + chunk_size, text_len)
            if end < text_len:
                search_start = max(start, end - boundary_window)
                period_pos = text.rfind('.', search_start, end)
                if period_pos > search_start:
                    end = period_pos + 1
            piece = text[start:end].strip()
            if piece:
                chunks.append(piece)
            if end >= text_len:
                # The tail has been emitted. Stepping back by the overlap here
                # would re-emit the same tail until max_chunks is reached.
                break
            next_start = end - chunk_overlap
            if next_start <= start:
                # Overlap would stall or move backwards; continue from `end`
                # so the loop always makes progress.
                next_start = end
            start = next_start
        return chunks

    def fast_text_split(self, text: str, source: str) -> List[str]:
        """Split ``text`` into overlapping chunks with hard limits.

        Args:
            text: Text to split.
            source: Label used only in the log message.

        Returns:
            ``[]`` for empty text, ``[text]`` unchanged when it is shorter
            than 100 characters or fits in one chunk, otherwise at most
            ``self.max_chunks`` stripped chunks.
        """
        if not text:
            return []
        if len(text) < 100 or len(text) <= self.chunk_size:
            return [text]
        chunks = self._split_with_overlap(
            text, self.chunk_size, self.chunk_overlap, self.max_chunks
        )
        logger.info(f"Split {source} into {len(chunks)} chunks")
        return chunks

    @staticmethod
    def _table_to_markdown(table_data, table_number: int, page_number: int) -> str:
        """Render extracted table rows as a pipe-delimited text table.

        The first row is used as the header. Only the first 30 rows are kept,
        cells are cut to 60 characters, and rows shorter than the header are
        padded with empty cells.
        """
        limited_data = table_data[:30]
        header_cells = limited_data[0]
        width = len(header_cells)

        def format_cells(cells) -> str:
            return " | ".join(str(cell or "").strip()[:60] for cell in cells)

        separator = " | ".join(["---"] * width)
        lines = [
            f"\n**TABLE {table_number} - Page {page_number}**",
            f"| {format_cells(header_cells)} |",
            f"| {separator} |",
        ]
        for row in limited_data[1:]:
            padded_row = list(row) + [None] * (width - len(row))
            lines.append(f"| {format_cells(padded_row)} |")
        return "\n".join(lines) + "\n\n"

    def extract_tables_fast(self, file_path: str) -> str:
        """Extract up to 25 tables from a PDF as pipe-delimited text.

        Only the first 50 pages are considered, and longer documents are
        sampled: every page up to 20 pages, every 2nd up to 40, otherwise
        every 3rd. Tables with fewer than 2 rows or more than 6 header
        columns are ignored.

        Returns:
            The concatenated table text, or whatever was collected before a
            failure (possibly ``""``); errors are logged, not raised.
        """
        max_tables = 25
        table_sections: List[str] = []
        try:
            with pdfplumber.open(file_path) as pdf:
                total_pages = len(pdf.pages)
                if total_pages <= 20:
                    step = 1
                elif total_pages <= 40:
                    step = 2
                else:
                    step = 3
                pages_to_process = list(range(0, min(total_pages, 50), step))
                logger.info(f"📊 Processing {len(pages_to_process)} of {total_pages} pages for tables")
                for page_num in pages_to_process:
                    if len(table_sections) >= max_tables:
                        break
                    for table in pdf.pages[page_num].find_tables():
                        if len(table_sections) >= max_tables:
                            break
                        try:
                            table_data = table.extract()
                            if table_data and len(table_data) >= 2 and len(table_data[0]) <= 6:
                                table_sections.append(
                                    self._table_to_markdown(
                                        table_data, len(table_sections) + 1, page_num + 1
                                    )
                                )
                        except Exception as e:
                            # Best effort: one bad table must not lose the rest.
                            logger.warning(f"Skip table on page {page_num + 1}: {e}")
                logger.info(f"🎯 Extracted {len(table_sections)} tables")
        except Exception as e:
            logger.error(f"❌ Table extraction failed: {e}")
        return "".join(table_sections)

    def process_pdf_ultrafast(self, file_path: str) -> "List[DocumentChunk]":
        """Parse a PDF into ``DocumentChunk`` objects.

        Tables are extracted first, then page text. Documents with more than
        40 pages are sampled (every 2nd page of the first 60), and each page's
        text is cut to 10000 characters. Table text is appended after the page
        text before chunking.

        Returns:
            The chunks; on any failure the result of ``_emergency_fallback``.

        Raises:
            Exception: If the emergency fallback fails as well.
        """
        source_name = os.path.basename(file_path)
        logger.info(f"🚀 Processing PDF: {source_name}")
        start_time = time.time()
        try:
            # Extract tables
            logger.info("📊 Extracting tables...")
            table_content = self.extract_tables_fast(file_path)
            # Extract text
            logger.info("📄 Extracting text...")
            page_sections: List[str] = []
            doc = fitz.open(file_path)
            try:
                total_pages = len(doc)
                if total_pages > 40:
                    pages_to_process = list(range(0, min(total_pages, 60), 2))
                    logger.info(f"📑 Processing {len(pages_to_process)} of {total_pages} pages")
                else:
                    pages_to_process = list(range(total_pages))
                for page_num in pages_to_process:
                    try:
                        page_text = doc[page_num].get_text().strip()
                        if len(page_text) > 10000:
                            page_text = page_text[:10000] + f"\n[Page {page_num + 1} truncated]"
                        page_sections.append(f"\n\n--- Page {page_num + 1} ---\n{page_text}")
                    except Exception as e:
                        logger.warning(f"Error processing page {page_num + 1}: {e}")
            finally:
                # Release the file handle even when reading fails part-way.
                doc.close()
            full_text = "".join(page_sections)
            # Append tables
            if table_content:
                full_text += f"\n\n{'='*50}\nEXTRACTED TABLES\n{'='*50}\n{table_content}"
            # Create chunks
            logger.info("📦 Creating chunks...")
            text_chunks = self.fast_text_split(full_text, source_name)
            chunks = [
                DocumentChunk(
                    content=chunk_text,
                    metadata={
                        "source": source_name,
                        "chunk_index": idx,
                        "document_type": "pdf_ultrafast",
                        "has_tables": "**TABLE" in chunk_text or "EXTRACTED TABLES" in chunk_text,
                        "total_pages": total_pages,
                        "pages_processed": len(pages_to_process),
                    },
                    chunk_id=str(uuid.uuid4()),
                )
                for idx, chunk_text in enumerate(text_chunks)
            ]
            elapsed = time.time() - start_time
            logger.info(f"✅ Processing complete in {elapsed:.2f}s: {len(chunks)} chunks")
            return chunks
        except Exception as e:
            logger.error(f"❌ Processing failed: {e}")
            return self._emergency_fallback(file_path)

    def _emergency_fallback(self, file_path: str) -> "List[DocumentChunk]":
        """Minimal text-only parse used when the main path fails.

        Reads at most the first 10 pages (5000 characters each) and cuts the
        joined text into roughly ten equal slices without overlap.

        Raises:
            Exception: "All processing methods failed", chained to the
                underlying error, if this path fails too.
        """
        logger.info("🆘 Emergency fallback")
        try:
            text_parts = []
            doc = fitz.open(file_path)
            try:
                max_pages = min(10, len(doc))
                for page_num in range(max_pages):
                    page_text = doc[page_num].get_text()
                    if len(page_text) > 5000:
                        page_text = page_text[:5000] + f"\n[Page {page_num + 1} truncated]"
                    text_parts.append(f"Page {page_num + 1}:\n{page_text}")
            finally:
                doc.close()
            full_text = "\n\n".join(text_parts)
            # +1 keeps the step non-zero for very short (or empty) text.
            piece_size = len(full_text) // 10 + 1
            source_name = os.path.basename(file_path)
            return [
                DocumentChunk(
                    content=full_text[offset:offset + piece_size],
                    metadata={
                        "source": source_name,
                        "chunk_index": index,
                        "document_type": "pdf_emergency_fallback",
                        "has_tables": False,
                        "pages_processed": max_pages,
                    },
                    chunk_id=str(uuid.uuid4()),
                )
                for index, offset in enumerate(range(0, len(full_text), piece_size))
            ]
        except Exception as e:
            logger.error(f"Emergency fallback failed: {e}")
            raise Exception("All processing methods failed") from e
+# --- GROQ LLM WRAPPER ---
 class GroqLLM(LLM):
     """Custom Groq LLM wrapper for LangChain"""
     groq_client: Any
             response = self.groq_client.chat.completions.create(
                 model="llama-3.3-70b-versatile",
                 messages=[{"role": "user", "content": prompt}],
+                temperature=0.1,
+                max_tokens=800,
                 top_p=0.9,
                 stop=stop
             )
         except Exception as e:
             logger.error(f"Groq LLM call failed: {e}")
             return "Error generating response"
+# --- RAG PIPELINE ---
 class ImprovedRAGPipeline:
+    """Improved RAG pipeline"""
     def __init__(self, collection_name: str, request: Request):
         self.collection_name = collection_name
             persist_directory=CHROMA_PERSIST_DIR
         )
         self.qa_chain = None
+        logger.info(f"✅ RAG pipeline initialized: {collection_name}")
     def add_documents(self, chunks: List[Dict[str, Any]]):
+        """Add documents to vectorstore"""
         if not chunks:
+            logger.error("❌ No chunks provided!")
             return
         logger.info(f"📚 Adding {len(chunks)} chunks to vectorstore...")
+        # Debug first few chunks
         for i, chunk in enumerate(chunks[:3]):
+            logger.info(f"Sample chunk {i}: {chunk['content'][:200]}...")
         langchain_docs = [
+            LangChainDocument(page_content=chunk['content'], metadata=chunk['metadata'])
             for chunk in chunks
         ]
         self.vectorstore.add_documents(langchain_docs)
         logger.info(f"✅ Added {len(langchain_docs)} documents to vectorstore")
+        # Create retriever
         retriever = self.vectorstore.as_retriever(
             search_type="similarity",
+            search_kwargs={"k": 10}
         )
+        # Create prompt template - less restrictive
         prompt_template = PromptTemplate(
             input_variables=["context", "question"],
             template="""You are an expert insurance policy analyst. Use the following policy document context to answer the question.
 Instructions:
 - Provide a clear, direct answer based on the policy document context above
 - If you find relevant information, provide specific details including numbers, percentages, time periods, etc.
+- Quote exact text when possible
 - If the exact answer is not in the context but related information exists, provide what you can find
 - Only say "information not available" if absolutely no relevant information exists in the context
             chain_type="stuff",
             retriever=retriever,
             chain_type_kwargs={"prompt": prompt_template},
+            return_source_documents=True
         )
+        logger.info("✅ QA Chain ready")
     async def answer_question(self, question: str) -> str:
         if not self.qa_chain:
             return "Error: QA chain not initialized. Please add documents first."
+        logger.info(f"🤔 Answering: {question}")
         try:
+            # Test retrieval
             retriever = self.vectorstore.as_retriever(search_kwargs={"k": 5})
             retrieved_docs = retriever.get_relevant_documents(question)
+            logger.info(f"🔍 Retrieved {len(retrieved_docs)} documents")
             for i, doc in enumerate(retrieved_docs):
+                logger.info(f"Retrieved {i}: {doc.page_content[:150]}...")
+            # Run QA chain
             result = await asyncio.to_thread(self.qa_chain, {"query": question})
             answer = result.get("result", "Failed to get an answer.")
+            logger.info(f"✅ Answer: {answer[:200]}...")
             return answer
         except Exception as e:
+            logger.error(f"❌ Error during QA: {e}")
             return "An error occurred while processing the question."
+# --- API KEY MANAGER ---
 class GroqAPIKeyManager:
     def __init__(self, api_keys: List[str]):
         self.api_keys = [key.strip() for key in api_keys if key.strip()]
         self.key_last_used = defaultdict(float)
         self.current_key_index = 0
         self.max_requests_per_key = 45
+        logger.info(f"🔑 API Key Manager: {len(self.api_keys)} keys")
     def get_next_api_key(self):
         current_time = time.time()
         self.key_usage_count[best_key] += 1
         self.key_last_used[best_key] = current_time
         return best_key
+# --- CONFIGURATION ---
 GROQ_API_KEYS = os.getenv("GROQ_API_KEYS", "").split(',')
 EMBEDDING_MODEL = "BAAI/bge-small-en-v1.5"
+CHROMA_PERSIST_DIR = "./chroma_db"
 UPLOAD_DIR = "/tmp/docs"
 @app.on_event("startup")
         first_key = app.state.api_key_manager.get_next_api_key()
         app.state.groq_client = groq.Groq(api_key=first_key)
         app.state.groq_llm = GroqLLM(groq_client=app.state.groq_client, api_key_manager=app.state.api_key_manager)
+        app.state.parsing_service = EmbeddedDocumentParser()
+        logger.info("✅ All services initialized!")
     except Exception as e:
+        logger.error(f"💥 FATAL: {e}")
         raise e
+# --- API MODELS ---
 class SubmissionRequest(BaseModel):
     documents: List[str]
     questions: List[str]
 class SubmissionResponse(BaseModel):
     answers: List[Answer]
+# --- MAIN ENDPOINT ---
 @app.post("/hackrx/run", response_model=SubmissionResponse)
 async def run_submission(request: Request, submission_request: SubmissionRequest = Body(...)):
+    logger.info(f"🎯 Processing {len(submission_request.documents)} documents, {len(submission_request.questions)} questions")
     parsing_service = request.app.state.parsing_service
     session_collection_name = f"hackrx_session_{uuid.uuid4().hex}"
     async with httpx.AsyncClient(timeout=120.0) as client:
         for doc_idx, doc_url in enumerate(submission_request.documents):
             try:
+                logger.info(f"📥 Downloading document {doc_idx + 1}: {doc_url}")
                 response = await client.get(doc_url, follow_redirects=True)
                 response.raise_for_status()
                 chunk_dicts = [chunk.to_dict() for chunk in chunks]
                 all_chunks.extend(chunk_dicts)
                 os.remove(temp_file_path)
                 logger.info(f"✅ Processed {len(chunks)} chunks from {file_name}")
             except Exception as e:
+                logger.error(f"❌ Failed to process document: {e}")
                 continue
+    logger.info(f"📊 Total chunks: {len(all_chunks)}")
     if not all_chunks:
+        logger.error("❌ No chunks processed!")
         failed_answers = [Answer(question=q, answer="No valid documents could be processed.") for q in submission_request.questions]
         return SubmissionResponse(answers=failed_answers)
+    # Add to RAG pipeline
     rag_pipeline.add_documents(all_chunks)
     # Answer questions
+    logger.info(f"❓ Answering questions...")
     tasks = [rag_pipeline.answer_question(q) for q in submission_request.questions]
     results = await asyncio.gather(*tasks)
     answers = [Answer(question=q, answer=ans) for q, ans in zip(submission_request.questions, results)]
+    logger.info("🎉 All questions processed!")
     return SubmissionResponse(answers=answers)
 @app.get("/")
 def read_root():
+    return {"message": "Standalone Fixed RAG System", "status": "healthy"}
 @app.get("/health")
 def health_check():
 # Debug endpoint
 @app.post("/debug/test-chunks")
 async def test_chunks(request: Request, submission_request: SubmissionRequest = Body(...)):
+    """Debug endpoint"""
     parsing_service = request.app.state.parsing_service
     all_chunks = []
     async with httpx.AsyncClient(timeout=120.0) as client:
+        for doc_url in submission_request.documents[:1]:
             try:
                 response = await client.get(doc_url, follow_redirects=True)
                 response.raise_for_status()
                 "content": chunk["content"][:300] + "...",
                 "metadata": chunk["metadata"]
             }
+            for chunk in all_chunks[:5]  # Show more samples
         ]
     }

run.py CHANGED Viewed

@@ -1,14 +1,16 @@
-# run.py
 import uvicorn
 import os
 if __name__ == "__main__":
-    # This makes the app compatible with hosting providers like Render.
-    # It will use the PORT environment variable if it exists, otherwise it defaults to 8000.
     port = int(os.environ.get("PORT", 8000))
     print(f"🚀 Starting HackRx 6.0 RAG Server on port {port}...")
-    # Use the standard 'app.module:variable' format for Uvicorn
     uvicorn.run("app.main_api:app", host="0.0.0.0", port=port, reload=False)

+# Fixed run.py
 import uvicorn
 import os
 if __name__ == "__main__":
     # Read the port from the PORT environment variable, defaulting to 8000.
     configured_port = os.environ.get("PORT", 8000)
     port = int(configured_port)
     print(f"🚀 Starting HackRx 6.0 RAG Server on port {port}...")
     # The import string below assumes main_api.py lives in the app/ directory.
     # With main_api.py in the root directory the target is "main_api:app".
     uvicorn.run(
         "app.main_api:app",
         host="0.0.0.0",
         port=port,
         reload=False,
     )