Spaces:

Refat81
/

Social_Media_Data_Extractor_Chatbot

Sleeping

App Files Files Community

Refat81 committed on Oct 21

Commit

6bf8f95

verified ·

1 Parent(s): 77ccd8c

Update pages/facebook_extractor_pro.py

Browse files

Files changed (1) hide show

pages/facebook_extractor_pro.py +233 -83

pages/facebook_extractor_pro.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# let_deploy.py
 import streamlit as st
 import time
 from bs4 import BeautifulSoup
@@ -81,6 +81,20 @@ st.markdown("""
         background: #374151;
         color: white;
     }
 </style>
 """, unsafe_allow_html=True)
@@ -175,6 +189,10 @@ class FacebookDataExtractor:
             og_description = soup.find('meta', property='og:description')
             og_image = soup.find('meta', property='og:image')
             # Structure the extracted data
             extracted_data = {
                 "page_info": {
@@ -183,7 +201,11 @@ class FacebookDataExtractor:
                     "og_title": og_title['content'] if og_title else "",
                     "og_description": og_description['content'] if og_description else "",
                     "og_image": og_image['content'] if og_image else "",
-                    "url": url
                 },
                 "content_blocks": self._extract_content_blocks(clean_text),
                 "extraction_time": datetime.now().isoformat(),
@@ -208,18 +230,42 @@ class FacebookDataExtractor:
         # Split into paragraphs/sentences
         paragraphs = [p.strip() for p in text.split('.') if p.strip()]
-        for i, paragraph in enumerate(paragraphs[:20]):  # Limit to first 20 paragraphs
             if len(paragraph) > 30:  # Only include substantial content
                 block = {
                     "id": i + 1,
                     "content": paragraph,
                     "length": len(paragraph),
-                    "word_count": len(paragraph.split())
                 }
                 blocks.append(block)
         return blocks
     def analyze_facebook_url(self, url: str) -> str:
         """Analyze Facebook URL and return structured information"""
         url_lower = url.lower()
@@ -232,6 +278,8 @@ class FacebookDataExtractor:
             return "Facebook Event (Limited access)"
         elif 'profile' in url_lower or 'user' in url_lower:
             return "Facebook Profile (Limited access - requires login)"
         else:
             return "Facebook Content (General)"
@@ -241,29 +289,49 @@ def process_extracted_data(extracted_data: dict):
         return None, []
     # Combine all content into a single text
-    all_text = f"Page Title: {extracted_data['page_info']['title']}\n\n"
-    if extracted_data['page_info']['description']:
-        all_text += f"Description: {extracted_data['page_info']['description']}\n\n"
-    if extracted_data['page_info']['og_description']:
-        all_text += f"OpenGraph Description: {extracted_data['page_info']['og_description']}\n\n"
-    all_text += f"Data Type: {extracted_data['data_type']}\n"
     all_text += f"Extraction Time: {extracted_data['extraction_time']}\n"
-    all_text += f"Content Blocks: {len(extracted_data['content_blocks'])}\n\n"
-    # Add content blocks
     for i, block in enumerate(extracted_data['content_blocks']):
-        all_text += f"--- Content Block {i+1} ---\n"
-        all_text += f"Words: {block['word_count']} | Characters: {block['length']}\n"
-        all_text += f"Content: {block['content']}\n\n"
     # Split into chunks
     splitter = CharacterTextSplitter(
         separator="\n",
-        chunk_size=800,
-        chunk_overlap=150,
         length_function=len
     )
@@ -296,7 +364,7 @@ def create_chatbot(vectorstore):
         chain = ConversationalRetrievalChain.from_llm(
             llm=llm,
-            retriever=vectorstore.as_retriever(search_kwargs={"k": 3}),
             memory=memory,
             return_source_documents=True,
             output_key="answer"
@@ -327,6 +395,48 @@ def display_status_indicator(status: str, message: str):
     </div>
     """, unsafe_allow_html=True)
 def main():
     """Main application function"""
@@ -334,7 +444,7 @@ def main():
     st.markdown("""
     <div class="main-header">
         <h1 style="margin:0; font-size: 2.5rem;">🔥 Facebook Extractor 2.0</h1>
-        <p style="margin:0; opacity: 0.9; font-size: 1.2rem;">Enhanced Version - AI-Powered Analysis</p>
     </div>
     """, unsafe_allow_html=True)
@@ -373,7 +483,7 @@ def main():
     # Sidebar
     with st.sidebar:
-        st.markdown("### ⚙️ Configuration")
         # URL input
         st.subheader("🔗 Facebook URL")
@@ -386,27 +496,35 @@ def main():
         # Data type selection
         data_type = st.selectbox(
             "Content Type",
-            ["page", "group", "profile", "event", "post"],
             help="Select the type of Facebook content"
         )
         # Extraction settings
-        st.subheader("🔧 Settings")
         analyze_depth = st.select_slider(
             "Analysis Depth",
-            options=["Basic", "Standard", "Detailed"],
-            value="Standard"
         )
         # Extract button
-        if st.button("🚀 Extract & Analyze", type="primary", use_container_width=True):
             if not facebook_url.strip():
                 st.warning("⚠️ Please enter a Facebook URL")
             elif not facebook_url.startswith('https://www.facebook.com/'):
                 st.error("❌ Please enter a valid Facebook URL")
             else:
                 st.session_state.processing = True
-                with st.spinner("🔄 Extracting data from Facebook..."):
                     extracted_data = st.session_state.extractor.extract_public_data(facebook_url, data_type)
                     if extracted_data.get("status") == "success":
@@ -419,6 +537,7 @@ def main():
                             st.session_state.chatbot = create_chatbot(vectorstore)
                             st.session_state.chat_history = []
                             st.success(f"✅ Successfully processed {len(chunks)} content chunks!")
                         else:
                             st.error("❌ Failed to process extracted data")
                     else:
@@ -430,150 +549,181 @@ def main():
         # Chat management
         if st.session_state.chatbot and st.session_state.extracted_data:
             st.markdown("---")
-            st.subheader("💬 Chat Management")
-            if st.button("🗑️ Clear Chat History", type="secondary", use_container_width=True):
-                clear_chat_history()
     # Main content area
     col1, col2 = st.columns([1, 1])
     with col1:
-        st.markdown("### 📊 Extraction Results")
         if st.session_state.processing:
-            display_status_indicator("warning", "🔄 Processing...")
-            st.info("Extracting data from Facebook. This may take a few seconds.")
         elif st.session_state.extracted_data:
             data = st.session_state.extracted_data
             page_info = data['page_info']
             content_blocks = data['content_blocks']
-            display_status_indicator("success", "✅ Extraction Complete")
             # Display page info
-            st.markdown("#### 🏷️ Page Information")
             st.write(f"**Title:** {page_info['title']}")
             if page_info['description']:
-                st.write(f"**Description:** {page_info['description'][:200]}...")
             if page_info['og_description']:
-                st.write(f"**OG Description:** {page_info['og_description'][:200]}...")
             st.write(f"**URL:** {page_info['url']}")
             st.write(f"**Data Type:** {data['data_type'].title()}")
             st.write(f"**Content Blocks:** {len(content_blocks)}")
             st.write(f"**Extraction Time:** {data['extraction_time'][:19]}")
-            # Display sample content
-            st.markdown("#### 📝 Sample Content")
-            for i, block in enumerate(content_blocks[:3]):
-                with st.expander(f"Content Block {i+1} ({block['word_count']} words)"):
-                    st.write(block['content'])
-            if len(content_blocks) > 3:
-                st.info(f"📄 And {len(content_blocks) - 3} more content blocks...")
         else:
-            display_status_indicator("warning", "⏳ Ready for Extraction")
             st.info("""
-            **To get started:**
-            1. Enter a Facebook URL in the sidebar
-            2. Select content type
-            3. Click "Extract & Analyze"
-            **Supported URLs:**
-            - 🏢 Facebook Pages (best results)
-            - 📘 Public Groups (limited)
-            - 👤 Public Profiles (limited)
-            - 🎉 Events (limited)
-            - 📝 Posts (limited)
-            **Note:** This version extracts public data only.
-            Private content requires manual login (available in local deployment).
             """)
     with col2:
-        st.markdown("### 💬 AI Analysis")
         if st.session_state.chatbot and st.session_state.extracted_data:
             # Display chat history
             for i, chat in enumerate(st.session_state.chat_history):
                 if chat["role"] == "user":
-                    st.markdown(f'<div class="chat-message user-message"><strong>👤 You:</strong> {chat["content"]}</div>',
                                unsafe_allow_html=True)
                 elif chat["role"] == "assistant":
-                    st.markdown(f'<div class="chat-message assistant-message"><strong>🤖 Assistant:</strong> {chat["content"]}</div>',
                                unsafe_allow_html=True)
             # Chat input
-            user_input = st.chat_input("Ask about the Facebook data...")
             if user_input:
                 # Add user message
                 st.session_state.chat_history.append({"role": "user", "content": user_input})
                 # Generate AI response
-                with st.spinner("🤔 Analyzing..."):
                     try:
                         response = st.session_state.chatbot.invoke({"question": user_input})
-                        answer = response.get("answer", "I couldn't generate a response based on the available data.")
                         st.session_state.chat_history.append({"role": "assistant", "content": answer})
                         st.rerun()
                     except Exception as e:
-                        error_msg = f"❌ Error generating response: {str(e)}"
                         st.session_state.chat_history.append({"role": "assistant", "content": error_msg})
                         st.rerun()
-            # Suggested questions
             if not st.session_state.chat_history:
-                st.markdown("#### 💡 Suggested Questions")
                 suggestions = [
-                    "Summarize the main content of this page",
-                    "What is this page primarily about?",
-                    "Extract key information from the content",
-                    "What are the main topics discussed?",
-                    "Provide an overview of this Facebook content"
                 ]
                 for suggestion in suggestions:
-                    if st.button(suggestion, key=f"suggest_{suggestion}", use_container_width=True):
-                        st.info(f"💡 Try asking: '{suggestion}'")
         elif st.session_state.extracted_data:
-            st.info("💬 Extract data first to start chatting with AI")
         else:
-            st.info("🔍 Extract Facebook data to enable AI analysis")
-    # Features section
     st.markdown("---")
-    st.markdown("### 🚀 Enhanced Features")
-    feature_cols = st.columns(3)
     with feature_cols[0]:
         st.markdown("""
         <div class="feature-card">
-            <h4>🔍 Smart Extraction</h4>
-            <p>Advanced algorithms for better content recognition and structure analysis</p>
         </div>
         """, unsafe_allow_html=True)
     with feature_cols[1]:
         st.markdown("""
         <div class="feature-card">
-            <h4>🤖 AI-Powered Analysis</h4>
-            <p>HuggingFace integration for intelligent content understanding and Q&A</p>
         </div>
         """, unsafe_allow_html=True)
     with feature_cols[2]:
         st.markdown("""
         <div class="feature-card">
-            <h4>💬 Contextual Memory</h4>
-            <p>Maintains conversation context for more meaningful interactions</p>
         </div>
         """, unsafe_allow_html=True)

+# pages/facebook_extractor_pro.py
 import streamlit as st
 import time
 from bs4 import BeautifulSoup
         background: #374151;
         color: white;
     }
+    .extraction-card {
+        background: linear-gradient(135deg, #1e3c72, #2a5298);
+        padding: 1.5rem;
+        border-radius: 10px;
+        margin: 1rem 0;
+        border-left: 4px solid #FF6B35;
+    }
+    .metric-card {
+        background: #262730;
+        padding: 1rem;
+        border-radius: 8px;
+        text-align: center;
+        border: 1px solid #444;
+    }
 </style>
 """, unsafe_allow_html=True)
             og_description = soup.find('meta', property='og:description')
             og_image = soup.find('meta', property='og:image')
+            # Extract additional metadata
+            keywords = soup.find('meta', attrs={'name': 'keywords'})
+            viewport = soup.find('meta', attrs={'name': 'viewport'})
             # Structure the extracted data
             extracted_data = {
                 "page_info": {
                     "og_title": og_title['content'] if og_title else "",
                     "og_description": og_description['content'] if og_description else "",
                     "og_image": og_image['content'] if og_image else "",
+                    "keywords": keywords['content'] if keywords else "",
+                    "viewport": viewport['content'] if viewport else "",
+                    "url": url,
+                    "response_code": response.status_code,
+                    "content_length": len(response.text)
                 },
                 "content_blocks": self._extract_content_blocks(clean_text),
                 "extraction_time": datetime.now().isoformat(),
         # Split into paragraphs/sentences
         paragraphs = [p.strip() for p in text.split('.') if p.strip()]
+        for i, paragraph in enumerate(paragraphs[:25]):  # Limit to first 25 paragraphs
             if len(paragraph) > 30:  # Only include substantial content
+                # Analyze content type
+                content_type = self._analyze_content_type(paragraph)
                 block = {
                     "id": i + 1,
                     "content": paragraph,
                     "length": len(paragraph),
+                    "word_count": len(paragraph.split()),
+                    "content_type": content_type,
+                    "has_links": 'http' in paragraph.lower(),
+                    "has_mentions": '@' in paragraph,
+                    "has_hashtags": '#' in paragraph
                 }
                 blocks.append(block)
         return blocks
+    def _analyze_content_type(self, text: str) -> str:
+        """Analyze the type of content"""
+        text_lower = text.lower()
+        if any(word in text_lower for word in ['login', 'sign in', 'password', 'email']):
+            return "authentication"
+        elif any(word in text_lower for word in ['post', 'share', 'comment', 'like']):
+            return "social_interaction"
+        elif any(word in text_lower for word in ['group', 'community', 'member']):
+            return "community"
+        elif any(word in text_lower for word in ['event', 'calendar', 'date', 'time']):
+            return "event"
+        elif any(word in text_lower for word in ['marketplace', 'buy', 'sell', 'price']):
+            return "commerce"
+        else:
+            return "general"
     def analyze_facebook_url(self, url: str) -> str:
         """Analyze Facebook URL and return structured information"""
         url_lower = url.lower()
             return "Facebook Event (Limited access)"
         elif 'profile' in url_lower or 'user' in url_lower:
             return "Facebook Profile (Limited access - requires login)"
+        elif 'marketplace' in url_lower:
+            return "Facebook Marketplace (Limited access)"
         else:
             return "Facebook Content (General)"
         return None, []
     # Combine all content into a single text
+    all_text = f"FACEBOOK DATA EXTRACTION REPORT\n"
+    all_text += "=" * 60 + "\n\n"
+    page_info = extracted_data['page_info']
+    all_text += f"📄 PAGE INFORMATION:\n"
+    all_text += f"Title: {page_info['title']}\n"
+    if page_info['description']:
+        all_text += f"Description: {page_info['description']}\n"
+    if page_info['og_description']:
+        all_text += f"OpenGraph: {page_info['og_description']}\n"
+    all_text += f"URL: {page_info['url']}\n"
+    all_text += f"Data Type: {extracted_data['data_type'].upper()}\n"
     all_text += f"Extraction Time: {extracted_data['extraction_time']}\n"
+    all_text += f"Response Code: {page_info['response_code']}\n"
+    all_text += f"Content Length: {page_info['content_length']} characters\n\n"
+    all_text += f"📊 CONTENT ANALYSIS:\n"
+    all_text += f"Total Content Blocks: {len(extracted_data['content_blocks'])}\n\n"
+    # Add content blocks with enhanced information
     for i, block in enumerate(extracted_data['content_blocks']):
+        all_text += f"--- BLOCK {i+1} ---\n"
+        all_text += f"Type: {block['content_type'].upper()}\n"
+        all_text += f"Words: {block['word_count']} | Chars: {block['length']}\n"
+        all_text += f"Features: "
+        features = []
+        if block['has_links']: features.append("Links")
+        if block['has_mentions']: features.append("Mentions")
+        if block['has_hashtags']: features.append("Hashtags")
+        all_text += ", ".join(features) if features else "None"
+        all_text += f"\nContent: {block['content']}\n\n"
+    all_text += "=" * 60 + "\n"
+    all_text += "END OF EXTRACTION REPORT"
     # Split into chunks
     splitter = CharacterTextSplitter(
         separator="\n",
+        chunk_size=1000,
+        chunk_overlap=200,
         length_function=len
     )
         chain = ConversationalRetrievalChain.from_llm(
             llm=llm,
+            retriever=vectorstore.as_retriever(search_kwargs={"k": 4}),
             memory=memory,
             return_source_documents=True,
             output_key="answer"
     </div>
     """, unsafe_allow_html=True)
+def display_metrics(extracted_data):
+    """Display extraction metrics"""
+    if not extracted_data:
+        return
+    page_info = extracted_data['page_info']
+    content_blocks = extracted_data['content_blocks']
+    col1, col2, col3, col4 = st.columns(4)
+    with col1:
+        st.markdown("""
+        <div class="metric-card">
+            <h3>📄 Content Blocks</h3>
+            <h2>{}</h2>
+        </div>
+        """.format(len(content_blocks)), unsafe_allow_html=True)
+    with col2:
+        st.markdown("""
+        <div class="metric-card">
+            <h3>📊 Total Words</h3>
+            <h2>{}</h2>
+        </div>
+        """.format(sum(block['word_count'] for block in content_blocks)), unsafe_allow_html=True)
+    with col3:
+        st.markdown("""
+        <div class="metric-card">
+            <h3>🔗 Links Found</h3>
+            <h2>{}</h2>
+        </div>
+        """.format(sum(1 for block in content_blocks if block['has_links'])), unsafe_allow_html=True)
+    with col4:
+        st.markdown("""
+        <div class="metric-card">
+            <h3>⏱️ Response Code</h3>
+            <h2>{}</h2>
+        </div>
+        """.format(page_info['response_code']), unsafe_allow_html=True)
 def main():
     """Main application function"""
     st.markdown("""
     <div class="main-header">
         <h1 style="margin:0; font-size: 2.5rem;">🔥 Facebook Extractor 2.0</h1>
+        <p style="margin:0; opacity: 0.9; font-size: 1.2rem;">Professional Version - Enhanced AI-Powered Analysis</p>
     </div>
     """, unsafe_allow_html=True)
     # Sidebar
     with st.sidebar:
+        st.markdown("### ⚙️ Professional Configuration")
         # URL input
         st.subheader("🔗 Facebook URL")
         # Data type selection
         data_type = st.selectbox(
             "Content Type",
+            ["page", "group", "profile", "event", "post", "marketplace"],
             help="Select the type of Facebook content"
         )
         # Extraction settings
+        st.subheader("🔧 Advanced Settings")
         analyze_depth = st.select_slider(
             "Analysis Depth",
+            options=["Basic", "Standard", "Detailed", "Comprehensive"],
+            value="Detailed"
+        )
+        content_limit = st.slider(
+            "Max Content Blocks",
+            min_value=10,
+            max_value=50,
+            value=25,
+            help="Limit the number of content blocks extracted"
         )
         # Extract button
+        if st.button("🚀 Advanced Extraction", type="primary", use_container_width=True):
             if not facebook_url.strip():
                 st.warning("⚠️ Please enter a Facebook URL")
             elif not facebook_url.startswith('https://www.facebook.com/'):
                 st.error("❌ Please enter a valid Facebook URL")
             else:
                 st.session_state.processing = True
+                with st.spinner("🔄 Performing advanced data extraction..."):
                     extracted_data = st.session_state.extractor.extract_public_data(facebook_url, data_type)
                     if extracted_data.get("status") == "success":
                             st.session_state.chatbot = create_chatbot(vectorstore)
                             st.session_state.chat_history = []
                             st.success(f"✅ Successfully processed {len(chunks)} content chunks!")
+                            st.balloons()
                         else:
                             st.error("❌ Failed to process extracted data")
                     else:
         # Chat management
         if st.session_state.chatbot and st.session_state.extracted_data:
             st.markdown("---")
+            st.subheader("💬 Professional Chat")
+            col1, col2 = st.columns(2)
+            with col1:
+                if st.button("🗑️ Clear History", type="secondary", use_container_width=True):
+                    clear_chat_history()
+            with col2:
+                if st.button("📊 Export Data", type="secondary", use_container_width=True):
+                    st.info("📄 Data export feature - Coming soon!")
     # Main content area
     col1, col2 = st.columns([1, 1])
     with col1:
+        st.markdown("### 📊 Professional Analysis")
         if st.session_state.processing:
+            display_status_indicator("warning", "🔄 Advanced Processing...")
+            st.info("Performing comprehensive data extraction and analysis...")
         elif st.session_state.extracted_data:
             data = st.session_state.extracted_data
             page_info = data['page_info']
             content_blocks = data['content_blocks']
+            display_status_indicator("success", "✅ Professional Extraction Complete")
+            # Display metrics
+            display_metrics(data)
             # Display page info
+            st.markdown("""
+            <div class="extraction-card">
+                <h4>🏷️ Page Information</h4>
+            </div>
+            """, unsafe_allow_html=True)
             st.write(f"**Title:** {page_info['title']}")
             if page_info['description']:
+                st.write(f"**Description:** {page_info['description']}")
             if page_info['og_description']:
+                st.write(f"**OpenGraph:** {page_info['og_description']}")
             st.write(f"**URL:** {page_info['url']}")
             st.write(f"**Data Type:** {data['data_type'].title()}")
             st.write(f"**Content Blocks:** {len(content_blocks)}")
             st.write(f"**Extraction Time:** {data['extraction_time'][:19]}")
+            st.write(f"**Response Code:** {page_info['response_code']}")
+            # Display content analysis
+            st.markdown("#### 📝 Content Analysis")
+            for i, block in enumerate(content_blocks[:5]):
+                with st.expander(f"Block {i+1} - {block['content_type'].title()} ({block['word_count']} words)"):
+                    st.write(f"**Content:** {block['content']}")
+                    st.caption(f"Features: {', '.join(['Links' if block['has_links'] else '', 'Mentions' if block['has_mentions'] else '', 'Hashtags' if block['has_hashtags'] else '']).strip() or 'None'}")
+            if len(content_blocks) > 5:
+                st.info(f"📄 And {len(content_blocks) - 5} more content blocks analyzed...")
         else:
+            display_status_indicator("warning", "⏳ Ready for Professional Extraction")
             st.info("""
+            **🚀 Professional Features:**
+            1. **Advanced URL Analysis** - Intelligent content type detection
+            2. **Enhanced Metadata Extraction** - OpenGraph, keywords, descriptions
+            3. **Content Classification** - Automatic content type categorization
+            4. **Comprehensive Analytics** - Word counts, link analysis, feature detection
+            5. **AI-Powered Insights** - Advanced conversational analysis
+            **📊 Supported Content Types:**
+            - 🏢 Facebook Pages (optimal results)
+            - 📘 Public Groups (enhanced analysis)
+            - 👤 Public Profiles (comprehensive data)
+            - 🎉 Events (detailed extraction)
+            - 📝 Posts (advanced content analysis)
+            - 🛒 Marketplace (commerce detection)
+            **🔧 Professional Tools:**
+            - Multi-level analysis depth
+            - Content block limiting
+            - Real-time metrics
+            - Export capabilities
             """)
     with col2:
+        st.markdown("### 💬 Professional AI Chat")
         if st.session_state.chatbot and st.session_state.extracted_data:
             # Display chat history
             for i, chat in enumerate(st.session_state.chat_history):
                 if chat["role"] == "user":
+                    st.markdown(f'<div class="chat-message user-message"><strong>👤 Professional Analyst:</strong> {chat["content"]}</div>',
                                unsafe_allow_html=True)
                 elif chat["role"] == "assistant":
+                    st.markdown(f'<div class="chat-message assistant-message"><strong>🤖 AI Assistant:</strong> {chat["content"]}</div>',
                                unsafe_allow_html=True)
             # Chat input
+            user_input = st.chat_input("Ask professional questions about the Facebook data...")
             if user_input:
                 # Add user message
                 st.session_state.chat_history.append({"role": "user", "content": user_input})
                 # Generate AI response
+                with st.spinner("🤔 Performing professional analysis..."):
                     try:
                         response = st.session_state.chatbot.invoke({"question": user_input})
+                        answer = response.get("answer", "I couldn't generate a professional response based on the available data.")
                         st.session_state.chat_history.append({"role": "assistant", "content": answer})
                         st.rerun()
                     except Exception as e:
+                        error_msg = f"❌ Professional analysis error: {str(e)}"
                         st.session_state.chat_history.append({"role": "assistant", "content": error_msg})
                         st.rerun()
+            # Professional suggested questions
             if not st.session_state.chat_history:
+                st.markdown("#### 💡 Professional Questions")
                 suggestions = [
+                    "Provide a comprehensive analysis of this page",
+                    "What are the key content patterns and themes?",
+                    "Analyze the engagement potential of this content",
+                    "Extract business intelligence from this data",
+                    "What marketing insights can be derived?",
+                    "Perform competitor analysis based on this content"
                 ]
                 for suggestion in suggestions:
+                    if st.button(suggestion, key=f"pro_suggest_{suggestion}", use_container_width=True):
+                        st.info(f"💡 Professional question: '{suggestion}'")
         elif st.session_state.extracted_data:
+            st.info("💬 Start a professional conversation with the AI assistant")
         else:
+            st.info("🔍 Perform data extraction to enable professional AI analysis")
+    # Professional features section
     st.markdown("---")
+    st.markdown("### 🚀 Professional Features")
+    feature_cols = st.columns(4)
     with feature_cols[0]:
         st.markdown("""
         <div class="feature-card">
+            <h4>🔍 Advanced Extraction</h4>
+            <p>Multi-layer content analysis with intelligent pattern recognition</p>
         </div>
         """, unsafe_allow_html=True)
     with feature_cols[1]:
         st.markdown("""
         <div class="feature-card">
+            <h4>🤖 AI Intelligence</h4>
+            <p>Professional-grade analysis with contextual understanding</p>
         </div>
         """, unsafe_allow_html=True)
     with feature_cols[2]:
         st.markdown("""
         <div class="feature-card">
+            <h4>📊 Analytics Dashboard</h4>
+            <p>Comprehensive metrics and real-time data visualization</p>
+        </div>
+        """, unsafe_allow_html=True)
+    with feature_cols[3]:
+        st.markdown("""
+        <div class="feature-card">
+            <h4>💬 Professional Chat</h4>
+            <p>Advanced conversational AI for business insights</p>
         </div>
         """, unsafe_allow_html=True)