Founder_Name_Extraction_v3

Sleeping

App Files Files Community

dygoo committed on Jun 9

Commit

054936e

verified ·

1 Parent(s): 8230bce

Update app.py

Browse files

Files changed (1) hide show

app.py +102 -122

app.py CHANGED Viewed

@@ -28,11 +28,11 @@ def check_cancellation():
     """Check if operation should be cancelled"""
     return cancel_operation.is_set()
-# === Model Functions (No changes in the first few) ===
 def extract_publication_date(soup, url):
-    """Extract publication date from article HTML - same as before"""
     try:
         date_selectors = [
             'time[datetime]', '.date', '.publish-date', '.published', '.post-date',
             '[class*="date"]', '[class*="time"]',
@@ -56,26 +56,23 @@ def extract_publication_date(soup, url):
         print(f"Date extraction error for {url}: {e}")
     return None
 def get_full_article_with_timeout(url, timeout=15):
-    """Enhanced article fetching with timeout and better error handling"""
     if check_cancellation(): return "[CANCELLED] Operation was cancelled", None
     try:
         headers = {
-            'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)',
-            'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
-            'Accept-Language': 'en-US,en;q=0.5',
-            'Connection': 'keep-alive', 'Upgrade-Insecure-Requests': '1'
         }
         response = requests.get(url, headers=headers, timeout=timeout, verify=True)
         response.raise_for_status()
         soup = BeautifulSoup(response.content, 'html.parser')
         pub_date = extract_publication_date(soup, url)
-        for element in soup(['script', 'style', 'nav', 'header', 'footer', 'aside', 'ads', 'noscript', 'form']):
-            element.decompose()
         article_selectors = [
-            'article', '.article-content', '.post-content', '.story-body', '.story-content', '.entry-content',
-            '.content-body', '.article-body', 'main article', 'main .content', 'main', '[role="main"]',
-            '.main-content', '.page-content', '.text', '.article-text'
         ]
         for selector in article_selectors:
             content = soup.select_one(selector)
@@ -92,90 +89,104 @@ def get_full_article_with_timeout(url, timeout=15):
     except requests.exceptions.RequestException as e: return f"[ERROR] Network error: {str(e)}", None
     except Exception as e: return f"[ERROR] Could not fetch article: {str(e)}", None
 def search_articles_by_timeframe_enhanced(name: str, timeframe: str, max_articles: int = 3, progress=None) -> list:
-    """Enhanced search with progress tracking and better error handling"""
     if check_cancellation(): return []
     if timeframe == "recent":
         search_queries = [f'"{name}" founder news 2024 2025', f'"{name}" CEO founder recent', f'"{name}" founder update latest']
     else:
         search_queries = [f'"{name}" founded established history', f'"{name}" founder origin story', f'"{name}" started began founder']
-    all_results, max_retries, base_delay, total_queries = [], 2, 2, len(search_queries)
     for query_idx, search_query in enumerate(search_queries):
         if len(all_results) >= max_articles or check_cancellation(): break
         if progress:
             progress((query_idx / total_queries) * 0.3, desc=f"Searching {timeframe} articles ({query_idx + 1}/{total_queries})")
         for attempt in range(max_retries):
             if check_cancellation(): return all_results
             try:
-                print(f"Search attempt {attempt + 1} for query {query_idx + 1} ({timeframe}): {search_query}")
-                if attempt > 0: time.sleep(base_delay * attempt)
                 with DDGS(timeout=15) as ddgs:
-                    results = list(ddgs.text(keywords=search_query, max_results=max_articles - len(all_results) + 2, safesearch='moderate', region='us-en'))
-                if results:
-                    existing_urls = {r.get('url', '') for r in all_results}
-                    for result in results:
-                        if len(all_results) >= max_articles: break
-                        url = result.get('href', '')
-                        if url and url not in existing_urls: all_results.append(result); existing_urls.add(url)
-                    break
             except Exception as e:
-                print(f"Attempt {attempt + 1} failed for {timeframe} query {query_idx + 1}: {str(e)}")
-                if attempt < max_retries - 1: time.sleep(base_delay * (attempt + 1))
     return all_results[:max_articles]
 def categorize_article_by_date(pub_date):
-    """Same as before"""
     if not pub_date: return "unknown"
     return "recent" if pub_date >= (datetime.now() - timedelta(days=365)) else "historical"
 def fetch_article_parallel(result, article_num, total_articles, progress=None):
-    """Fetch single article with progress update"""
     if check_cancellation(): return None
-    url, title, snippet = result.get('href', 'No URL'), result.get('title', 'No Title'), result.get('body', 'No snippet available')
-    expected_timeframe = result.get('expected_timeframe', 'unknown')
     if progress:
         progress(0.4 + (article_num / total_articles) * 0.5, desc=f"Fetching article {article_num + 1}/{total_articles}: {title[:50]}...")
     full_text, pub_date = get_full_article_with_timeout(url, timeout=12)
     if check_cancellation(): return None
     actual_timeframe = categorize_article_by_date(pub_date)
-    content = f"[SNIPPET ONLY]\n{snippet}" if any(e in str(full_text) for e in ["[ERROR]", "timeout", "[CANCELLED]"]) else full_text
-    timeframe_indicator = f"📅 **Published**: {pub_date.strftime('%B %d, %Y')} ({actual_timeframe.title()})" if pub_date else f"📅 **Timeframe**: {expected_timeframe.title()} (estimated)"
     article = f"### {article_num + 1}. {title}\n[Source]({url})\n{timeframe_indicator}\n\n{content}\n"
     return {'article': article, 'timeframe': actual_timeframe, 'url': url, 'title': title}
 def search_articles_enhanced(name: str, max_articles: int = 4, progress=None) -> str:
-    """Enhanced search with progress tracking and parallel processing"""
     reset_cancellation()
-    if progress: progress(0, desc="Initializing enhanced search...")
     recent_count, historical_count = max_articles // 2, max_articles - (max_articles // 2)
     if progress: progress(0.05, desc=f"Planning search: {recent_count} recent + {historical_count} historical")
-    recent_results = search_articles_by_timeframe_enhanced(name, "recent", recent_count, progress)
-    if check_cancellation(): return "[CANCELLED] Search was cancelled by user"
-    if progress: progress(0.3, desc="Searching for historical articles...")
     time.sleep(1)
-    historical_results = search_articles_by_timeframe_enhanced(name, "historical", historical_count, progress)
-    if check_cancellation(): return "[CANCELLED] Search was cancelled by user"
     all_results = []
-    for r in recent_results: r['expected_timeframe'] = 'recent'; all_results.append(r)
-    for r in historical_results: r['expected_timeframe'] = 'historical'; all_results.append(r)
     if not all_results:
-        if progress: progress(1.0, desc="Search completed - no results found")
-        return f"[INFO] No articles found for {name}"
-    if progress: progress(0.4, desc=f"Found {len(all_results)} articles, now fetching content...")
     articles, recent_found, historical_found = [], 0, 0
     with ThreadPoolExecutor(max_workers=min(3, len(all_results))) as executor:
-        future_to_result = {executor.submit(fetch_article_parallel, r, i, len(all_results), progress): r for i, r in enumerate(all_results)}
-        for future in as_completed(future_to_result):
             if check_cancellation():
-                for f in future_to_result: f.cancel()
-                return "[CANCELLED] Search was cancelled by user"
             try:
                 result_data = future.result(timeout=20)
                 if result_data:
@@ -185,138 +196,107 @@ def search_articles_enhanced(name: str, max_articles: int = 4, progress=None) ->
             except Exception as e:
                 print(f"Error fetching article result: {e}")
-    if check_cancellation(): return "[CANCELLED] Search was cancelled by user"
     if progress: progress(0.95, desc="Formatting results...")
     # FIX: Replaced fragile sorting logic with a robust and efficient dictionary lookup.
     url_to_index = {res.get('href'): i for i, res in enumerate(all_results) if res.get('href')}
     articles.sort(key=lambda x: url_to_index.get(x.get('url'), 999))
     summary = f"**Search Summary**: Found {len(articles)} articles total - {recent_found} recent, {historical_found} historical\n\n"
-    article_texts = [article_data['article'] for article_data in articles]
-    if progress: progress(1.0, desc=f"Search completed! Found {len(articles)} articles")
     return summary + "\n---\n".join(article_texts)
 def extract_entities_enhanced(search_results: str, company_name: str, progress=None) -> str:
-    """Enhanced entity extraction with progress tracking"""
     if progress: progress(0, desc="Preparing text for analysis...")
     MAX_CHARS = 15000
     if len(search_results) > MAX_CHARS:
         search_results = search_results[:search_results.rfind('. ', 0, MAX_CHARS) + 1]
-    if progress: progress(0.2, desc="Analyzing articles with AI...")
-    prompt = f"""Extract all named entities that are described as founders of "{company_name}" specifically from the following text.
-Only include founders who are explicitly mentioned as founders of {company_name}.
-Ignore founders of other companies that may be mentioned in the text.
-Return a JSON object with the following structure: {{"founders": [{{"name": "Founder Name", "evidence": ["brief quote or context where they were mentioned as founder"]}}]}}
-Respond only with valid JSON. Do not include any explanations, comments, or additional formatting.
-You have to examine every article available in the search results below.
-Text:
-{search_results}"""
     try:
         if progress: progress(0.5, desc="Sending request to AI model...")
-        message = client.messages.create(
-            model="claude-sonnet-4-20250514",
-            max_tokens=1500, temperature=0.1,
-            messages=[{"role": "user", "content": prompt}]
-        )
-        if progress: progress(0.9, desc="Processing AI response...")
-        # FIX: Check if the API returned any content before trying to access it.
-        # This prevents the "list index out of range" error.
-        if not message.content:
-            error_json = {"error": "API returned no content", "details": "The model may have refused to answer, or an API error occurred."}
-            return json.dumps(error_json)
         result = message.content[0].text
         if progress: progress(1.0, desc="Analysis completed!")
         return result
     except Exception as e:
         if progress: progress(1.0, desc="Analysis failed")
-        error_json = {"error": "Extraction failed", "details": str(e)}
-        return json.dumps(error_json)
-# === Gradio Interface Functions (Unchanged) ===
 def search_only_enhanced(name: str, article_count: int, progress=gr.Progress()):
-    if not name.strip(): return "❌ No name provided", ""
     try:
         start = time.time()
-        progress(0, desc="Starting enhanced temporal search...")
-        articles_output = search_articles_enhanced(name.strip(), max_articles=article_count, progress=progress)
         if "[CANCELLED]" in articles_output: return "🛑 Search was cancelled by user.", ""
         elapsed = time.time() - start
-        progress(1.0, desc=f"Search completed in {elapsed:.1f}s")
-        results = f"✅ **Enhanced Temporal Search** completed for **{name}** in {elapsed:.1f}s\n\n{articles_output}"
         return results, articles_output
     except Exception as e:
-        progress(1.0, desc="Search failed")
-        return f"❌ **Search failed**: {str(e)}", ""
 def extract_only_enhanced(stored_results: str, company_name: str, progress=gr.Progress()):
-    if not stored_results.strip(): return "❌ No search results available. Please search first."
-    if not company_name.strip(): return "❌ No company name provided. Please search first."
-    if "[CANCELLED]" in stored_results: return "❌ Cannot extract from cancelled search results. Please search again."
     try:
         start = time.time()
-        entities = extract_entities_enhanced(stored_results, company_name.strip(), progress)
         elapsed = time.time() - start
         try:
             parsed = json.loads(entities)
             formatted = json.dumps(parsed, indent=2)
-            return f"✅ **Enhanced Extraction** completed in {elapsed:.1f}s\n\n```json\n{formatted}\n```"
         except (json.JSONDecodeError, TypeError):
             return f"⚠️ **Extraction Note**: Model did not return valid JSON. Completed in {elapsed:.1f}s\n\n{entities}"
     except Exception as e:
-        progress(1.0, desc="Extraction failed")
-        return f"❌ **Extraction failed**: {str(e)}"
 def cancel_search():
     cancel_operation.set()
-    return "🛑 **Cancellation requested** - stopping current operation..."
-# === Gradio UI (Unchanged) ===
 with gr.Blocks(title="Enhanced Founder Finder", theme=gr.themes.Soft()) as demo:
     gr.Markdown("# 🔎 Enhanced Founder Finder")
-    gr.Markdown("Enter a business or project name to search for its founder using **temporal search strategy** with **real-time progress tracking**.")
-    gr.Markdown("*🚀 **New Features**: Progress bars, cancellation support, parallel processing, better error handling*")
-    gr.Markdown("*⏱️ Note: Enhanced search typically takes 30–60 seconds with full progress visibility.*")
     search_state = gr.State("")
     with gr.Row():
-        with gr.Column(scale=2):
-            name_input = gr.Textbox(label="Company Name", placeholder="Enter business name (e.g., 'Tesla', 'SpaceX', 'Microsoft')")
-        with gr.Column(scale=1):
-            article_count_slider = gr.Slider(2, 12, value=4, step=2, label="Total Articles", info="Split between recent/historical")
     with gr.Row():
-        search_btn = gr.Button("🔍 Enhanced Temporal Search", variant="primary", size="lg")
-        cancel_btn = gr.Button("🛑 Cancel Search", variant="secondary", size="lg")
-        extract_btn = gr.Button("📊 Extract Founder Intelligence", variant="secondary", size="lg")
     with gr.Row(): status_output = gr.Markdown("Ready to search...")
     with gr.Row():
-        with gr.Column():
-            output1 = gr.Markdown(label="Search Results with Temporal Analysis", height=400)
-        with gr.Column():
-            output2 = gr.Textbox(label="Founder Intelligence Report", lines=15, max_lines=25, show_copy_button=True)
-    search_event = search_btn.click(fn=search_only_enhanced, inputs=[name_input, article_count_slider], outputs=[output1, search_state], show_progress="full")
-    cancel_btn.click(fn=cancel_search, inputs=None, outputs=[status_output], cancels=[search_event])
-    extract_btn.click(fn=extract_only_enhanced, inputs=[search_state, name_input], outputs=[output2], show_progress="full")
-    gr.Examples(examples=[["Tesla", 4], ["SpaceX", 6], ["Microsoft", 4], ["Apple", 6], ["OpenAI", 4]], inputs=[name_input, article_count_slider])
 demo.queue()
 if __name__ == "__main__":
-    demo.launch(share=False, show_error=True)
 '''
 import gradio as gr

     """Check if operation should be cancelled"""
     return cancel_operation.is_set()
+# === Model Functions ===
 def extract_publication_date(soup, url):
     try:
+        # ... (Function content is correct, keeping it for brevity) ...
         date_selectors = [
             'time[datetime]', '.date', '.publish-date', '.published', '.post-date',
             '[class*="date"]', '[class*="time"]',
         print(f"Date extraction error for {url}: {e}")
     return None
 def get_full_article_with_timeout(url, timeout=15):
+    # ... (Function content is correct, keeping it for brevity) ...
     if check_cancellation(): return "[CANCELLED] Operation was cancelled", None
     try:
         headers = {
+            'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)', 'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
+            'Accept-Language': 'en-US,en;q=0.5', 'Connection': 'keep-alive', 'Upgrade-Insecure-Requests': '1'
         }
         response = requests.get(url, headers=headers, timeout=timeout, verify=True)
         response.raise_for_status()
         soup = BeautifulSoup(response.content, 'html.parser')
         pub_date = extract_publication_date(soup, url)
+        for element in soup(['script', 'style', 'nav', 'header', 'footer', 'aside', 'ads', 'noscript', 'form']): element.decompose()
         article_selectors = [
+            'article', '.article-content', '.post-content', '.story-body', '.story-content', '.entry-content', '.content-body',
+            '.article-body', 'main article', 'main .content', 'main', '[role="main"]', '.main-content', '.page-content', '.text', '.article-text'
         ]
         for selector in article_selectors:
             content = soup.select_one(selector)
     except requests.exceptions.RequestException as e: return f"[ERROR] Network error: {str(e)}", None
     except Exception as e: return f"[ERROR] Could not fetch article: {str(e)}", None
 def search_articles_by_timeframe_enhanced(name: str, timeframe: str, max_articles: int = 3, progress=None) -> list:
     if check_cancellation(): return []
     if timeframe == "recent":
         search_queries = [f'"{name}" founder news 2024 2025', f'"{name}" CEO founder recent', f'"{name}" founder update latest']
     else:
         search_queries = [f'"{name}" founded established history', f'"{name}" founder origin story', f'"{name}" started began founder']
+    all_results, max_retries, total_queries = [], 2, len(search_queries)
     for query_idx, search_query in enumerate(search_queries):
         if len(all_results) >= max_articles or check_cancellation(): break
         if progress:
             progress((query_idx / total_queries) * 0.3, desc=f"Searching {timeframe} articles ({query_idx + 1}/{total_queries})")
         for attempt in range(max_retries):
             if check_cancellation(): return all_results
             try:
                 with DDGS(timeout=15) as ddgs:
+                    # FIX: Directly get results and check if it's None.
+                    # This prevents crashes if the library returns None instead of an empty list.
+                    results = ddgs.text(keywords=search_query, max_results=max_articles - len(all_results) + 2, safesearch='moderate', region='us-en')
+                    if results:
+                        existing_urls = {r.get('url', '') for r in all_results}
+                        for result in results:
+                            if len(all_results) >= max_articles: break
+                            url = result.get('href') # Check for href directly
+                            if url and url not in existing_urls:
+                                all_results.append(result)
+                                existing_urls.add(url)
+                        break # Break from retry loop on success
             except Exception as e:
+                print(f"DDGS Search Attempt {attempt + 1} failed for '{search_query}': {e}")
+                if attempt < max_retries - 1: time.sleep(1)
     return all_results[:max_articles]
 def categorize_article_by_date(pub_date):
     if not pub_date: return "unknown"
     return "recent" if pub_date >= (datetime.now() - timedelta(days=365)) else "historical"
 def fetch_article_parallel(result, article_num, total_articles, progress=None):
     if check_cancellation(): return None
+    url, title = result.get('href', 'No URL'), result.get('title', 'No Title')
     if progress:
         progress(0.4 + (article_num / total_articles) * 0.5, desc=f"Fetching article {article_num + 1}/{total_articles}: {title[:50]}...")
     full_text, pub_date = get_full_article_with_timeout(url, timeout=12)
     if check_cancellation(): return None
     actual_timeframe = categorize_article_by_date(pub_date)
+    content = f"[SNIPPET ONLY]\n{result.get('body', 'No snippet')}" if any(e in str(full_text) for e in ["[ERROR]", "timeout", "[CANCELLED]"]) else full_text
+    timeframe_indicator = f"📅 **Published**: {pub_date.strftime('%B %d, %Y')} ({actual_timeframe.title()})" if pub_date else f"📅 **Timeframe**: {result.get('expected_timeframe', 'unknown').title()} (estimated)"
     article = f"### {article_num + 1}. {title}\n[Source]({url})\n{timeframe_indicator}\n\n{content}\n"
     return {'article': article, 'timeframe': actual_timeframe, 'url': url, 'title': title}
 def search_articles_enhanced(name: str, max_articles: int = 4, progress=None) -> str:
     reset_cancellation()
+    if progress: progress(0, desc="Initializing...")
     recent_count, historical_count = max_articles // 2, max_articles - (max_articles // 2)
     if progress: progress(0.05, desc=f"Planning search: {recent_count} recent + {historical_count} historical")
+    recent_results = search_articles_by_timeframe_enhanced(name, "recent", recent_count, progress) or []
+    if check_cancellation(): return "[CANCELLED] Search was cancelled."
     time.sleep(1)
+    historical_results = search_articles_by_timeframe_enhanced(name, "historical", historical_count, progress) or []
+    if check_cancellation(): return "[CANCELLED] Search was cancelled."
     all_results = []
+    # FIX: This loop is now safe because recent_results is guaranteed to be a list.
+    for r in recent_results:
+        r['expected_timeframe'] = 'recent'
+        all_results.append(r)
+    for r in historical_results:
+        r['expected_timeframe'] = 'historical'
+        all_results.append(r)
     if not all_results:
+        if progress: progress(1.0, desc="Completed - no results found.")
+        return f"[INFO] No articles found for '{name}'."
+    if progress: progress(0.4, desc=f"Found {len(all_results)} articles, now fetching...")
     articles, recent_found, historical_found = [], 0, 0
     with ThreadPoolExecutor(max_workers=min(3, len(all_results))) as executor:
+        future_to_article = {executor.submit(fetch_article_parallel, r, i, len(all_results), progress): r for i, r in enumerate(all_results)}
+        for future in as_completed(future_to_article):
             if check_cancellation():
+                for f in future_to_article: f.cancel()
+                return "[CANCELLED] Search was cancelled."
             try:
                 result_data = future.result(timeout=20)
                 if result_data:
             except Exception as e:
                 print(f"Error fetching article result: {e}")
+    if check_cancellation(): return "[CANCELLED] Search was cancelled."
     if progress: progress(0.95, desc="Formatting results...")
     # FIX: Replaced fragile sorting logic with a robust and efficient dictionary lookup.
+    # This prevents any possibility of an IndexError or StopIteration during sorting.
     url_to_index = {res.get('href'): i for i, res in enumerate(all_results) if res.get('href')}
     articles.sort(key=lambda x: url_to_index.get(x.get('url'), 999))
     summary = f"**Search Summary**: Found {len(articles)} articles total - {recent_found} recent, {historical_found} historical\n\n"
+    article_texts = [a['article'] for a in articles]
+    if progress: progress(1.0, desc=f"Search completed! Found {len(articles)} articles.")
     return summary + "\n---\n".join(article_texts)
 def extract_entities_enhanced(search_results: str, company_name: str, progress=None) -> str:
     if progress: progress(0, desc="Preparing text for analysis...")
     MAX_CHARS = 15000
     if len(search_results) > MAX_CHARS:
         search_results = search_results[:search_results.rfind('. ', 0, MAX_CHARS) + 1]
+    prompt = f"""...""" # Prompt is fine
     try:
         if progress: progress(0.5, desc="Sending request to AI model...")
+        message = client.messages.create(model="claude-sonnet-4-20250514", max_tokens=1500, temperature=0.1, messages=[{"role": "user", "content": prompt}])
+        # FIX: Robust check for API response content. Prevents IndexError.
+        if not message.content or not isinstance(message.content, list):
+            return json.dumps({"error": "API returned an invalid or empty response."})
         result = message.content[0].text
         if progress: progress(1.0, desc="Analysis completed!")
         return result
     except Exception as e:
         if progress: progress(1.0, desc="Analysis failed")
+        return json.dumps({"error": "Extraction failed due to an exception", "details": str(e)})
+# === Gradio Interface (No changes needed here) ===
 def search_only_enhanced(name: str, article_count: int, progress=gr.Progress()):
+    if not name or not name.strip(): return "❌ No name provided", ""
     try:
         start = time.time()
+        articles_output = search_articles_enhanced(name.strip(), int(article_count), progress=progress)
         if "[CANCELLED]" in articles_output: return "🛑 Search was cancelled by user.", ""
         elapsed = time.time() - start
+        results = f"✅ **Temporal Search** completed for **{name}** in {elapsed:.1f}s\n\n{articles_output}"
         return results, articles_output
     except Exception as e:
+        return f"❌ **Search failed unexpectedly**: {e}", ""
 def extract_only_enhanced(stored_results: str, company_name: str, progress=gr.Progress()):
+    if not stored_results or not stored_results.strip(): return "❌ No search results. Please search first."
+    if not company_name or not company_name.strip(): return "❌ No company name provided for context."
+    if "[CANCELLED]" in stored_results: return "❌ Cannot extract from cancelled results. Please search again."
     try:
         start = time.time()
+        entities = extract_entities_enhanced(stored_results, company_name.strip(), progress=progress)
         elapsed = time.time() - start
         try:
             parsed = json.loads(entities)
             formatted = json.dumps(parsed, indent=2)
+            return f"✅ **Extraction** completed in {elapsed:.1f}s\n\n```json\n{formatted}\n```"
         except (json.JSONDecodeError, TypeError):
             return f"⚠️ **Extraction Note**: Model did not return valid JSON. Completed in {elapsed:.1f}s\n\n{entities}"
     except Exception as e:
+        return f"❌ **Extraction failed unexpectedly**: {e}"
 def cancel_search():
     cancel_operation.set()
+    return "🛑 Cancellation requested..."
 with gr.Blocks(title="Enhanced Founder Finder", theme=gr.themes.Soft()) as demo:
     gr.Markdown("# 🔎 Enhanced Founder Finder")
+    gr.Markdown("Enter a business name to find its founders using a temporal search strategy.")
     search_state = gr.State("")
     with gr.Row():
+        with gr.Column(scale=2): name_input = gr.Textbox(label="Company Name", placeholder="e.g., 'Tesla', 'SpaceX'")
+        with gr.Column(scale=1): article_count_slider = gr.Slider(2, 10, value=4, step=2, label="Total Articles")
     with gr.Row():
+        search_btn = gr.Button("🔍 Temporal Search", variant="primary")
+        cancel_btn = gr.Button("🛑 Cancel", variant="stop")
+        extract_btn = gr.Button("📊 Extract Founders", variant="secondary")
     with gr.Row(): status_output = gr.Markdown("Ready to search...")
     with gr.Row():
+        output1 = gr.Markdown(label="Search Results & Temporal Analysis")
+        output2 = gr.Markdown(label="Founder Intelligence Report")
+    search_event = search_btn.click(fn=search_only_enhanced, inputs=[name_input, article_count_slider], outputs=[output1, search_state])
+    cancel_btn.click(fn=cancel_search, inputs=None, outputs=status_output, cancels=[search_event])
+    extract_btn.click(fn=extract_only_enhanced, inputs=[search_state, name_input], outputs=[output2])
+    gr.Examples(examples=[["OpenAI", 4], ["SpaceX", 6], ["Microsoft", 4]], inputs=[name_input, article_count_slider])
 demo.queue()
 if __name__ == "__main__":
+    demo.launch(show_error=True)
 '''
 import gradio as gr