milwright committed on
Commit
189c33c
·
1 Parent(s): b1d807d

Remove web search functionality and update template

Browse files

- Remove enable_web_search parameters and UI components
- Clean up template generation and requirements
- Simplify model selection and dependencies
- Update export functionality with proper encoding
- Fix API key validation in generated spaces

Files changed (3) hide show
  1. app.py +101 -320
  2. requirements.txt +2 -2
  3. support_docs.py +0 -1
app.py CHANGED
@@ -133,13 +133,15 @@ def enhanced_fetch_url_content(url, enable_search_validation=False):
133
 
134
  # Template for generated space app (based on mvp_simple.py)
135
  SPACE_TEMPLATE = '''import gradio as gr
 
136
  import os
137
  import requests
138
  import json
139
  import re
140
  from bs4 import BeautifulSoup
141
  from datetime import datetime
142
- import tempfile
 
143
 
144
  # Configuration
145
  SPACE_NAME = "{name}"
@@ -151,7 +153,6 @@ GROUNDING_URLS = {grounding_urls}
151
  ACCESS_CODE = os.environ.get("SPACE_ACCESS_CODE", "{access_code}")
152
  ENABLE_DYNAMIC_URLS = {enable_dynamic_urls}
153
  ENABLE_VECTOR_RAG = {enable_vector_rag}
154
- ENABLE_WEB_SEARCH = {enable_web_search}
155
  RAG_DATA = {rag_data_json}
156
 
157
  # Get API key from environment - customizable variable name with validation
@@ -174,7 +175,7 @@ def validate_api_key():
174
  elif not API_KEY.startswith('sk-or-'):
175
  print(f"⚠️ API KEY FORMAT WARNING:")
176
  print(f" Variable name: {api_key_var}")
177
- print(f" Current value: {{{{API_KEY[:10]}}}}..." if len(API_KEY) > 10 else API_KEY)
178
  print(f" Expected format: sk-or-xxxxxxxxxx")
179
  print(f" Note: OpenRouter keys should start with 'sk-or-'")
180
  return True # Still try to use it
@@ -185,7 +186,11 @@ def validate_api_key():
185
  return True
186
 
187
  # Validate on startup
188
- API_KEY_VALID = validate_api_key()
 
 
 
 
189
 
190
  def validate_url_domain(url):
191
  """Basic URL domain validation"""
@@ -396,130 +401,6 @@ def generate_response(message, history):
396
  if dynamic_context_parts:
397
  grounding_context += "\\n".join(dynamic_context_parts)
398
 
399
- # If web search is enabled, use it for most queries (excluding code blocks and URLs)
400
- if ENABLE_WEB_SEARCH:
401
- should_search = True
402
-
403
- # Skip search for messages that are primarily code blocks
404
- import re
405
- if re.search(r'```[\\s\\S]*```', message):
406
- should_search = False
407
-
408
- # Skip search for messages that are primarily URLs
409
- urls_in_message = extract_urls_from_text(message)
410
- if urls_in_message and len(' '.join(urls_in_message)) > len(message) * 0.5:
411
- should_search = False
412
-
413
- # Skip search for very short messages (likely greetings)
414
- if len(message.strip()) < 5:
415
- should_search = False
416
-
417
- if should_search:
418
- # Use the entire message as search query, cleaning it up
419
- search_query = message.strip()
420
- try:
421
- # Perform web search using crawl4ai
422
- import urllib.parse
423
- import asyncio
424
-
425
- async def search_with_crawl4ai(search_query):
426
- try:
427
- from crawl4ai import WebCrawler
428
-
429
- # Create search URL for DuckDuckGo
430
- encoded_query = urllib.parse.quote_plus(search_query)
431
- search_url = f"https://duckduckgo.com/html/?q={{encoded_query}}"
432
-
433
- # Initialize crawler
434
- crawler = WebCrawler(verbose=False)
435
-
436
- try:
437
- # Start the crawler
438
- await crawler.astart()
439
-
440
- # Crawl the search results
441
- result = await crawler.arun(url=search_url)
442
-
443
- if result.success:
444
- # Extract text content from search results
445
- content = result.cleaned_html if result.cleaned_html else result.markdown
446
-
447
- # Clean and truncate the content
448
- if content:
449
- # Remove excessive whitespace and limit length
450
- lines = [line.strip() for line in content.split('\\n') if line.strip()]
451
- cleaned_content = '\\n'.join(lines)
452
-
453
- # Truncate to reasonable length for context
454
- if len(cleaned_content) > 2000:
455
- cleaned_content = cleaned_content[:2000] + "..."
456
-
457
- return cleaned_content
458
- else:
459
- return "No content extracted from search results"
460
- else:
461
- return f"Search failed: {{result.error_message if hasattr(result, 'error_message') else 'Unknown error'}}"
462
-
463
- finally:
464
- # Clean up the crawler
465
- await crawler.aclose()
466
-
467
- except ImportError:
468
- # Fallback to simple DuckDuckGo search without crawl4ai
469
- encoded_query = urllib.parse.quote_plus(search_query)
470
- search_url = f"https://duckduckgo.com/html/?q={{encoded_query}}"
471
-
472
- # Use basic fetch as fallback
473
- response = requests.get(search_url, headers={{'User-Agent': 'Mozilla/5.0'}}, timeout=10)
474
- if response.status_code == 200:
475
- from bs4 import BeautifulSoup
476
- soup = BeautifulSoup(response.content, 'html.parser')
477
-
478
- # Remove script and style elements
479
- for script in soup(["script", "style", "nav", "header", "footer"]):
480
- script.decompose()
481
-
482
- # Get text content
483
- text = soup.get_text()
484
-
485
- # Clean up whitespace
486
- lines = (line.strip() for line in text.splitlines())
487
- chunks = (phrase.strip() for line in lines for phrase in line.split(" "))
488
- text = ' '.join(chunk for chunk in chunks if chunk)
489
-
490
- # Truncate to ~2000 characters
491
- if len(text) > 2000:
492
- text = text[:2000] + "..."
493
-
494
- return text
495
- else:
496
- return f"Failed to fetch search results: {{response.status_code}}"
497
-
498
- # Run the async search
499
- if hasattr(asyncio, 'run'):
500
- search_result = asyncio.run(search_with_crawl4ai(search_query))
501
- else:
502
- # Fallback for older Python versions
503
- loop = asyncio.new_event_loop()
504
- asyncio.set_event_loop(loop)
505
- try:
506
- search_result = loop.run_until_complete(search_with_crawl4ai(search_query))
507
- finally:
508
- loop.close()
509
-
510
- grounding_context += f"\\n\\nWeb search results for '{{search_query}}':\\n{{search_result}}"
511
- except Exception as e:
512
- # Enhanced fallback with better error handling
513
- urls = extract_urls_from_text(search_query)
514
- if urls:
515
- fallback_results = []
516
- for url in urls[:2]: # Limit to 2 URLs for fallback
517
- content = fetch_url_content(url)
518
- fallback_results.append(f"Content from {{url}}:\\n{{content[:500]}}...")
519
- grounding_context += f"\\n\\nWeb search fallback for '{{search_query}}':\\n" + "\\n\\n".join(fallback_results)
520
- else:
521
- grounding_context += f"\\n\\nWeb search requested for '{{search_query}}' but search functionality is unavailable"
522
-
523
  # Build enhanced system prompt with grounding context
524
  enhanced_system_prompt = SYSTEM_PROMPT + grounding_context
525
 
@@ -690,6 +571,39 @@ def protected_generate_response(message, history):
690
  return "Please enter the access code to continue."
691
  return generate_response(message, history)
692
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
693
  def export_conversation(history):
694
  \"\"\"Export conversation to markdown file\"\"\"
695
  if not history:
@@ -698,7 +612,7 @@ def export_conversation(history):
698
  markdown_content = export_conversation_to_markdown(history)
699
 
700
  # Save to temporary file
701
- with tempfile.NamedTemporaryFile(mode='w', suffix='.md', delete=False) as f:
702
  f.write(markdown_content)
703
  temp_file = f.name
704
 
@@ -723,10 +637,7 @@ def get_configuration_status():
723
 
724
  if ENABLE_DYNAMIC_URLS:
725
  status_parts.append("🔄 **Dynamic URLs:** Enabled")
726
-
727
- if ENABLE_WEB_SEARCH:
728
- status_parts.append("🔍 **Web Search:** Enabled")
729
-
730
  if ENABLE_VECTOR_RAG:
731
  status_parts.append("📚 **Document RAG:** Enabled")
732
 
@@ -762,7 +673,7 @@ with gr.Blocks(title=SPACE_NAME) as demo:
762
  # Main chat interface (hidden until access granted)
763
  with gr.Column(visible=not bool(ACCESS_CODE)) as chat_section:
764
  chat_interface = gr.ChatInterface(
765
- fn=protected_generate_response,
766
  title="", # Title already shown above
767
  description="", # Description already shown above
768
  examples=None,
@@ -771,13 +682,12 @@ with gr.Blocks(title=SPACE_NAME) as demo:
771
 
772
  # Export functionality
773
  with gr.Row():
774
- export_btn = gr.Button("Export Conversation", variant="secondary", size="sm")
775
  export_file = gr.File(label="Download Conversation", visible=False)
776
 
777
  # Connect export functionality
778
  export_btn.click(
779
- export_conversation,
780
- inputs=[chat_interface],
781
  outputs=[export_file]
782
  )
783
 
@@ -801,10 +711,12 @@ if __name__ == "__main__":
801
  # Available models - Updated with valid OpenRouter model IDs
802
  MODELS = [
803
  "google/gemini-2.0-flash-001", # Fast, reliable, general tasks
 
804
  "anthropic/claude-3.5-haiku", # Complex reasoning and analysis
805
- "openai/gpt-4o-mini", # Balanced performance and cost
806
- "meta-llama/llama-3.1-8b-instruct", # Open-source, efficient option
807
- "mistralai/mistral-7b-instruct" # Good for technical topics
 
808
  ]
809
 
810
  def fetch_url_content(url):
@@ -943,19 +855,18 @@ Generated on {datetime.now().strftime('%Y-%m-%d %H:%M:%S')} with Chat U/I Helper
943
 
944
  return readme_content
945
 
946
- def create_requirements(enable_vector_rag=False, enable_web_search=False):
947
  """Generate requirements.txt"""
948
- base_requirements = "gradio>=5.35.0\nrequests>=2.32.3\nbeautifulsoup4>=4.12.3"
 
949
 
950
  if enable_vector_rag:
951
- base_requirements += "\nfaiss-cpu==1.7.4\nnumpy==1.24.3"
952
-
953
- if enable_web_search:
954
- base_requirements += "\ncrawl4ai>=0.2.0\naiohttp>=3.8.0"
955
 
956
  return base_requirements
957
 
958
- def generate_zip(name, description, system_prompt, model, api_key_var, temperature, max_tokens, examples_text, access_code="", enable_dynamic_urls=False, url1="", url2="", url3="", url4="", enable_vector_rag=False, rag_data=None, enable_web_search=False):
959
  """Generate deployable zip file"""
960
 
961
  # Process examples
@@ -991,7 +902,6 @@ def generate_zip(name, description, system_prompt, model, api_key_var, temperatu
991
  'access_code': "", # Access code stored in environment variable for security
992
  'enable_dynamic_urls': enable_dynamic_urls,
993
  'enable_vector_rag': enable_vector_rag,
994
- 'enable_web_search': enable_web_search,
995
  'rag_data_json': json.dumps(rag_data) if rag_data else 'None'
996
  }
997
 
@@ -1001,7 +911,7 @@ def generate_zip(name, description, system_prompt, model, api_key_var, temperatu
1001
  readme_config = config.copy()
1002
  readme_config['access_code'] = access_code or ""
1003
  readme_content = create_readme(readme_config)
1004
- requirements_content = create_requirements(enable_vector_rag, enable_web_search)
1005
 
1006
  # Create zip file with clean naming
1007
  filename = f"{name.lower().replace(' ', '_').replace('-', '_')}.zip"
@@ -1157,7 +1067,7 @@ def update_sandbox_preview(config_data):
1157
 
1158
  return preview_text, preview_html
1159
 
1160
- def on_preview_combined(name, description, system_prompt, enable_research_assistant, model, temperature, max_tokens, examples_text, enable_dynamic_urls, enable_vector_rag, enable_web_search):
1161
  """Generate configuration and return preview updates"""
1162
  if not name or not name.strip():
1163
  return (
@@ -1189,45 +1099,24 @@ def on_preview_combined(name, description, system_prompt, enable_research_assist
1189
  'max_tokens': max_tokens,
1190
  'enable_dynamic_urls': enable_dynamic_urls,
1191
  'enable_vector_rag': enable_vector_rag,
1192
- 'enable_web_search': enable_web_search,
1193
  'examples_text': examples_text,
1194
  'preview_ready': True
1195
  }
1196
 
1197
  # Generate preview displays
1198
- preview_text = f"""🎉 **Preview Successfully Rendered!**
 
1199
 
1200
- Your assistant "{name}" is now configured and ready to test in the Sandbox Preview tab.
1201
-
1202
- **Configuration:**
1203
- - **Model:** {model}
1204
- - **Temperature:** {temperature}
1205
- - **Max Tokens:** {max_tokens}
1206
- - **Dynamic URLs:** {'✅ Enabled' if enable_dynamic_urls else '❌ Disabled'}
1207
- - **Vector RAG:** {'✅ Enabled' if enable_vector_rag else '❌ Disabled'}
1208
- - **Web Search:** {'✅ Enabled' if enable_web_search else '❌ Disabled'}
1209
-
1210
- **System Prompt:**
1211
- {final_system_prompt[:200]}{'...' if len(final_system_prompt) > 200 else ''}
1212
-
1213
- ✨ **Next Steps:** Switch to the "Sandbox Preview" tab to test your assistant with real conversations before generating the deployment package."""
1214
-
1215
  config_display = f"""### Current Configuration
1216
 
1217
- **Space Details:**
1218
  - **Name:** {name}
1219
  - **Description:** {description or 'No description provided'}
1220
-
1221
- **Model Settings:**
1222
  - **Model:** {model}
1223
  - **Temperature:** {temperature}
1224
  - **Max Response Tokens:** {max_tokens}
1225
 
1226
- **Features:**
1227
- - **Dynamic URL Fetching:** {'✅ Enabled' if enable_dynamic_urls else '❌ Disabled'}
1228
- - **Document RAG:** {'✅ Enabled' if enable_vector_rag else '❌ Disabled'}
1229
- - **Web Search:** {'✅ Enabled' if enable_web_search else '❌ Disabled'}
1230
-
1231
  **System Prompt:**
1232
  ```
1233
  {final_system_prompt}
@@ -1238,8 +1127,8 @@ Your assistant "{name}" is now configured and ready to test in the Sandbox Previ
1238
  """
1239
 
1240
  # Show success notification
1241
- gr.Info(f"✅ Preview generated successfully for '{name}'! Switch to the Sandbox Preview tab to test your assistant.")
1242
-
1243
  return (
1244
  config_data,
1245
  gr.update(value=preview_text, visible=True),
@@ -1268,7 +1157,7 @@ def update_preview_display(config_data):
1268
 
1269
  Your assistant "{config_data['name']}" is configured and ready to test.
1270
 
1271
- **Configuration:**
1272
  - **Model:** {config_data['model']}
1273
  - **Temperature:** {config_data['temperature']}
1274
  - **Max Tokens:** {config_data['max_tokens']}
@@ -1276,7 +1165,7 @@ Your assistant "{config_data['name']}" is configured and ready to test.
1276
  - **Vector RAG:** {'✅ Enabled' if config_data['enable_vector_rag'] else '❌ Disabled'}
1277
 
1278
  **System Prompt:**
1279
- {config_data['system_prompt'][:200]}{'...' if len(config_data['system_prompt']) > 200 else ''}
1280
 
1281
  Use the chat interface below to test your assistant before generating the deployment package."""
1282
 
@@ -1363,33 +1252,8 @@ Once you set your API key, you'll be able to test real conversations in this pre
1363
  if dynamic_context_parts:
1364
  dynamic_context = "\n".join(dynamic_context_parts)
1365
 
1366
- # Check for web search request if enabled
1367
- web_search_result = ""
1368
- if config_data.get('enable_web_search'):
1369
- # If web search is enabled, use it for most queries (excluding code blocks and URLs)
1370
- should_search = True
1371
-
1372
- # Skip search for messages that are primarily code blocks
1373
- if re.search(r'```[\s\S]*```', message):
1374
- should_search = False
1375
-
1376
- # Skip search for messages that are primarily URLs
1377
- urls_in_message = extract_urls_from_text(message)
1378
- if urls_in_message and len(' '.join(urls_in_message)) > len(message) * 0.5:
1379
- should_search = False
1380
-
1381
- # Skip search for very short messages (likely greetings)
1382
- if len(message.strip()) < 5:
1383
- should_search = False
1384
-
1385
- if should_search:
1386
- # Use the entire message as search query, cleaning it up
1387
- search_query = message.strip()
1388
- search_result = perform_web_search(search_query, "Web search requested")
1389
- web_search_result = f"\n\n{search_result}\n\n"
1390
-
1391
  # Build enhanced system prompt with all contexts
1392
- enhanced_system_prompt = config_data.get('system_prompt', '') + grounding_context + rag_context + dynamic_context + web_search_result
1393
 
1394
  # Build messages array for the API
1395
  messages = [{"role": "system", "content": enhanced_system_prompt}]
@@ -1483,7 +1347,7 @@ def export_preview_conversation(history):
1483
 
1484
  return gr.update(value=temp_file, visible=True)
1485
 
1486
- def on_generate(name, description, system_prompt, enable_research_assistant, model, api_key_var, temperature, max_tokens, examples_text, access_code, enable_dynamic_urls, url1, url2, url3, url4, enable_vector_rag, rag_tool_state, enable_web_search):
1487
  if not name or not name.strip():
1488
  return gr.update(value="Error: Please provide a Space Title", visible=True), gr.update(visible=False), {}
1489
 
@@ -1500,7 +1364,7 @@ def on_generate(name, description, system_prompt, enable_research_assistant, mod
1500
 
1501
  final_system_prompt = system_prompt.strip()
1502
 
1503
- filename = generate_zip(name, description, final_system_prompt, model, api_key_var, temperature, max_tokens, examples_text, access_code, enable_dynamic_urls, url1, url2, url3, url4, enable_vector_rag, rag_data, enable_web_search)
1504
 
1505
  success_msg = f"""**Deployment package ready!**
1506
 
@@ -1529,7 +1393,6 @@ def on_generate(name, description, system_prompt, enable_research_assistant, mod
1529
  'max_tokens': max_tokens,
1530
  'enable_dynamic_urls': enable_dynamic_urls,
1531
  'enable_vector_rag': enable_vector_rag,
1532
- 'enable_web_search': enable_web_search,
1533
  'filename': filename
1534
  }
1535
 
@@ -1715,109 +1578,44 @@ def remove_chat_urls(count):
1715
 
1716
  # Code execution toggle removed - functionality no longer supported
1717
 
1718
- def toggle_web_search(enable_search):
1719
- """Toggle visibility of web search space field"""
1720
- return gr.update(visible=enable_search)
1721
-
1722
  def perform_web_search(query, description="Web search"):
1723
- """Perform web search using crawl4ai with DuckDuckGo"""
1724
  try:
1725
- # Try to use crawl4ai for web search
1726
- try:
1727
- from crawl4ai import WebCrawler
1728
- import asyncio
1729
-
1730
- async def search_with_crawl4ai(search_query):
1731
- # Create search URL for DuckDuckGo
1732
- import urllib.parse
1733
- encoded_query = urllib.parse.quote_plus(search_query)
1734
- search_url = f"https://duckduckgo.com/html/?q={encoded_query}"
1735
-
1736
- # Initialize crawler
1737
- crawler = WebCrawler(verbose=False)
1738
-
1739
- try:
1740
- # Start the crawler
1741
- await crawler.astart()
1742
-
1743
- # Crawl the search results
1744
- result = await crawler.arun(url=search_url)
1745
-
1746
- if result.success:
1747
- # Extract text content from search results
1748
- content = result.cleaned_html if result.cleaned_html else result.markdown
1749
-
1750
- # Clean and truncate the content
1751
- if content:
1752
- # Remove excessive whitespace and limit length
1753
- lines = [line.strip() for line in content.split('\n') if line.strip()]
1754
- cleaned_content = '\n'.join(lines)
1755
-
1756
- # Truncate to reasonable length for context
1757
- if len(cleaned_content) > 3000:
1758
- cleaned_content = cleaned_content[:3000] + "..."
1759
-
1760
- return cleaned_content
1761
- else:
1762
- return "No content extracted from search results"
1763
- else:
1764
- return f"Search failed: {result.error_message if hasattr(result, 'error_message') else 'Unknown error'}"
1765
-
1766
- finally:
1767
- # Clean up the crawler
1768
- await crawler.aclose()
1769
-
1770
- # Run the async search
1771
- if hasattr(asyncio, 'run'):
1772
- search_result = asyncio.run(search_with_crawl4ai(query))
1773
- else:
1774
- # Fallback for older Python versions
1775
- loop = asyncio.new_event_loop()
1776
- asyncio.set_event_loop(loop)
1777
- try:
1778
- search_result = loop.run_until_complete(search_with_crawl4ai(query))
1779
- finally:
1780
- loop.close()
1781
-
1782
- return f"**{description}**\n\nQuery: {query}\n\n**Search Results:**\n{search_result}"
1783
-
1784
- except ImportError:
1785
- # Fallback to simple DuckDuckGo search without crawl4ai
1786
- import urllib.parse
1787
- encoded_query = urllib.parse.quote_plus(query)
1788
- search_url = f"https://duckduckgo.com/html/?q={encoded_query}"
1789
-
1790
- # Use enhanced_fetch_url_content as fallback
1791
- content = enhanced_fetch_url_content(search_url)
1792
- return f"**{description} (Simplified)**\n\nQuery: {query}\n\n**Search Results:**\n{content}"
1793
-
1794
- except Exception as e:
1795
- # Final fallback to URL extraction if search fails
1796
  urls = extract_urls_from_text(query)
1797
  if urls:
1798
  results = []
1799
- for url in urls[:2]: # Limit to 2 URLs for fallback
1800
- content = enhanced_fetch_url_content(url)
1801
- results.append(f"Content from {url}:\n{content[:500]}...")
1802
- return f"**Web Search Fallback:** {description}\n\n" + "\n\n".join(results)
1803
- return f"**Web Search Error:** {str(e)}\n\nQuery: {query}"
 
 
 
 
 
 
 
 
 
 
 
1804
 
1805
  # Code execution functionality removed - no longer supported
1806
 
1807
  def toggle_research_assistant(enable_research):
1808
- """Toggle research assistant system prompt and web search"""
1809
  if enable_research:
1810
- combined_prompt = "You are an advanced research assistant specializing in academic literature search and analysis. Your expertise includes finding peer-reviewed sources, critically evaluating research methodology, synthesizing insights across multiple papers, and providing properly formatted citations. When responding, ground all claims in specific sources from provided URL contexts, distinguish between direct evidence and analytical interpretation, and highlight any limitations or conflicting findings. Use clear, accessible language that makes complex research understandable, and suggest related areas of inquiry when relevant. Your goal is to be a knowledgeable research partner who helps users navigate academic information with precision and clarity."
1811
  return (
1812
  gr.update(value=combined_prompt), # Update main system prompt
1813
- gr.update(value=True), # Enable dynamic URL fetching for research template
1814
- gr.update(value=True) # Enable web search for research template
1815
  )
1816
  else:
1817
  return (
1818
  gr.update(value=""), # Clear main system prompt when disabling
1819
- gr.update(value=False), # Disable dynamic URL setting
1820
- gr.update(value=False) # Disable web search
1821
  )
1822
 
1823
 
@@ -1998,20 +1796,7 @@ with gr.Blocks(
1998
  info="Enable to use pre-configured research assistant settings"
1999
  )
2000
 
2001
- # Web search under research template
2002
- enable_web_search = gr.Checkbox(
2003
- label="Enable Web Search",
2004
- value=False,
2005
- info="Allow the assistant to search the web using crawl4ai"
2006
- )
2007
-
2008
- web_search_space = gr.Textbox(
2009
- label="Web Search Technology",
2010
- value="crawl4ai",
2011
- info="Uses crawl4ai library for web crawling",
2012
- visible=False,
2013
- interactive=False
2014
- )
2015
 
2016
  # Document RAG section
2017
  enable_vector_rag = gr.Checkbox(
@@ -2118,15 +1903,11 @@ with gr.Blocks(
2118
  enable_research_assistant.change(
2119
  toggle_research_assistant,
2120
  inputs=[enable_research_assistant],
2121
- outputs=[system_prompt, enable_dynamic_urls, enable_web_search]
2122
  )
2123
 
2124
- # Connect the web search checkbox
2125
- enable_web_search.change(
2126
- toggle_web_search,
2127
- inputs=[enable_web_search],
2128
- outputs=[web_search_space]
2129
- )
2130
 
2131
 
2132
 
@@ -2160,7 +1941,7 @@ with gr.Blocks(
2160
  # Connect the generate button
2161
  generate_btn.click(
2162
  on_generate,
2163
- inputs=[name, description, system_prompt, enable_research_assistant, model, api_key_var, temperature, max_tokens, examples_text, access_code, enable_dynamic_urls, url1, url2, url3, url4, enable_vector_rag, rag_tool_state, enable_web_search],
2164
  outputs=[status, download_file, sandbox_state]
2165
  )
2166
 
@@ -2226,7 +2007,7 @@ with gr.Blocks(
2226
  with gr.Row():
2227
  preview_send = gr.Button("Send", variant="primary")
2228
  preview_clear = gr.Button("Clear")
2229
- export_btn = gr.Button("Export Conversation", variant="secondary")
2230
 
2231
  # Export functionality
2232
  export_file = gr.File(label="Download Conversation", visible=False)
@@ -2254,7 +2035,7 @@ with gr.Blocks(
2254
  outputs=[preview_msg, preview_chatbot]
2255
  )
2256
 
2257
- export_btn.click(
2258
  export_preview_conversation,
2259
  inputs=[preview_chatbot],
2260
  outputs=[export_file]
@@ -2279,7 +2060,7 @@ with gr.Blocks(
2279
  # Connect cross-tab functionality after all components are defined
2280
  preview_btn.click(
2281
  on_preview_combined,
2282
- inputs=[name, description, system_prompt, enable_research_assistant, model, temperature, max_tokens, examples_text, enable_dynamic_urls, enable_vector_rag, enable_web_search],
2283
  outputs=[preview_config_state, preview_status_comp, preview_chat_section_comp, config_display_comp]
2284
  )
2285
 
 
133
 
134
  # Template for generated space app (based on mvp_simple.py)
135
  SPACE_TEMPLATE = '''import gradio as gr
136
+ import tempfile
137
  import os
138
  import requests
139
  import json
140
  import re
141
  from bs4 import BeautifulSoup
142
  from datetime import datetime
143
+ import urllib.parse
144
+
145
 
146
  # Configuration
147
  SPACE_NAME = "{name}"
 
153
  ACCESS_CODE = os.environ.get("SPACE_ACCESS_CODE", "{access_code}")
154
  ENABLE_DYNAMIC_URLS = {enable_dynamic_urls}
155
  ENABLE_VECTOR_RAG = {enable_vector_rag}
 
156
  RAG_DATA = {rag_data_json}
157
 
158
  # Get API key from environment - customizable variable name with validation
 
175
  elif not API_KEY.startswith('sk-or-'):
176
  print(f"⚠️ API KEY FORMAT WARNING:")
177
  print(f" Variable name: {api_key_var}")
178
+ print(f" Current value: {{API_KEY[:10]}}..." if len(API_KEY) > 10 else API_KEY)
179
  print(f" Expected format: sk-or-xxxxxxxxxx")
180
  print(f" Note: OpenRouter keys should start with 'sk-or-'")
181
  return True # Still try to use it
 
186
  return True
187
 
188
  # Validate on startup
189
+ try:
190
+ API_KEY_VALID = validate_api_key()
191
+ except NameError:
192
+ # During template generation, API_KEY might not be defined yet
193
+ API_KEY_VALID = False
194
 
195
  def validate_url_domain(url):
196
  """Basic URL domain validation"""
 
401
  if dynamic_context_parts:
402
  grounding_context += "\\n".join(dynamic_context_parts)
403
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
404
  # Build enhanced system prompt with grounding context
405
  enhanced_system_prompt = SYSTEM_PROMPT + grounding_context
406
 
 
571
  return "Please enter the access code to continue."
572
  return generate_response(message, history)
573
 
574
+ # Global variable to store chat history for export
575
+ chat_history_store = []
576
+
577
+ def store_and_generate_response(message, history):
578
+ \"\"\"Wrapper function that stores history and generates response\"\"\"
579
+ global chat_history_store
580
+
581
+ # Store the updated history
582
+ chat_history_store = history.copy() if history else []
583
+
584
+ # Generate response using the protected function
585
+ response = protected_generate_response(message, history)
586
+
587
+ # Update stored history with the new exchange
588
+ chat_history_store.append({{"role": "user", "content": message}})
589
+ chat_history_store.append({{"role": "assistant", "content": response}})
590
+
591
+ return response
592
+
593
+ def export_current_conversation():
594
+ \"\"\"Export the current conversation\"\"\"
595
+ if not chat_history_store:
596
+ return gr.update(visible=False)
597
+
598
+ markdown_content = export_conversation_to_markdown(chat_history_store)
599
+
600
+ # Save to temporary file
601
+ with tempfile.NamedTemporaryFile(mode='w', suffix='.md', delete=False, encoding='utf-8') as f:
602
+ f.write(markdown_content)
603
+ temp_file = f.name
604
+
605
+ return gr.update(value=temp_file, visible=True)
606
+
607
  def export_conversation(history):
608
  \"\"\"Export conversation to markdown file\"\"\"
609
  if not history:
 
612
  markdown_content = export_conversation_to_markdown(history)
613
 
614
  # Save to temporary file
615
+ with tempfile.NamedTemporaryFile(mode='w', suffix='.md', delete=False, encoding='utf-8') as f:
616
  f.write(markdown_content)
617
  temp_file = f.name
618
 
 
637
 
638
  if ENABLE_DYNAMIC_URLS:
639
  status_parts.append("🔄 **Dynamic URLs:** Enabled")
640
+
 
 
 
641
  if ENABLE_VECTOR_RAG:
642
  status_parts.append("📚 **Document RAG:** Enabled")
643
 
 
673
  # Main chat interface (hidden until access granted)
674
  with gr.Column(visible=not bool(ACCESS_CODE)) as chat_section:
675
  chat_interface = gr.ChatInterface(
676
+ fn=store_and_generate_response, # Use wrapper function to store history
677
  title="", # Title already shown above
678
  description="", # Description already shown above
679
  examples=None,
 
682
 
683
  # Export functionality
684
  with gr.Row():
685
+ export_btn = gr.Button("📥 Export Conversation", variant="secondary", size="sm")
686
  export_file = gr.File(label="Download Conversation", visible=False)
687
 
688
  # Connect export functionality
689
  export_btn.click(
690
+ export_current_conversation,
 
691
  outputs=[export_file]
692
  )
693
 
 
711
  # Available models - Updated with valid OpenRouter model IDs
712
  MODELS = [
713
  "google/gemini-2.0-flash-001", # Fast, reliable, general tasks
714
+ "google/gemma-3-27b-it", # High-performance open model
715
  "anthropic/claude-3.5-haiku", # Complex reasoning and analysis
716
+ "openai/gpt-4o-mini-search-preview", # Balanced performance and cost with search
717
+ "openai/gpt-4.1-nano", # Lightweight OpenAI model
718
+ "nvidia/llama-3.1-nemotron-70b-instruct", # Large open-source model
719
+ "mistralai/devstral-small" # Coding-focused model
720
  ]
721
 
722
  def fetch_url_content(url):
 
855
 
856
  return readme_content
857
 
858
+ def create_requirements(enable_vector_rag=False):
859
  """Generate requirements.txt"""
860
+ base_requirements = "gradio>=4.44.1\nrequests>=2.32.3\nbeautifulsoup4>=4.12.3\npython-dotenv>=1.0.0"
861
+
862
 
863
  if enable_vector_rag:
864
+ base_requirements += "\n\n# Vector RAG dependencies"
865
+ base_requirements += "\nfaiss-cpu>=1.11.0\nnumpy>=1.25.0,<3.0\nsentence-transformers>=2.2.2\nPyMuPDF>=1.23.0\npython-docx>=0.8.11"
 
 
866
 
867
  return base_requirements
868
 
869
+ def generate_zip(name, description, system_prompt, model, api_key_var, temperature, max_tokens, examples_text, access_code="", enable_dynamic_urls=False, url1="", url2="", url3="", url4="", enable_vector_rag=False, rag_data=None):
870
  """Generate deployable zip file"""
871
 
872
  # Process examples
 
902
  'access_code': "", # Access code stored in environment variable for security
903
  'enable_dynamic_urls': enable_dynamic_urls,
904
  'enable_vector_rag': enable_vector_rag,
 
905
  'rag_data_json': json.dumps(rag_data) if rag_data else 'None'
906
  }
907
 
 
911
  readme_config = config.copy()
912
  readme_config['access_code'] = access_code or ""
913
  readme_content = create_readme(readme_config)
914
+ requirements_content = create_requirements(enable_vector_rag)
915
 
916
  # Create zip file with clean naming
917
  filename = f"{name.lower().replace(' ', '_').replace('-', '_')}.zip"
 
1067
 
1068
  return preview_text, preview_html
1069
 
1070
+ def on_preview_combined(name, description, system_prompt, enable_research_assistant, model, temperature, max_tokens, examples_text, enable_dynamic_urls, enable_vector_rag):
1071
  """Generate configuration and return preview updates"""
1072
  if not name or not name.strip():
1073
  return (
 
1099
  'max_tokens': max_tokens,
1100
  'enable_dynamic_urls': enable_dynamic_urls,
1101
  'enable_vector_rag': enable_vector_rag,
 
1102
  'examples_text': examples_text,
1103
  'preview_ready': True
1104
  }
1105
 
1106
  # Generate preview displays
1107
+ preview_text = f"""**System Prompt:**
1108
+ > *{final_system_prompt[:600]}{'...' if len(final_system_prompt) > 600 else '...'}*
1109
 
1110
+ Tip: Try different configurations of your space before generating the deployment package."""
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1111
  config_display = f"""### Current Configuration
1112
 
1113
+ > **Configuration**:
1114
  - **Name:** {name}
1115
  - **Description:** {description or 'No description provided'}
 
 
1116
  - **Model:** {model}
1117
  - **Temperature:** {temperature}
1118
  - **Max Response Tokens:** {max_tokens}
1119
 
 
 
 
 
 
1120
  **System Prompt:**
1121
  ```
1122
  {final_system_prompt}
 
1127
  """
1128
 
1129
  # Show success notification
1130
+ gr.Info(f"✅ Preview generated successfully for '{name}'! Switch to Preview tab.")
1131
+
1132
  return (
1133
  config_data,
1134
  gr.update(value=preview_text, visible=True),
 
1157
 
1158
  Your assistant "{config_data['name']}" is configured and ready to test.
1159
 
1160
+ **Configuration**
1161
  - **Model:** {config_data['model']}
1162
  - **Temperature:** {config_data['temperature']}
1163
  - **Max Tokens:** {config_data['max_tokens']}
 
1165
  - **Vector RAG:** {'✅ Enabled' if config_data['enable_vector_rag'] else '❌ Disabled'}
1166
 
1167
  **System Prompt:**
1168
+ {config_data['system_prompt'][:600]}{'...' if len(config_data['system_prompt']) > 600 else ''}
1169
 
1170
  Use the chat interface below to test your assistant before generating the deployment package."""
1171
 
 
1252
  if dynamic_context_parts:
1253
  dynamic_context = "\n".join(dynamic_context_parts)
1254
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1255
  # Build enhanced system prompt with all contexts
1256
+ enhanced_system_prompt = config_data.get('system_prompt', '') + grounding_context + rag_context + dynamic_context
1257
 
1258
  # Build messages array for the API
1259
  messages = [{"role": "system", "content": enhanced_system_prompt}]
 
1347
 
1348
  return gr.update(value=temp_file, visible=True)
1349
 
1350
+ def on_generate(name, description, system_prompt, enable_research_assistant, model, api_key_var, temperature, max_tokens, examples_text, access_code, enable_dynamic_urls, url1, url2, url3, url4, enable_vector_rag, rag_tool_state):
1351
  if not name or not name.strip():
1352
  return gr.update(value="Error: Please provide a Space Title", visible=True), gr.update(visible=False), {}
1353
 
 
1364
 
1365
  final_system_prompt = system_prompt.strip()
1366
 
1367
+ filename = generate_zip(name, description, final_system_prompt, model, api_key_var, temperature, max_tokens, examples_text, access_code, enable_dynamic_urls, url1, url2, url3, url4, enable_vector_rag, rag_data)
1368
 
1369
  success_msg = f"""**Deployment package ready!**
1370
 
 
1393
  'max_tokens': max_tokens,
1394
  'enable_dynamic_urls': enable_dynamic_urls,
1395
  'enable_vector_rag': enable_vector_rag,
 
1396
  'filename': filename
1397
  }
1398
 
 
1578
 
1579
  # Code execution toggle removed - functionality no longer supported
1580
 
 
 
 
 
1581
def perform_web_search(query, description="Web search"):
    """Fetch content for any URLs embedded in the query and format a search-style summary.

    This is the simplified replacement for the removed web-search feature: it
    does not query a search engine. URLs found in ``query`` are fetched
    directly; plain-text queries fall through to a note telling the model to
    answer from its own knowledge.

    Args:
        query: Free-text query; any URLs it contains are fetched (first 3 only).
        description: Heading used to label the returned markdown block.

    Returns:
        A markdown-formatted string. Never raises: every failure path is
        reported inside the returned string (best-effort contract, since the
        result is injected into the chat context).
    """
    try:
        # Check if query contains URLs for content fetching
        urls = extract_urls_from_text(query)
        if urls:
            results = []
            for url in urls[:3]:  # Limit to 3 URLs for performance
                try:
                    content = enhanced_fetch_url_content(url)
                    # Skip near-empty fetches (error pages, bare redirects, etc.).
                    if content and len(content.strip()) > 50:
                        # Only append an ellipsis when content was actually
                        # truncated; the previous code added "..." unconditionally,
                        # misrepresenting short pages as truncated.
                        snippet = content[:1000] + ("..." if len(content) > 1000 else "")
                        results.append(f"**Content from {url}:**\n{snippet}")
                except Exception as e:
                    results.append(f"**Error fetching {url}:** {str(e)}")

            if results:
                return f"**{description}**\n\nQuery: {query}\n\n" + "\n\n".join(results)

        # For non-URL queries, return context for model to handle
        return f"**{description}**\n\nQuery: {query}\n\n**Note:** This query will be processed using the model's knowledge. For real-time information, consider providing specific URLs or mentioning that recent data verification may be needed."

    except Exception as e:
        # Broad catch is deliberate: this helper must never break the chat flow.
        return f"**{description} - Processing Error:** {str(e)}\n\nQuery: {query}\n\n**Note:** Falling back to model's knowledge for this query."
1604
 
1605
  # Code execution functionality removed - no longer supported
1606
 
1607
def toggle_research_assistant(enable_research):
    """Toggle research assistant system prompt and dynamic URL fetching.

    Args:
        enable_research: True to install the research-assistant template,
            False to clear it.

    Returns:
        A pair of ``gr.update`` objects: the first targets the main system
        prompt textbox, the second the dynamic-URL-fetching checkbox.
    """
    # Canned system prompt installed by the research-assistant template.
    research_prompt = "You are a research aid specializing in academic literature search and analysis. Your expertise spans discovering peer-reviewed sources, assessing research methodologies, synthesizing findings across studies, and delivering properly formatted citations. When responding, anchor claims in specific sources from provided URL contexts, differentiate between direct evidence and interpretive analysis, and note any limitations or contradictory results. Employ clear, accessible language that demystifies complex research, and propose connected research directions when appropriate. Your purpose is to serve as an informed research tool supporting users through initial concept development, exploratory investigation, information collection, and source compilation."

    if not enable_research:
        # Disabling: clear the main system prompt and switch URL fetching off.
        return (
            gr.update(value=""),
            gr.update(value=False),
        )

    # Enabling: install the template prompt and turn on dynamic URL fetching,
    # which the research workflow relies on for source grounding.
    return (
        gr.update(value=research_prompt),
        gr.update(value=True),
    )
1620
 
1621
 
 
1796
  info="Enable to use pre-configured research assistant settings"
1797
  )
1798
 
1799
+
 
 
 
 
 
 
 
 
 
 
 
 
 
1800
 
1801
  # Document RAG section
1802
  enable_vector_rag = gr.Checkbox(
 
1903
  enable_research_assistant.change(
1904
  toggle_research_assistant,
1905
  inputs=[enable_research_assistant],
1906
+ outputs=[system_prompt, enable_dynamic_urls]
1907
  )
1908
 
1909
+ # Web search checkbox is now just for enabling/disabling the feature
1910
+ # No additional UI elements needed since we rely on model capabilities
 
 
 
 
1911
 
1912
 
1913
 
 
1941
  # Connect the generate button
1942
  generate_btn.click(
1943
  on_generate,
1944
+ inputs=[name, description, system_prompt, enable_research_assistant, model, api_key_var, temperature, max_tokens, examples_text, access_code, enable_dynamic_urls, url1, url2, url3, url4, enable_vector_rag, rag_tool_state],
1945
  outputs=[status, download_file, sandbox_state]
1946
  )
1947
 
 
2007
  with gr.Row():
2008
  preview_send = gr.Button("Send", variant="primary")
2009
  preview_clear = gr.Button("Clear")
2010
+ preview_export_btn = gr.Button("Export Conversation", variant="secondary")
2011
 
2012
  # Export functionality
2013
  export_file = gr.File(label="Download Conversation", visible=False)
 
2035
  outputs=[preview_msg, preview_chatbot]
2036
  )
2037
 
2038
+ preview_export_btn.click(
2039
  export_preview_conversation,
2040
  inputs=[preview_chatbot],
2041
  outputs=[export_file]
 
2060
  # Connect cross-tab functionality after all components are defined
2061
  preview_btn.click(
2062
  on_preview_combined,
2063
+ inputs=[name, description, system_prompt, enable_research_assistant, model, temperature, max_tokens, examples_text, enable_dynamic_urls, enable_vector_rag],
2064
  outputs=[preview_config_state, preview_status_comp, preview_chat_section_comp, config_display_comp]
2065
  )
2066
 
requirements.txt CHANGED
@@ -9,7 +9,7 @@ playwright==1.53.0
9
 
10
  # Vector RAG dependencies (optional)
11
  sentence-transformers>=2.2.2
12
- faiss-cpu==1.7.4
13
  PyMuPDF>=1.23.0
14
  python-docx>=0.8.11
15
- numpy==1.26.4
 
9
 
10
  # Vector RAG dependencies (optional)
11
  sentence-transformers>=2.2.2
12
+ faiss-cpu>=1.11.0
13
  PyMuPDF>=1.23.0
14
  python-docx>=0.8.11
15
+ numpy>=1.25.0,<3.0
support_docs.py CHANGED
@@ -271,7 +271,6 @@ def create_support_docs():
271
  **Token Usage Notes:**
272
  - Tokens include both input (your prompt + context) and output
273
  - Longer contexts (documents, URLs) use more input tokens
274
- - Monitor usage through OpenRouter dashboard
275
  - Consider costs when setting high token limits
276
  """)
277
 
 
271
  **Token Usage Notes:**
272
  - Tokens include both input (your prompt + context) and output
273
  - Longer contexts (documents, URLs) use more input tokens
 
274
  - Consider costs when setting high token limits
275
  """)
276