# streamlit_app.py
# A robust Streamlit app with proper error handling and fallback options
import streamlit as st
import torch
import logging
from transformers import pipeline
# Updated LangChain imports for modern versions
from langchain_community.llms import HuggingFacePipeline
from langchain.prompts import PromptTemplate
from langchain.chains import LLMChain
from langchain.memory import ConversationBufferMemory
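# Note: on LangChain >= 0.2 these imports still work but emit deprecation
# warnings; the maintained equivalent of HuggingFacePipeline lives in the
# separate langchain-huggingface package.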
# Set up logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
# -----------------------------------------------------------------------------
# CORE MODEL LOGIC (Rebuilt with LangChain and Error Handling)
# -----------------------------------------------------------------------------
class LangChainBot:
    def __init__(self):
        """
        Loads the models and wraps them in LangChain components with fallback options.
        """
        self.chain = None
        self.translator = None
        self.memory = None
        try:
            # Check CUDA availability
            device = 0 if torch.cuda.is_available() else -1
            torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
            st.info(f"Using device: {'CUDA' if device == 0 else 'CPU'}")
            # Try to load the main model with error handling
            self._load_main_model(device, torch_dtype)
            # Try to load the translator with error handling
            self._load_translator(device)
        except Exception as e:
            logger.error(f"Fatal error during initialization: {e}")
            st.error(f"Fatal: Could not initialize the bot. Error: {e}")
    def _load_main_model(self, device, torch_dtype):
        """Load the main generation model with fallback options."""
        models_to_try = [
            "ai4bharat/IndicBARTSS",
            "google/flan-t5-small",  # Fallback option
            "t5-small"  # Another fallback
        ]
        for model_name in models_to_try:
            try:
                st.info(f"Attempting to load model: {model_name}")
                # Try loading with pipeline first
                generator_pipeline = pipeline(
                    "text2text-generation",
                    model=model_name,
                    device=device,
                    torch_dtype=torch_dtype,
                    max_new_tokens=100,  # Reduced from 150
                    repetition_penalty=1.5,  # Increased from 1.2
                    do_sample=True,
                    temperature=0.7,
                    top_p=0.9,
                    no_repeat_ngram_size=3,  # Prevent repetition
                    trust_remote_code=True
                )
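                # Note (assumption worth verifying locally): generation settings
                # passed to pipeline() at construction are stored as defaults and
                # applied to every subsequent call; on some transformers versions
                # they may need to be supplied per-call instead.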
                # Wrap in LangChain LLM
                llm = HuggingFacePipeline(pipeline=generator_pipeline)
                # Create prompt template
                template = """You are a helpful AI assistant. Please provide a clear and concise response to the user's question.
Previous conversation:
{history}
User: {input}
Assistant:"""
                prompt_template = PromptTemplate(
                    input_variables=["history", "input"],
                    template=template
                )
                # Set up memory
                self.memory = ConversationBufferMemory(memory_key="history")
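                # memory_key="history" must match the {history} placeholder in
                # the prompt template; ConversationBufferMemory keeps the full
                # running transcript under that key.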
                # Create the chain
                self.chain = LLMChain(
                    llm=llm,
                    prompt=prompt_template,
                    verbose=True,
                    memory=self.memory
                )
                st.success(f"Successfully loaded model: {model_name}")
                return  # Success, exit the loop
            except Exception as e:
                logger.warning(f"Failed to load {model_name}: {e}")
                st.warning(f"Failed to load {model_name}, trying next option...")
                continue
        raise RuntimeError("All model loading attempts failed")
    def _load_translator(self, device):
        """Load the translator with fallback options."""
        translators_to_try = [
            "Helsinki-NLP/opus-mt-en-hi",  # Tried first: a small, reliable English-to-Hindi model
            "ai4bharat/indictrans2-indic-indic-1B",
        ]
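        # Note: opus-mt-en-hi is a fixed English-to-Hindi pair and ignores the
        # language codes used below, while indictrans2 requires explicit
        # src_lang/tgt_lang codes (and trust_remote_code=True); neither model
        # covers every selectable language pair.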
        for translator_name in translators_to_try:
            try:
                st.info(f"Attempting to load translator: {translator_name}")
                self.translator = pipeline(
                    "translation",
                    model=translator_name,
                    device=device,
                    trust_remote_code=True
                )
                st.success(f"Successfully loaded translator: {translator_name}")
                return  # Success
            except Exception as e:
                logger.warning(f"Failed to load translator {translator_name}: {e}")
                st.warning(f"Failed to load translator {translator_name}, trying next option...")
                continue
        st.warning("No translator loaded - translation features will be limited")
    def _translate(self, text, source_lang, target_lang):
        """Translation logic with improved error handling."""
        if not self.translator or source_lang == target_lang:
            return text
        try:
            # Define language codes for indictrans2
            indictrans_codes = {
                'english': 'eng_Latn',
                'hindi': 'hin_Deva',
                'tamil': 'tam_Taml',
                'telugu': 'tel_Telu'
            }
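            # These are FLORES-200-style language+script codes, the format the
            # IndicTrans2 models expect for src_lang/tgt_lang.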
            # Try the indictrans2 format first
            if source_lang in indictrans_codes and target_lang in indictrans_codes:
                try:
                    result = self.translator(
                        text,
                        src_lang=indictrans_codes[source_lang],
                        tgt_lang=indictrans_codes[target_lang]
                    )
                    if result and len(result) > 0 and 'translation_text' in result[0]:
                        return result[0]['translation_text']
                except Exception as e:
                    logger.warning(f"Indictrans2 translation failed: {e}")
            # Fallback: try the simple pipeline format (fixed-pair models)
            try:
                result = self.translator(text)
                if result and len(result) > 0:
                    if 'translation_text' in result[0]:
                        return result[0]['translation_text']
                    elif 'generated_text' in result[0]:
                        return result[0]['generated_text']
            except Exception as e:
                logger.warning(f"Simple translation failed: {e}")
        except Exception as e:
            logger.warning(f"Translation failed: {e}")
        # Fall back to the original text; don't warn the user on every failure
        return text
    def get_response(self, user_message, input_lang, output_lang):
        """Generate a response with comprehensive error handling."""
        if not self.chain:
            return "Error: The LangChain chain is not initialized. Please check the logs above."
        try:
            # Clean the input message
            user_message = user_message.strip()
            # Work primarily in English to avoid translation issues;
            # _translate() returns the original text if translation fails.
            if input_lang == 'english':
                processed_message = user_message
            else:
                processed_message = self._translate(user_message, input_lang, 'english')
            # Validate the (possibly translated) input
            if len(processed_message.strip()) == 0:
                return "I didn't receive a valid message. Please try again."
            # Generate the response
            response = self.chain.run(input=processed_message).strip()
            # Guard against degenerate, repetitive output
            words = response.split()
            if len(words) > 10:
                word_counts = {}
                for word in words:
                    word_counts[word] = word_counts.get(word, 0) + 1
                # If any word appears more than 5 times, the output is likely repetitive
                max_count = max(word_counts.values()) if word_counts else 0
                if max_count > 5:
                    # Substitute a simple fallback response
                    response = f"I understand you said '{processed_message[:50]}...' Let me provide a helpful response to that."
            # Translate the output if needed; _translate() already falls back
            # to the English response when translation is unavailable.
            if output_lang != 'english' and output_lang != input_lang:
                return self._translate(response, 'english', output_lang)
            return response
        except Exception as e:
            logger.error(f"Error generating response: {e}")
            return "I apologize, but I encountered an error while processing your request. Please try rephrasing your message."
# -----------------------------------------------------------------------------
# STREAMLIT UI WITH BETTER ERROR HANDLING
# -----------------------------------------------------------------------------
st.set_page_config(
    page_title="LangChain Model Interface",
    page_icon="🤖",
    layout="centered"
)
st.title("🤖 LangChain Model Interface")
st.markdown("*Multi-language conversational AI powered by LangChain*")
# Initialize the bot with progress tracking
@st.cache_resource
def load_bot():
    with st.spinner("Loading models... This may take a few minutes on first run."):
        return LangChainBot()
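# st.cache_resource keeps a single LangChainBot instance alive across Streamlit
# reruns, so the models are downloaded and loaded only once per process.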
# Load the bot
bot = load_bot()
# Check if bot loaded successfully
if bot and bot.chain:
    st.success("✅ Bot loaded successfully!")
    st.markdown("---")
    # Language selection with helpful notes
    language_options = ["english", "hindi", "tamil", "telugu"]
    col1, col2 = st.columns(2)
    with col1:
        input_lang = st.selectbox(
            "📤 Input Language",
            options=language_options,
            index=0,
            help="Select the language you'll type in"
        )
    with col2:
        output_lang = st.selectbox(
            "🗣️ Output Language",
            options=language_options,
            index=0,  # Default to English for now
            help="Select the language for the response"
        )
    # Show translation status
    if not bot.translator:
        st.info("ℹ️ Translation is currently limited. For best results, use English input and output.")
    elif input_lang != 'english' or output_lang != 'english':
        st.warning("⚠️ Translation is experimental. If you encounter issues, try using English.")
    # Chat interface
    st.markdown("### 💬 Chat Interface")
    user_input = st.text_area(
        "Your Message:",
        height=100,
        placeholder=f"Type your message in {input_lang}..."
    )
    col1, col2 = st.columns([3, 1])
    with col1:
        if st.button("🚀 Get Response", type="primary"):
            if user_input.strip():
                with st.spinner("🤖 LangChain is processing your request..."):
                    response = bot.get_response(user_input, input_lang, output_lang)
                st.markdown("### 🤖 Model Response:")
                st.info(response)
                # Add to conversation history display
                if 'conversation_history' not in st.session_state:
                    st.session_state.conversation_history = []
                st.session_state.conversation_history.append({
                    'user': user_input,
                    'bot': response,
                    'input_lang': input_lang,
                    'output_lang': output_lang
                })
            else:
                st.warning("⚠️ Please enter a message.")
    with col2:
        if st.button("🧹 Clear Memory"):
            if hasattr(bot, 'memory') and bot.memory:
                bot.memory.clear()
            if 'conversation_history' in st.session_state:
                del st.session_state.conversation_history
            st.success("✅ Conversation memory cleared!")
    # Display conversation history
    if 'conversation_history' in st.session_state and st.session_state.conversation_history:
        st.markdown("### 📝 Conversation History")
        for i, conv in enumerate(reversed(st.session_state.conversation_history[-5:])):  # Show last 5
            with st.expander(f"Exchange {len(st.session_state.conversation_history) - i}"):
                st.markdown(f"**You ({conv['input_lang']})**: {conv['user']}")
                st.markdown(f"**Bot ({conv['output_lang']})**: {conv['bot']}")
else:
    st.error("❌ Application could not start. Please check the error messages above.")
    # Show some troubleshooting tips
    st.markdown("### 🔧 Troubleshooting Tips:")
    st.markdown("""
    1. **Model Loading Issues**: The models might be too large for the available resources
    2. **Memory Issues**: Try restarting the application
    3. **Network Issues**: Ensure a stable internet connection for model downloads
    4. **Compatibility Issues**: Some models might not be compatible with the current environment
    """)
    if st.button("🔄 Retry Loading"):
        st.cache_resource.clear()
        st.rerun()
# Add sidebar with information
with st.sidebar:
    st.markdown("### ℹ️ Information")
    st.markdown("""
    This application uses:
    - **LangChain** for conversation management
    - **Hugging Face Transformers** for AI models
    - **Multi-language support** via translation models

    **Supported Languages:**
    - English
    - Hindi
    - Tamil
    - Telugu
    """)
    if torch.cuda.is_available():
        st.success("🚀 CUDA GPU detected - faster processing!")
    else:
        st.info("💻 Using CPU - processing may be slower")
    st.markdown("### 🔧 System Status")
    st.markdown(f"- PyTorch: {torch.__version__}")
    st.markdown(f"- Device: {'CUDA' if torch.cuda.is_available() else 'CPU'}")
    if bot and bot.chain:
        st.markdown("- Model: ✅ Loaded")
        st.markdown(f"- Translator: {'✅ Loaded' if bot.translator else '❌ Not loaded'}")
    else:
        st.markdown("- Model: ❌ Failed to load")