Spaces:

saritha
/

RAG_with_langchain_gemini

Sleeping

App Files Files Community

saritha committed on May 1, 2024

Commit

140729c

verified ·

1 Parent(s): 88f41cb

Update app.py

Browse files

Files changed (1) hide show

app.py +43 -86

app.py CHANGED Viewed

@@ -1,89 +1,46 @@
 import os
-from langchain_core.prompts import PromptTemplate
-from langchain_community.output_parsers.rail_parser import GuardrailsOutputParser
-from langchain_community.document_loaders import PyPDFLoader
-import google.generativeai as genai
 import gradio as gr
-# Function for initialization
-def initialize(pdf_file, question):
-    try:
-        # Access the uploaded file information from Gradio
-        file_info = pdf_file
-        # Check if a file was uploaded
-        if file_info is not None:
-            # Construct potential file path based on temporary directory and filename
-            file_path = os.path.join("/tmp", file_info.name)  # Adjust temporary directory if needed
-            if os.path.exists(file_path):
-                # Process the PDF
-                pdf_loader = PyPDFLoader(file_path)
-                pages = pdf_loader.load_and_split()
-                processed_context = "\n".join(str(page.page_content) for page in pages[:30])  # Limit to first 30 pages
-                # Configure Google Generative AI (replace with your API key)
-                genai.configure(api_key=os.getenv("GOOGLE_API_KEY"))
-                # Prompt template for formatting context and question
-                prompt_template = """Answer the question as precise as possible using the provided context. If the answer is not contained in the context, say "answer not available in context"
-                Context:
-                {context}
-                Question:
-                {question}
-                Answer:
-                """
-                prompt = PromptTemplate(template=prompt_template, input_variables=["context", "question"])
-                # Load the GeminiPro model
-                model = genai.GenerativeModel('gemini-pro')
-                # Option 1: Using GeminiPro's Text Generation (if applicable)
-                # Check if the model has a 'generate' method (or similar) - adjust based on actual method
-                if hasattr(model, 'generate'):
-                    # Process context and question (already done)
-                    # Generate answer using GeminiPro's generate method
-                    generated_answer = model.generate(prompt=prompt)  # Replace with the appropriate method
-                    # Extract the answer (parse the output from 'generate')
-                    # ... (implementation depends on the model's output format)
-                    return generated_answer
-                # Option 2: Alternative LLM Integration (if GeminiPro methods not suitable)
-                # Replace this section with code using an alternative library/framework
-                # for question answering (e.g., transformers, haystack)
-                # Ensure the code integrates with your chosen LLM and handles context processing,
-                # question answering, and answer extraction.
-                # Example placeholder (replace with your actual implementation):
-                # return "Alternative LLM integration not yet implemented."
-            else:
-                return "Error: The uploaded file could not be found."
-        else:
-            return "Error: No PDF file was uploaded."
-    except Exception as e:
-        return f"An error occurred: {e}"  # Generic error handling
-# Create a Gradio interface
-interface = gr.Interface(
-    fn=initialize,
-    inputs=[
-        gr.File(label="Upload PDF"),  # No need for 'type' argument
-        gr.Textbox(label="Question")
-    ],
-    outputs="text",
-    title="GeminiPro Q&A Bot",
-    description="Ask questions about the uploaded PDF document.",
-)
-# Launch the interface
-interface.launch()

 import os
 import gradio as gr
+from langchain import PromptTemplate
+from langchain.chains.question_answering import load_qa_chain
+from langchain.document_loaders import PyPDFLoader
+from langchain_google_genai import ChatGoogleGenerativeAI
+import google.generativeai as genai
+from dotenv import load_dotenv
+# Load environment variables from .env file
+load_dotenv()
+# Initialization function
+def initialize(file_path, question, max_pages=30):
+    """Answer ``question`` about the PDF at ``file_path`` using Gemini Pro.
+
+    Args:
+        file_path: Filesystem path of the PDF to read. ``None``, an empty
+            string, or a path that does not exist produces the error
+            message below instead of raising.
+        question: The user's question about the document.
+        max_pages: Maximum number of documents returned by
+            ``load_and_split()`` that are handed to the model. Defaults to
+            30, the cap the earlier code computed but never applied.
+
+    Returns:
+        The ``output_text`` produced by the question-answering chain, or an
+        error string when the file cannot be found.
+    """
+    # Validate the path before touching the API: os.path.exists(None) raises
+    # TypeError, and there is no point configuring a model for a missing file.
+    if not file_path or not os.path.exists(file_path):
+        return "Error: Unable to process the document. Please ensure the PDF file is valid."
+
+    genai.configure(api_key=os.getenv("GOOGLE_API_KEY"))
+    # Only the LangChain chat wrapper is used by the chain; the raw
+    # genai.GenerativeModel instance previously created here was immediately
+    # overwritten and has been dropped.
+    model = ChatGoogleGenerativeAI(model="gemini-pro", temperature=0.3)
+    prompt_template = """Answer the question as precise as possible using the provided context. If the answer is
+                          not contained in the context, say "answer not available in context" \n\n
+                          Context: \n {context}?\n
+                          Question: \n {question} \n
+                          Answer:
+                        """
+    prompt = PromptTemplate(template=prompt_template, input_variables=["context", "question"])
+
+    pages = PyPDFLoader(file_path).load_and_split()
+    # The "stuff" chain fills {context} itself from input_documents, so a
+    # separately supplied "context" value is ignored. Apply the size cap to
+    # the documents that are actually sent to the model instead.
+    stuff_chain = load_qa_chain(model, chain_type="stuff", prompt=prompt)
+    stuff_answer = stuff_chain(
+        {"input_documents": pages[:max_pages], "question": question},
+        return_only_outputs=True,
+    )
+    return stuff_answer['output_text']
+# Gradio components: PDF upload, question box, and the answer display
+input_file = gr.File(
+    label="Upload PDF File",
+)
+input_question = gr.Textbox(
+    label="Ask about the document",
+)
+output_text = gr.Textbox(
+    label="Answer - GeminiPro",
+)
+def pdf_qa(file, question):
+    """Gradio callback: answer ``question`` about the uploaded PDF.
+
+    Args:
+        file: The value Gradio passes for the file input. May be ``None``
+            when nothing was uploaded.
+        question: The text entered in the question box.
+
+    Returns:
+        The answer string from ``initialize``, or an error message when no
+        file was uploaded.
+    """
+    # Submitting without an upload passes None; report it instead of
+    # crashing on ``None.name``.
+    if file is None:
+        return "Error: No PDF file was uploaded."
+    # Depending on the Gradio version / File ``type`` setting, the upload
+    # arrives either as an object exposing ``.name`` or as a plain path
+    # string; accept both.
+    file_path = getattr(file, "name", file)
+    return initialize(file_path, question)
+# Wire the components to pdf_qa and start serving the app
+gr.Interface(
+    fn=pdf_qa,
+    inputs=[input_file, input_question],
+    outputs=output_text,
+    title="PDF Question Answering System",
+    description="Upload a PDF file and ask questions about the content.",
+).launch()