Spaces:

masadonline
/

RAG-PDF

Sleeping

App Files Files Community

masadonline committed on May 18

Commit

0b8ee3b

verified ·

1 Parent(s): 53c3520

Create app.py

Browse files

Files changed (1) hide show

app.py +98 -0

app.py ADDED Viewed

	@@ -0,0 +1,98 @@

+import streamlit as st
+import PyPDF2
+import os
+from dotenv import load_dotenv
+from gql import gql, Client
+from gql.transport.requests import RequestsHTTPTransport
+import pandas as pd
# Merge settings from a .env file into the process environment, then read
# the GROQ API key from it; groq_api_key is None when the variable is unset.
load_dotenv()
groq_api_key = os.getenv("GROQ_API_KEY")
# Function to extract order data from PDF
def extract_order_data(pdf_file):
    """Extract order rows from a PDF holding a comma-separated order table.

    Each page's extracted text is split into lines. The first line on a page
    that contains "Order ID" is treated as the header row and split on commas
    to obtain the column names; the lines after it are data rows. Headers are
    remembered across pages, so a table that continues onto a page without a
    repeated header row is still parsed with the most recent headers.

    Args:
        pdf_file: Whatever ``PyPDF2.PdfReader`` accepts; ``main`` passes the
            object returned by Streamlit's file uploader.

    Returns:
        A list of dicts, one per data row, mapping header name to the
        stripped cell text. Lines whose comma-separated field count differs
        from the header count are ignored. The list is empty when no header
        row is found anywhere in the document.
    """
    order_data = []
    headers = None  # column names from the most recent header row seen
    reader = PyPDF2.PdfReader(pdf_file)
    for page in reader.pages:
        text = page.extract_text()
        if not text:
            continue
        lines = text.strip().split("\n")
        # Locate the header row on this page, if it has one.
        header_index = next(
            (i for i, line in enumerate(lines) if "Order ID" in line), None
        )
        if header_index is not None:
            headers = [cell.strip() for cell in lines[header_index].split(",")]
            candidate_rows = lines[header_index + 1:]
        elif headers is not None:
            # Continuation page: the table carries on without a header row.
            candidate_rows = lines
        else:
            # No header seen yet, so there is nothing to map values onto.
            continue
        for line in candidate_rows:
            if not line.strip():
                continue  # blank lines are never data rows
            values = [cell.strip() for cell in line.split(",")]
            # Keep only well-formed rows, and drop a header row that is
            # repeated further down the same page.
            if len(values) == len(headers) and values != headers:
                order_data.append(dict(zip(headers, values)))
    return order_data
# Function to fetch order status using GROQ API
def fetch_order_status_from_groq(order_id, groq_api_key):
    """Look up one order's status and customer details over GraphQL.

    Args:
        order_id: Identifier sent as the ``$orderId`` query variable.
        groq_api_key: Bearer token placed in the ``Authorization`` header.

    Returns:
        The value of the ``getOrder`` field from the response (as returned by
        the endpoint) on success. On any failure, a string beginning with
        "Error fetching data from GROQ: " describing the problem; callers
        should treat a ``str`` result as an error.
    """
    # Fail fast on inputs that can never produce a valid request, instead of
    # sending "Bearer None" or an empty ID over the network.
    if not groq_api_key:
        return "Error fetching data from GROQ: GROQ_API_KEY is not set"
    if not order_id or not str(order_id).strip():
        return "Error fetching data from GROQ: order ID is empty"

    transport = RequestsHTTPTransport(
        url="https://api.groq.cloud/v1/graphql",  # Replace with your GROQ endpoint
        headers={"Authorization": f"Bearer {groq_api_key}"},
        verify=True,
        retries=3,
        timeout=10,  # seconds; keeps a stalled endpoint from hanging the app
    )
    client = Client(transport=transport, fetch_schema_from_transport=True)
    query = gql("""
        query GetOrder($orderId: String!) {
          getOrder(id: $orderId) {
            id
            status
            customer {
              name
              email
            }
          }
        }
    """)  # Replace with your GROQ query
    variables = {"orderId": order_id}
    try:
        result = client.execute(query, variable_values=variables)
        return result["getOrder"]
    except Exception as e:
        # Boundary handler: transport, GraphQL and response-shape errors are
        # all reported to the caller as an error string rather than raised.
        return f"Error fetching data from GROQ: {e}"
# Streamlit app
def main():
    """Render the Streamlit page: upload a PDF, list its orders, look one up.

    Flow: the user uploads a PDF; its order table is extracted and shown as a
    DataFrame; the user may then type an order ID, which is looked up through
    ``fetch_order_status_from_groq`` and displayed as JSON. Every failure is
    reported with ``st.error`` instead of being shown as a result.
    """
    st.title("Order Status App")
    uploaded_file = st.file_uploader("Upload Customer Orders PDF", type="pdf")
    if uploaded_file is None:
        return

    try:
        order_data = extract_order_data(uploaded_file)
    except Exception as exc:
        # UI boundary: an unreadable or corrupt PDF should yield a message,
        # not a raw traceback on the page.
        st.error(f"Failed to extract order data from PDF: {exc}")
        return
    if not order_data:
        st.error("Failed to extract order data from PDF.")
        return

    st.success("Order data extracted successfully!")
    st.dataframe(pd.DataFrame(order_data))  # Display the extracted rows

    order_id_to_check = st.text_input("Enter Order ID to check status:").strip()
    if not order_id_to_check:
        return

    order_status = fetch_order_status_from_groq(order_id_to_check, groq_api_key)
    if isinstance(order_status, str):
        # The fetch helper reports failures as a (truthy) error string, so it
        # must be distinguished from a real result before rendering.
        st.error(order_status)
    elif order_status:
        st.json(order_status)
    else:
        st.error("Could not retrieve order status.")


if __name__ == "__main__":
    main()