Spaces:

Macro27
/

OCR

Sleeping

OCR

File size: 2,789 Bytes

3bc9036

import streamlit as st
from streamlit_webrtc import webrtc_streamer, WebRtcMode
from src.system_initializer import SystemInitializer
from src.video_processor import VideoProcessor
from src.utilities import Utilities

import warnings
warnings.filterwarnings("ignore")  # Ignore warnings for a cleaner output

class OCRChatbotApp:
    def __init__(self):
        # Initialize the system components
        self.system_initializer = SystemInitializer()
        self.utilities = Utilities()
        self.queues = self.system_initializer.initialize_system()  # Initialize queues and start OCR thread
        self.conf_thresh = 50  # Default confidence threshold for OCR
        self.n = 5  # Process every n frames
        self.k = 30  # Number of frames to keep annotations

    def run(self):
        st.title('OCR and Chatbot Application')  # Set the title of the Streamlit app

        # Initialize session state variables if they don't exist
        if "camera_frozen" not in st.session_state:
            st.session_state.update({"camera_frozen": False, "latest": [], "likely_text": ""})

        # Create sliders for adjusting confidence threshold and frame processing interval
        self.conf_thresh = st.slider('Confidence Threshold', 0, 100, 50)
        self.n = st.slider('Process every n frames', 1, 30, 5)

        # Button to freeze or resume the camera
        if st.button("Freeze" if not st.session_state.camera_frozen else "Resume"):
            st.session_state.camera_frozen = not st.session_state.camera_frozen
            if st.session_state.camera_frozen:
                st.session_state.likely_text = self.utilities.fetch_likely_text()  # Fetch likely text when camera is frozen

        # Define constraints for higher resolution video capture
        constraints = {
            "video": {
                "width": {"ideal": 1280},
                "height": {"ideal": 720},
                "frameRate": {"ideal": 30}
            },
            "audio": False
        }

        # Initialize the WebRTC streamer with the specified constraints and video processor
        webrtc_ctx = webrtc_streamer(
            key="example",
            video_processor_factory=lambda: VideoProcessor(self.queues, self.conf_thresh, self.n, self.k),
            media_stream_constraints=constraints,
            async_processing=True,
        )

        # Display the likely text if the camera is frozen
        if st.session_state.camera_frozen and st.session_state.likely_text:
            st.write(st.session_state.likely_text)
        else:
            st.write("No text found")

        # Run the chatbot
        self.system_initializer.run_chatbot()

if __name__ == '__main__':
    app = OCRChatbotApp()  # Create an instance of the OCRChatbotApp
    app.run()  # Run the app