Spaces:

Macro27
/

OCR

Sleeping

OCR / main.py

Marco

initial commit

3bc9036 12 months ago

2.79 kB

	import streamlit as st
	from streamlit_webrtc import webrtc_streamer, WebRtcMode
	from src.system_initializer import SystemInitializer
	from src.video_processor import VideoProcessor
	from src.utilities import Utilities

	import warnings
	warnings.filterwarnings("ignore") # Ignore warnings for a cleaner output

	class OCRChatbotApp:
	    """Streamlit page combining a WebRTC camera stream, OCR controls and a chatbot.

	    The object is cheap glue: it builds the backend helpers in ``__init__`` and
	    renders the whole page in ``run()``.
	    """

	    def __init__(self):
	        """Create the backend helpers and set the default processing parameters."""
	        # Initialize the system components
	        self.system_initializer = SystemInitializer()
	        self.utilities = Utilities()
	        # Initialize queues and start OCR thread (per the original author's note;
	        # the returned object is handed unchanged to every VideoProcessor).
	        self.queues = self.system_initializer.initialize_system()
	        self.conf_thresh = 50  # Default confidence threshold for OCR
	        self.n = 5  # Process every n frames
	        self.k = 30  # Number of frames to keep annotations

	    def _toggle_freeze(self):
	        """Flip the frozen flag and, when freezing, capture the likely text.

	        Registered as the button's ``on_click`` callback so the state change is
	        applied before the script body runs; the button label rendered in that
	        same run therefore already reflects the new state.
	        """
	        now_frozen = not st.session_state.camera_frozen
	        st.session_state.camera_frozen = now_frozen
	        if now_frozen:
	            # Fetch likely text when camera is frozen
	            st.session_state.likely_text = self.utilities.fetch_likely_text()

	    def run(self):
	        """Render the page: controls, camera stream, detected text and chatbot."""
	        st.title('OCR and Chatbot Application')  # Set the title of the Streamlit app

	        # Initialize session state variables if they don't exist
	        if "camera_frozen" not in st.session_state:
	            st.session_state.update({"camera_frozen": False, "latest": [], "likely_text": ""})

	        # Sliders for the confidence threshold and the frame processing interval.
	        # Their initial positions come from the defaults set in __init__ so the
	        # two places cannot drift apart.
	        self.conf_thresh = st.slider('Confidence Threshold', 0, 100, self.conf_thresh)
	        self.n = st.slider('Process every n frames', 1, 30, self.n)

	        # Button to freeze or resume the camera. The toggle itself happens in the
	        # callback; doing it inline after st.button() would leave the label one
	        # click behind the actual state.
	        button_label = "Resume" if st.session_state.camera_frozen else "Freeze"
	        st.button(button_label, on_click=self._toggle_freeze)

	        # Define constraints for higher resolution video capture
	        constraints = {
	            "video": {
	                "width": {"ideal": 1280},
	                "height": {"ideal": 720},
	                "frameRate": {"ideal": 30},
	            },
	            "audio": False,
	        }

	        # Start the WebRTC streamer with the specified constraints and video processor.
	        # The factory reads the slider values at the moment it is invoked.
	        # NOTE(review): whether later slider changes reach an already-running
	        # processor depends on when streamlit-webrtc calls the factory - confirm.
	        webrtc_streamer(
	            key="example",
	            video_processor_factory=lambda: VideoProcessor(
	                self.queues, self.conf_thresh, self.n, self.k
	            ),
	            media_stream_constraints=constraints,
	            async_processing=True,
	        )

	        # Display the likely text if the camera is frozen; the fallback message is
	        # shown both when nothing was captured and while the camera is live.
	        if st.session_state.camera_frozen and st.session_state.likely_text:
	            st.write(st.session_state.likely_text)
	        else:
	            st.write("No text found")

	        # Run the chatbot
	        self.system_initializer.run_chatbot()

	if __name__ == '__main__':
	    # When executed as a script, build the application object and render its UI.
	    OCRChatbotApp().run()