Update app.py
app.py CHANGED
@@ -17,13 +17,10 @@ def load_models():
 RAG, model, processor = load_models()
 
 # Function for OCR and search
+# Skip RAG search and use Qwen2VL for direct OCR
 def ocr_and_search(image, keyword):
     # Hardcoded query to extract text in English, Sanskrit, and Hindi
     text_query = "Extract all the text in English, Sanskrit, and Hindi from the image."
-    results = RAG.search(text_query, k=1)
-
-    if not results:  # Check if results are empty
-        return "No results found for the given query.", [], "{}"
 
     # Prepare message for Qwen model
     messages = [

@@ -66,6 +63,7 @@ def ocr_and_search(image, keyword):
 
     return extracted_text, matched_sentences, json_output
 
+
 # Gradio App function
 def app(image, keyword):
     # Call OCR and search function