Spaces:

gauri-sharan
/

test-two

Sleeping

gauri-sharan committed on Sep 29, 2024

Commit

47c68aa

verified ·

1 Parent(s): ecba862

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -41,7 +41,7 @@ def ocr_and_extract(image, text_query):
         )
         # Perform the search query on the indexed image
-        results = rag_model.search(text_query, k=1)  # Removed index_name argument
         # Prepare the input for Qwen2-VL
         image_data = Image.open(temp_image_path)
@@ -74,10 +74,13 @@ def ocr_and_extract(image, text_query):
             generated_ids, skip_special_tokens=True, clean_up_tokenization_spaces=False
         )
         # Clean up the temporary file
         os.remove(temp_image_path)
-        return output_text[0]
     except Exception as e:
         error_message = str(e)

         )
         # Perform the search query on the indexed image
+        results = rag_model.search(text_query, k=1)
         # Prepare the input for Qwen2-VL
         image_data = Image.open(temp_image_path)
             generated_ids, skip_special_tokens=True, clean_up_tokenization_spaces=False
         )
+        # Filter out system and user prompts
+        filtered_output = [line for line in output_text[0].split("\n") if not any(kw in line.lower() for kw in ["system", "user"])]
         # Clean up the temporary file
         os.remove(temp_image_path)
+        return "\n".join(filtered_output)
     except Exception as e:
         error_message = str(e)