Spaces:

SohomToom
/

ComicBookCleaner

Running

App Files Files Community

SohomToom committed on May 2

Commit

89815d3

verified ·

1 Parent(s): cd98f1b

Upload app.py

Browse files

Files changed (1) hide show

app.py +44 -14

app.py CHANGED Viewed

@@ -39,20 +39,35 @@ def sample_border_color(image, box, padding=2):
     median_color = np.median(border_pixels, axis=0)
     return tuple(map(int, median_color))
-def detect_text_boxes(image):
-    results = ocr.ocr(image, cls=True)
-    if not results or not results[0]:
         return []
-    boxes = []
-    for line in results[0]:
-        box, (text, confidence) = line
-        if text.strip():
-            x_min = int(min(pt[0] for pt in box))
-            x_max = int(max(pt[0] for pt in box))
-            y_min = int(min(pt[1] for pt in box))
-            y_max = int(max(pt[1] for pt in box))
-            boxes.append(((x_min, y_min, x_max, y_max), text, confidence))
-    return boxes
 def remove_text_dynamic_fill(img_path, output_path):
     image = cv2.imread(img_path)
@@ -106,8 +121,23 @@ def process_folder(input_files):
         output_path = os.path.join(temp_output, filename)
         remove_text_dynamic_fill(file.name, output_path)
-    zip_path = shutil.make_archive(temp_output, 'zip', temp_output)
     return zip_path
 demo = gr.Interface(
     fn=process_folder,

     median_color = np.median(border_pixels, axis=0)
     return tuple(map(int, median_color))
def detect_text_boxes(image, max_dim=1280):
    """Run OCR on ``image`` and return axis-aligned boxes around detected text.

    Images whose longest side exceeds ``max_dim`` are downscaled before OCR to
    reduce memory load. Box coordinates are mapped back to the coordinate
    system of the image that was passed in, so callers can apply them to the
    original pixels directly.

    Args:
        image: Image array exposing ``.shape`` as ``(height, width, ...)``.
        max_dim: Maximum allowed length, in pixels, of the longest side fed
            to the OCR engine.

    Returns:
        A list of ``((x_min, y_min, x_max, y_max), text, confidence)`` tuples,
        one per OCR line with non-blank text. Returns an empty list when
        nothing is detected or when OCR fails (best-effort: the failure is
        printed, not raised).
    """
    try:
        height, width = image.shape[:2]
        # Factors that map OCR coordinates back onto the original image.
        scale_x = scale_y = 1.0
        longest_side = max(height, width)
        if longest_side > max_dim:
            scale = max_dim / float(longest_side)
            # Clamp to 1px so extreme aspect ratios never yield a zero-sized
            # target for cv2.resize.
            new_width = max(1, int(width * scale))
            new_height = max(1, int(height * scale))
            image = cv2.resize(image, (new_width, new_height))
            scale_x = width / float(new_width)
            scale_y = height / float(new_height)

        # Use the module-level OCR engine instance (as the previous revision
        # of this function did); calling the method on the PaddleOCR class
        # itself binds ``image`` as ``self`` and fails.
        results = ocr.ocr(image, cls=True)
        # ``not results`` covers both None and an empty list, so indexing
        # ``results[0]`` below cannot raise IndexError.
        if not results or not results[0]:
            print("No OCR results found or OCR returned None.")
            return []

        boxes = []
        # Each entry unpacks as (polygon points, (text, confidence)).
        for box, (text, confidence) in results[0]:
            if not text.strip():
                continue
            xs = [pt[0] * scale_x for pt in box]
            ys = [pt[1] * scale_y for pt in box]
            bounds = (int(min(xs)), int(min(ys)), int(max(xs)), int(max(ys)))
            boxes.append((bounds, text, confidence))
        return boxes
    except Exception as e:
        # Deliberate best-effort boundary: one bad image must not abort the
        # whole batch, so report the failure and return no boxes.
        print(f"OCR failed on image: {e}")
        return []
 def remove_text_dynamic_fill(img_path, output_path):
     image = cv2.imread(img_path)
         output_path = os.path.join(temp_output, filename)
         remove_text_dynamic_fill(file.name, output_path)
+    zip_path = "/tmp/cleaned_output.zip"
+    zip_folder(output_path, zip_path)
     return zip_path
+import zipfile
def zip_folder(folder_path, output_zip):
    """Write every file found under ``folder_path`` into a new zip archive.

    Files are stored with paths relative to ``folder_path``, so the archive
    does not contain the folder's absolute location. An existing file at
    ``output_zip`` is overwritten.

    Args:
        folder_path: Directory that is walked recursively for files to add.
        output_zip: Path of the zip archive to create.
    """
    # Resolved once so the archive can be recognised if the walk reaches it.
    archive_path = os.path.realpath(output_zip)
    with zipfile.ZipFile(output_zip, 'w', zipfile.ZIP_DEFLATED) as zipf:
        for root, _, files in os.walk(folder_path):
            for file in files:
                file_path = os.path.join(root, file)
                # When the archive lives inside the folder being zipped, the
                # walk would otherwise add the half-written archive to itself.
                if os.path.realpath(file_path) == archive_path:
                    continue
                arcname = os.path.relpath(file_path, folder_path)
                zipf.write(file_path, arcname)
 demo = gr.Interface(
     fn=process_folder,