Spaces:

dschandra
/

ALNISFPO

Sleeping

dschandra committed on Dec 3, 2024

Commit

d4a05e1

verified ·

1 Parent(s): 62e4c88

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -35,6 +35,10 @@ def parse_po_items_with_filters(text):
     """
     Parses purchase order items from the extracted text using regex with filters.
     Ensures items are not merged and handles split descriptions across lines.
     """
     lines = text.splitlines()
     data = []
@@ -106,7 +110,7 @@ def parse_po_items_with_filters(text):
                 # Remove the extracted portion from item 2's description
                 row["Description"] = row["Description"].replace(item_3_description.group(), "").strip()
-    # Clean specific patterns from item 7
     for item in data:
         if item["Item"] == "7":
             # Remove unwanted text from description

     """
     Parses purchase order items from the extracted text using regex with filters.
     Ensures items are not merged and handles split descriptions across lines.
+    Args:
+        text (str): Extracted text from the PDF.
+    Returns:
+        tuple: A DataFrame with parsed data and a status message.
     """
     lines = text.splitlines()
     data = []
                 # Remove the extracted portion from item 2's description
                 row["Description"] = row["Description"].replace(item_3_description.group(), "").strip()
+    # Ensure each description's additional data is handled properly
     for item in data:
         if item["Item"] == "7":
             # Remove unwanted text from description