Spaces:

dschandra
/

ALNISFPO

Sleeping

dschandra committed on Dec 3, 2024

Commit

391b6b5

verified ·

1 Parent(s): e31a32d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -37,6 +37,7 @@ def clean_description(description, item_number=None):
 def parse_po_items_with_filters(text):
     """
     Parses purchase order items from the extracted text systematically, avoiding merging issues.
     """
     lines = text.splitlines()
     data = []
@@ -91,12 +92,13 @@ def parse_po_items_with_filters(text):
         )
         data.append(current_item)
-    # Final cleanup to handle special cases (e.g., splitting merged items)
     for i, row in enumerate(data):
         if row["Item"] == "2" and "As per Drg. to." in row["Description"]:
-            # Dynamically split merged descriptions
             item_3_match = re.search(r"As per Drg. to. G000810.*Mfd:-2022", row["Description"])
             if item_3_match:
                 data.insert(
                     i + 1,
                     {
@@ -108,9 +110,10 @@ def parse_po_items_with_filters(text):
                         "Total Price": "45.60",
                     },
                 )
                 row["Description"] = row["Description"].replace(item_3_match.group(), "").strip()
-    # Filter out invalid rows
     data = [row for row in data if row["Description"]]
     # Return data as a DataFrame

 def parse_po_items_with_filters(text):
     """
     Parses purchase order items from the extracted text systematically, avoiding merging issues.
+    Ensures Item 3 is split correctly from Item 2.
     """
     lines = text.splitlines()
     data = []
         )
         data.append(current_item)
+    # Split merged descriptions and assign items
     for i, row in enumerate(data):
         if row["Item"] == "2" and "As per Drg. to." in row["Description"]:
+            # Dynamically split merged descriptions for Item 3
             item_3_match = re.search(r"As per Drg. to. G000810.*Mfd:-2022", row["Description"])
             if item_3_match:
+                # Insert Item 3 into the data list
                 data.insert(
                     i + 1,
                     {
                         "Total Price": "45.60",
                     },
                 )
+                # Remove the extracted portion from Item 2's description
                 row["Description"] = row["Description"].replace(item_3_match.group(), "").strip()
+    # Clean and finalize descriptions
     data = [row for row in data if row["Description"]]
     # Return data as a DataFrame