Spaces:

dschandra
/

ALNISFPO

Sleeping

App Files Files Community

dschandra committed on Dec 7, 2024

Commit

c0dd2b0

verified ·

1 Parent(s): e7e2d2c

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -15

app.py CHANGED Viewed

@@ -35,14 +35,14 @@ def clean_description(description, item_number=None):
     return description.strip()
-  # Function: Clean Description (Basic cleaning logic)
-def clean_description(description, item_number):
     """
     Cleans up the description for an item to ensure it's correctly formatted.
     """
     return description.strip()
-# Function to extract PO Items with filters and better error handling
 def parse_po_items_with_filters(text):
     """
     Parses purchase order items from the extracted text systematically.
@@ -52,6 +52,10 @@ def parse_po_items_with_filters(text):
     current_item = None
     description_accumulator = []
     for line in lines:
         print(f"Processing Line: {line}")  # Debugging
@@ -62,10 +66,8 @@ def parse_po_items_with_filters(text):
             # Save the previous item if current_item is not None
             if current_item is not None:
-                current_item["Description"] = clean_description(
-                    " ".join(description_accumulator).strip(),
-                    item_number=int(current_item["Item"]),
-                )
                 data.append(current_item)
                 description_accumulator = []  # Reset description accumulator
                 print(f"Item {current_item['Item']} added to data.")  # Debugging
@@ -84,8 +86,8 @@ def parse_po_items_with_filters(text):
             # Accumulate additional lines for the current item's description
             description_accumulator.append(line.strip())
-        # Match Qty, Unit, Unit Price, and Total Price
-        qty_match = re.search(r"(?P<Qty>\d+)\s+(Nos\.|Set|pcs)", line)
         if qty_match:
             print(f"Qty match found: {qty_match.group('Qty')} {qty_match.group(2)}")  # Debugging
             current_item["Qty"] = qty_match.group("Qty")
@@ -94,7 +96,7 @@ def parse_po_items_with_filters(text):
             print(f"No Qty match found in line: {line}")  # Debugging
         # Match Unit Price and Total Price
-        price_match = re.search(r"(?P<UnitPrice>[\d.]+)\s+(?P<TotalPrice>[\d.]+)$", line)
         if price_match:
             print(f"Price match found: {price_match.group('UnitPrice')} {price_match.group('TotalPrice')}")  # Debugging
             current_item["Unit Price"] = price_match.group("UnitPrice")
@@ -104,14 +106,12 @@ def parse_po_items_with_filters(text):
     # Finalize the last item
     if current_item is not None:
-        current_item["Description"] = clean_description(
-            " ".join(description_accumulator).strip(),
-            item_number=int(current_item["Item"]),
-        )
         data.append(current_item)
         print(f"Finalized Item {current_item['Item']}")  # Debugging
-    # Split merged descriptions and assign items
     for i, row in enumerate(data):
         if row["Item"] == "2" and "Mfd:-2022" in row["Description"]:  # Find the item description boundary
             item_3_match = re.search(

     return description.strip()
+ # Function to clean item description
+def clean_description(description):
     """
     Cleans up the description for an item to ensure it's correctly formatted.
     """
     return description.strip()
+# Function to extract PO items with better error handling and checks
 def parse_po_items_with_filters(text):
     """
     Parses purchase order items from the extracted text systematically.
     current_item = None
     description_accumulator = []
+    # Regex patterns
+    qty_pattern = r"(?P<Qty>\d+)\s+(Nos\.|Set|pcs)"  # Match quantities
+    price_pattern = r"(?P<UnitPrice>[\d.]+)\s+(?P<TotalPrice>[\d.]+)$"  # Match prices
     for line in lines:
         print(f"Processing Line: {line}")  # Debugging
             # Save the previous item if current_item is not None
             if current_item is not None:
+                # Clean and add the description to the current item
+                current_item["Description"] = clean_description(" ".join(description_accumulator).strip())
                 data.append(current_item)
                 description_accumulator = []  # Reset description accumulator
                 print(f"Item {current_item['Item']} added to data.")  # Debugging
             # Accumulate additional lines for the current item's description
             description_accumulator.append(line.strip())
+        # Match Qty (quantity) in the line
+        qty_match = re.search(qty_pattern, line)
         if qty_match:
             print(f"Qty match found: {qty_match.group('Qty')} {qty_match.group(2)}")  # Debugging
             current_item["Qty"] = qty_match.group("Qty")
             print(f"No Qty match found in line: {line}")  # Debugging
         # Match Unit Price and Total Price
+        price_match = re.search(price_pattern, line)
         if price_match:
             print(f"Price match found: {price_match.group('UnitPrice')} {price_match.group('TotalPrice')}")  # Debugging
             current_item["Unit Price"] = price_match.group("UnitPrice")
     # Finalize the last item
     if current_item is not None:
+        # Clean and add the description to the current item
+        current_item["Description"] = clean_description(" ".join(description_accumulator).strip())
         data.append(current_item)
         print(f"Finalized Item {current_item['Item']}")  # Debugging
+    # Split merged descriptions and assign items (if necessary)
     for i, row in enumerate(data):
         if row["Item"] == "2" and "Mfd:-2022" in row["Description"]:  # Find the item description boundary
             item_3_match = re.search(