BF

Running

SamiKoen Claude committed on 8 days ago

Commit

03d4524

1 Parent(s): ceaee51

Akıllı kelime filtreleme - spesifik kelime yok

- Consonant/vowel oranına göre filtreleme
- Alphanumeric kodları koru
- 2-3 harfli product kodları tanı
- Tamamen genel algoritma

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>

Files changed (1) hide show

app.py +33 -9

app.py CHANGED Viewed

@@ -53,18 +53,42 @@ def get_warehouse_stock(product_name):
         query = normalize(product_name.strip()).replace('(2026)', '').replace('(2025)', '').strip()
         words = query.split()
-        # Words to ignore in product search
-        ignore_words = ['var', 'mi', 'mı', 'mu', 'mü', 'varmi', 'varmı', 'beden', 'size', 'boy',
-                       'stok', 'stokta', 'mevcut', 'hangi', 'magazada', 'nerede', 'kaç', 'adet', 'tane',
-                       'trek', 'bisiklet', 'bike']
-        # Find size
         sizes = ['s', 'm', 'l', 'xl', 'xs', 'xxl', 'ml']
         size = next((w for w in words if w in sizes), None)
-        # Filter product words - remove sizes and question words
-        # Keep numbers (like 6, 7, 8) and words longer than 1 char
-        product_words = [w for w in words if w not in sizes and w not in ignore_words and (len(w) > 1 or w.isdigit())]
         print(f"DEBUG - Searching: {' '.join(product_words)}, Size: {size}")

         query = normalize(product_name.strip()).replace('(2026)', '').replace('(2025)', '').strip()
         words = query.split()
+        # Find size markers (S, M, L, etc.)
         sizes = ['s', 'm', 'l', 'xl', 'xs', 'xxl', 'ml']
         size = next((w for w in words if w in sizes), None)
+        # Smart filtering: Keep only meaningful product identifiers
+        product_words = []
+        # First pass: identify what looks like product terms
+        for word in words:
+            # Skip if it's a size marker
+            if word in sizes:
+                continue
+            # Always keep numbers (model numbers like 6, 7, 8)
+            if word.isdigit():
+                product_words.append(word)
+            # Keep alphanumeric codes (like "sl6", "gen8")
+            elif any(c.isdigit() for c in word) and any(c.isalpha() for c in word):
+                product_words.append(word)
+            # Keep 2-3 letter codes (often product codes like "sl", "slr", "emx")
+            elif 2 <= len(word) <= 3 and word.isalpha():
+                # Check if it has consonants (likely a code, not a particle)
+                if any(c not in 'aeiou' for c in word):
+                    product_words.append(word)
+            # Keep longer words that have good consonant/vowel mix (likely product names)
+            elif len(word) > 3:
+                # Calculate consonant ratio
+                consonants = sum(1 for c in word if c not in 'aeiou')
+                vowels = len(word) - consonants
+                # Product names usually have balanced or consonant-heavy distribution
+                # Turkish question words are often vowel-heavy
+                if consonants >= vowels * 0.5:  # At least 1 consonant per 2 vowels
+                    product_words.append(word)
         print(f"DEBUG - Searching: {' '.join(product_words)}, Size: {size}")