Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -56,8 +56,8 @@ class URLProcessor:
|
|
56 |
to_ascii=True,
|
57 |
lower=True,
|
58 |
no_line_breaks=True,
|
59 |
-
no_urls=True,
|
60 |
-
no_emails=True,
|
61 |
no_phone_numbers=True,
|
62 |
no_numbers=False,
|
63 |
no_digits=False,
|
@@ -177,7 +177,7 @@ class FileProcessor:
|
|
177 |
|
178 |
def __init__(self, max_file_size: int = 2 * 1024 * 1024 * 1024): # 2GB default
|
179 |
self.max_file_size = max_file_size
|
180 |
-
self.supported_text_extensions = {'.txt', '.md', '.csv', '.json', '.xml'}
|
181 |
|
182 |
def is_text_file(self, filepath: str) -> bool:
|
183 |
"""Check if file is a text file"""
|
|
|
56 |
to_ascii=True,
|
57 |
lower=True,
|
58 |
no_line_breaks=True,
|
59 |
+
no_urls=False,
|
60 |
+
no_emails=False,
|
61 |
no_phone_numbers=True,
|
62 |
no_numbers=False,
|
63 |
no_digits=False,
|
|
|
177 |
|
178 |
def __init__(self, max_file_size: int = 2 * 1024 * 1024 * 1024): # 2GB default
|
179 |
self.max_file_size = max_file_size
|
180 |
+
self.supported_text_extensions = {'.txt', '.md', '.csv', '.json', '.xml', '.zip', '.pdf', '.rtf', '.tar'}
|
181 |
|
182 |
def is_text_file(self, filepath: str) -> bool:
|
183 |
"""Check if file is a text file"""
|