Spaces:

acecalisto3
/

urld

Running

App Files Community

acecalisto3 committed on Apr 4

Commit

776de71

verified ·

1 Parent(s): 0ee778a

Update app.py

Browse files

Files changed (1) hide show

app.py +34 -34

app.py CHANGED Viewed

@@ -227,43 +227,43 @@ class FileProcessor:
         return chunks
-    def _process_single_file(self, file) -> List[Dict]:
-        """Process a single file"""
-        try:
-            file_stat = os.stat(file.name)
-            # For very large files, read in chunks and summarize
-            if file_stat.st_size > 100 * 1024 * 1024:  # 100MB
-                logger.info(f"Processing large file: {file.name} ({file_stat.st_size} bytes)")
-                # Read first and last 1MB for extremely large files
-                content = ""
-                with open(file.name, 'r', encoding='utf-8', errors='ignore') as f:
-                    content = f.read(1 * 1024 * 1024)  # First 1MB
-                    content += "\n...[Content truncated due to large file size]...\n"
-                    # Seek to the last 1MB
-                    f.seek(max(0, file_stat.st_size - 1 * 1024 * 1024))
-                    content += f.read()  # Last 1MB
-            else:
-                # Regular file processing
-                with open(file.name, 'r', encoding='utf-8', errors='ignore') as f:
-                    content = f.read()
-            return [{
-                'source',
-                'filename': os.path.basename(file.name),
-                'file_size': file_stat.st_size,
-                'mime_type': mimetypes.guess_type(file.name)[0],
-                'created': datetime.fromtimestamp(file_stat.st_ctime).isoformat(),
-                'modified': datetime.fromtimestamp(file_stat.st_mtime).isoformat(),
-                'content': content,
-                'timestamp': datetime.now().isoformat()
-            }]
-        except Exception as e:
-            logger.error(f"File processing error: {e}")
-            return []
 def clean_json(data: Union[str, Dict]) -> Optional[Dict]:
     """Clean and validate JSON data"""
     try:

         return chunks
+def _process_single_file(self, file) -> List[Dict]:
+    """Process a single file"""
+    try:
+        file_stat = os.stat(file.name)
+        # For very large files, read in chunks and summarize
+        if file_stat.st_size > 100 * 1024 * 1024:  # 100MB
+            logger.info(f"Processing large file: {file.name} ({file_stat.st_size} bytes)")
+            # Read first and last 1MB for extremely large files
+            content = ""
+            with open(file.name, 'r', encoding='utf-8', errors='ignore') as f:
+                content = f.read(1 * 1024 * 1024)  # First 1MB
+                content += "\n...[Content truncated due to large file size]...\n"
+                # Seek to the last 1MB
+                f.seek(max(0, file_stat.st_size - 1 * 1024 * 1024))
+                content += f.read()  # Last 1MB
+        else:
+            # Regular file processing
+            with open(file.name, 'r', encoding='utf-8', errors='ignore') as f:
+                content = f.read()
+        return [{
+            'source': 'filename',  # Assuming 'source' should be a string value
+            'filename': os.path.basename(file.name),
+            'file_size': file_stat.st_size,
+            'mime_type': mimetypes.guess_type(file.name)[0],
+            'created': datetime.fromtimestamp(file_stat.st_ctime).isoformat(),
+            'modified': datetime.fromtimestamp(file_stat.st_mtime).isoformat(),
+            'content': content,
+            'timestamp': datetime.now().isoformat()
+        }]
+    except Exception as e:
+        logger.error(f"File processing error: {e}")
+        return []
 def clean_json(data: Union[str, Dict]) -> Optional[Dict]:
     """Clean and validate JSON data"""
     try: