AGI-Screenplay-Pro

Running

App Files Files Community

openfree committed on Jul 17

Commit

c0cc8cf

verified ·

1 Parent(s): f3d6c8c

Update app.py

Browse files

Files changed (1) hide show

app.py +32 -36

app.py CHANGED Viewed

@@ -2872,49 +2872,45 @@ if __name__ == "__main__":
             return value.strip() if value else None
         return None
     def _parse_character_profile(self, content: str, role: str) -> CharacterProfile:
-        """Parse character profile from content"""
-        # Debug logging
         logger.debug(f"Parsing character profile for role: {role}")
         logger.debug(f"Content preview: {content[:200]}...")
-        # Extract name first - handle various formats
-        name = f"Character_{role}"  # default
         name_patterns = [
-            r'(?:이름|Name)[:\s]*([^,\n]+?)(?:\s*\([^)]+\))?\s*',
-            r'^\s*[-*•]\s*([^,\n]+?)(?:\s*\([^)]+\))?\s*',
-            r'^([^,\n]+?)(?:\s*\([^)]+\))?\s*'
         ]
-        for pattern in name_patterns:
-            name_match = re.search(pattern, content, re.IGNORECASE | re.MULTILINE)
-            if name_match and name_match.group(1):
-                extracted_name = name_match.group(1).strip()
-                # Remove markdown and extra characters
-                extracted_name = re.sub(r'[*:\s]+$', '', extracted_name)
-                extracted_name = re.sub(r'^[*:\s]+', '', extracted_name)
-                if extracted_name and len(extracted_name) > 1:
-                    name = extracted_name
                     break
-        # Helper function to extract clean fields
-        def extract_clean_field(patterns):
-            if isinstance(patterns, str):
-                patterns = [patterns]
-            for pattern in patterns:
-                # Improved pattern with better capturing groups
-                match = re.search(rf'{pattern}[:\s]*([^\n*]+?)(?=\n|$)', content, re.IGNORECASE | re.DOTALL)
-                if match and match.group(1):
-                    value = match.group(1).strip()
-                    # Clean up the value
-                    value = re.sub(r'^[-*•:\s]+', '', value)
-                    value = re.sub(r'[*]+', '', value)
-                    value = re.sub(r'\s+', ' ', value)
-                    if value:
-                        return value
             return ""
         # Extract all fields with safer extraction
         profile = CharacterProfile(
             name=name,

             return value.strip() if value else None
         return None
+from typing import List
     def _parse_character_profile(self, content: str, role: str) -> CharacterProfile:
+        """Parse character profile from content and return CharacterProfile dataclass"""
+        # --- 1. 로그 ---
         logger.debug(f"Parsing character profile for role: {role}")
         logger.debug(f"Content preview: {content[:200]}...")
+        # --- 2. 이름 추출 ---
+        name = f"Character_{role}"          # fallback
         name_patterns = [
+            r'(?:이름|Name)[:\s]*([^\n,(]+)',      # 예: "이름: 홍길동"
+            r'^\s*[-*•]\s*([^\n,(]+)',             # 예: "- 홍길동"
+            r'^([^\n,(]+)'                         # 문단 첫 단어
         ]
+        for pat in name_patterns:
+            m = re.search(pat, content, re.IGNORECASE | re.MULTILINE)
+            if m and m.group(1).strip():
+                extracted = m.group(1).strip()
+                # 마크다운 기호·불필요 문자 제거
+                extracted = re.sub(r'[\*:\s]+', '', extracted)
+                if len(extracted) > 1:
+                    name = extracted
                     break
+        # --- 3. 필드 추출 헬퍼 ---
+        def extract_clean_field(patterns) -> str:
+            patterns = [patterns] if isinstance(patterns, str) else patterns
+            for p in patterns:
+                m = re.search(rf'{p}[:\s]*([^\n*]+?)(?=\n|$)', content,
+                              re.IGNORECASE | re.DOTALL)
+                if m and m.group(1).strip():
+                    val = m.group(1).strip()
+                    val = re.sub(r'^[-*•:\s]+', '', val)
+                    val = re.sub(r'\*+', '', val)
+                    val = re.sub(r'\s+', ' ', val)
+                    return val
             return ""
         # Extract all fields with safer extraction
         profile = CharacterProfile(
             name=name,