Founder_Name_Extraction_v3

Sleeping

App Files Files Community

dygoo committed on Jun 8

Commit

e032085

verified ·

1 Parent(s): 661d298

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -9

app.py CHANGED Viewed

@@ -32,7 +32,7 @@ def search_articles(name: str) -> str:
 def extract_entities(search_results: str) -> str:
     """Extract entities using Mistral 7B endpoint"""
     modal_endpoint = "https://msoaresdiego--mistral-llm-endpoint-fastapi-app.modal.run/generate"
-    prompt = f"""Extract all person names and organization names from the following text.Do not extract products and service names. Only individuals and organizations.Bring the full details of the name in the newspaper article. For example, if only ACME is mentioned as company name, bring only ACME. IF ACME Inc is mentioned as company name, then you have to extract ACME Inc. Please also bring the relationship between the entity and the company that is being searched. For example, is ACME Inc an owner of the company being searched. Is ACME Inc. a funder of the company being searched?
 Format as:
 PERSON: [name]
 ORG: [organization name]
@@ -40,7 +40,7 @@ Text: {search_results}"""
     try:
         response = requests.post(
             modal_endpoint,
-            json={"prompt": prompt, "max_tokens": 500, "temperature": 0.05}
         )
         if response.status_code == 200:
             return response.json().get("response", "No entities extracted")
@@ -53,7 +53,7 @@ Text: {search_results}"""
 # === Gradio interface ===
 def process_name_with_progress(name: str, progress=gr.Progress()):
-    """Process name with streamed debug updates to help diagnose issues"""
     if not name.strip():
         yield "No name provided", "", ""
         return
@@ -65,26 +65,26 @@ def process_name_with_progress(name: str, progress=gr.Progress()):
     try:
         # Step 1: Search
         progress(0.1, desc="Searching for articles...")
-        search_results += f"[DEBUG] Starting search for: {name}\n"
         yield search_results, "", ""
         search_start = time.time()
         articles_output = search_articles(name.strip())
         search_time = time.time() - search_start
-        search_results += f"[DEBUG] Search completed in {search_time:.2f}s\n"
         search_results += f"{articles_output}\n"
         yield search_results, "", ""
         # Step 2: Extract entities
         progress(0.5, desc="Extracting entities...")
-        search_results += "[DEBUG] Starting entity extraction...\n"
-        yield search_results, "[DEBUG] Extracting entities...", ""
         extract_start = time.time()
         entities = extract_entities(articles_output)
         extract_time = time.time() - extract_start
-        search_results += f"[DEBUG] Entity extraction completed in {extract_time:.2f}s\n"
         yield search_results, entities, ""
@@ -107,7 +107,7 @@ with gr.Blocks(title="Related Entitites Finder") as demo:
     with gr.Column():
-        output1 = gr.Textbox(label="Search Results", lines=10, max_lines=30)
         output2 = gr.Textbox(label="Extracted Entities and Relationships", lines=5, max_lines=10)
     search_btn.click(

 def extract_entities(search_results: str) -> str:
     """Extract entities using Mistral 7B endpoint"""
     modal_endpoint = "https://msoaresdiego--mistral-llm-endpoint-fastapi-app.modal.run/generate"
+    prompt = f"""Extract all person names and organization names from the following text.Do not extract products and service names. Only individuals and organizations.Bring the full details of the name in the newspaper article. For example, if only ACME is mentioned as company name, bring only ACME. IF ACME Inc is mentioned as company name, then you have to extract ACME Inc. In addition, define the relationship between the entity and the company that is being searched. For example, is ACME Inc an owner of the company being searched? Then write 'owner'. Is ACME Inc. a funder of the company being searched? Then write 'funder'
 Format as:
 PERSON: [name]
 ORG: [organization name]
     try:
         response = requests.post(
             modal_endpoint,
+            json={"prompt": prompt, "max_tokens": 2500, "temperature": 0.15}
         )
         if response.status_code == 200:
             return response.json().get("response", "No entities extracted")
 # === Gradio interface ===
 def process_name_with_progress(name: str, progress=gr.Progress()):
+    """Process name """
     if not name.strip():
         yield "No name provided", "", ""
         return
     try:
         # Step 1: Search
         progress(0.1, desc="Searching for articles...")
+        search_results += f"Starting search for: {name}\n"
         yield search_results, "", ""
         search_start = time.time()
         articles_output = search_articles(name.strip())
         search_time = time.time() - search_start
+        search_results += f"Search completed in {search_time:.2f}s\n"
         search_results += f"{articles_output}\n"
         yield search_results, "", ""
         # Step 2: Extract entities
         progress(0.5, desc="Extracting entities...")
+        search_results += "Starting entity extraction...\n"
+        yield search_results, "Extracting entities...", ""
         extract_start = time.time()
         entities = extract_entities(articles_output)
         extract_time = time.time() - extract_start
+        search_results += f"Entity extraction completed in {extract_time:.2f}s\n"
         yield search_results, entities, ""
     with gr.Column():
+        output1 = gr.Textbox(label="Search Results", lines=50, max_lines=100)
         output2 = gr.Textbox(label="Extracted Entities and Relationships", lines=5, max_lines=10)
     search_btn.click(