Spaces:

mroccuper
/

Content-Transformation

Sleeping

mroccuper committed on May 4

Commit

0a52165

verified ·

1 Parent(s): d038cad

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,7 +3,6 @@ import gradio as gr
 import requests
 from bs4 import BeautifulSoup
 import google.generativeai as genai
-from newspaper import Article
 import os
 # Configure Gemini API
@@ -11,13 +10,17 @@ GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
 genai.configure(api_key=GEMINI_API_KEY)
 def fetch_article_content(url):
-    """Extract article content from URL"""
     try:
-        # Using newspaper3k for better article extraction
-        article = Article(url)
-        article.download()
-        article.parse()
-        return article.text
     except Exception as e:
         return f"Error fetching article: {str(e)}"
@@ -85,7 +88,7 @@ app = gr.Interface(
     examples=[
         ["https://example.com/sample-article"]
     ],
-    title="Article to Platform Post Converter",
     description="Convert news articles into optimized Reddit/Quora-style posts with AI-generated formatting and image descriptions"
 )

 import requests
 from bs4 import BeautifulSoup
 import google.generativeai as genai
 import os
 # Configure Gemini API
 genai.configure(api_key=GEMINI_API_KEY)
 def fetch_article_content(url):
     """Fetch a web page and return the text of its <p> elements.

     Args:
         url: Address of the article to download.

     Returns:
         The stripped text of every non-empty <p> element, joined with
         single spaces. If anything goes wrong (network failure, HTTP error
         status, parsing problem) a string starting with
         "Error fetching article: " is returned instead of raising.
     """
     try:
         headers = {'User-Agent': 'Mozilla/5.0'}
         response = requests.get(url, headers=headers, timeout=10)
         response.raise_for_status()
         # Only trust the HTTP-level encoding when the server actually
         # declared a charset. Without one, requests falls back to
         # ISO-8859-1 for text/* responses, which garbles UTF-8 pages.
         content_type = response.headers.get('Content-Type', '')
         declared_encoding = (
             response.encoding if 'charset' in content_type.lower() else None
         )
         # Hand BeautifulSoup the raw bytes so it can detect the encoding
         # from the document itself (e.g. <meta charset>) when the header
         # gives no hint.
         soup = BeautifulSoup(
             response.content,
             'html.parser',
             from_encoding=declared_encoding,
         )
         # Extract text from <p> tags, skipping empty paragraphs so the
         # joined result does not contain runs of stray spaces.
         texts = (p.get_text(strip=True) for p in soup.find_all('p'))
         return ' '.join(text for text in texts if text)
     except Exception as e:
         # Deliberately broad: this feeds a UI, so every failure is
         # reported as a message rather than propagated.
         return f"Error fetching article: {str(e)}"
     examples=[
         ["https://example.com/sample-article"]
     ],
+    title="Article to Reddit/Quora Post Converter",
     description="Convert news articles into optimized Reddit/Quora-style posts with AI-generated formatting and image descriptions"
 )