Spaces:

loayshabet
/

news-sumarry

Running

App Files Files Community

loayshabet committed on Nov 26, 2024

Commit

29c7963

verified ·

1 Parent(s): 2267b2b

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -28

app.py CHANGED Viewed

@@ -17,36 +17,13 @@ logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(
 SUMMARIZER_MODEL = "facebook/bart-large-cnn"  # You can replace this with other summarization models
 CACHE_SIZE = 500  # Maximum number of cached summaries
 RSS_FETCH_INTERVAL = timedelta(hours=8)  # Fetch recent news within the last 8 hours
-TIMEOUT_LIMIT = 30  # Maximum time in seconds to process summaries
 # News sources
 NEWS_SOURCES = {
-     "Technology": {
-        "TheNewYorkTimes": "https://rss.nytimes.com/services/xml/rss/nyt/Technology.xml",
-        "reutersagency": "https://www.reutersagency.com/feed/?best-topics=tech&post_type=best"
-    },
-    "Business": {
-        "TheNewYorkTimes": "https://rss.nytimes.com/services/xml/rss/nyt/Business.xml",
-        "reutersagency": "https://www.reutersagency.com/feed/?best-topics=business-finance&post_type=best"
-    },
-    "Science": {
-        "TheNewYorkTimes": "https://rss.nytimes.com/services/xml/rss/nyt/Science.xml"
-    },
-    "World News": {
-        "TheNewYorkTimes": "https://rss.nytimes.com/services/xml/rss/nyt/World.xml",
-        "BBC": "http://feeds.bbci.co.uk/news/world/rss.xml",
-        "CNN": "http://rss.cnn.com/rss/edition_world.rss",
-        "reutersagency": "https://www.reutersagency.com/feed/?taxonomy=best-regions&post_type=best"
-    },
-    "Sports": {
-        "TheNewYorkTimes": "https://rss.nytimes.com/services/xml/rss/nyt/Sports.xml",
-        "reutersagency": "https://www.reutersagency.com/feed/?best-topics=sports&post_type=best"
-    },
-    "Health": {
-        "TheNewYorkTimes": "https://rss.nytimes.com/services/xml/rss/nyt/Health.xml",
-        "politico": "http://rss.politico.com/healthcare.xml",
-        "reutersagency": "https://www.reutersagency.com/feed/?best-topics=health&post_type=best"
-    },
 }
 # Initialize cache
@@ -97,6 +74,9 @@ def fetch_rss_news(categories):
                         })
             except Exception as e:
                 logging.error(f"Failed to fetch from {url}: {e}")
     return articles
 def summarize_text(text):
@@ -116,7 +96,7 @@ def summarize_text(text):
         return "Summary unavailable."
 def summarize_articles(articles):
-    """Summarize all fetched articles."""
     summaries = []
     for article in articles:
         try:
@@ -213,3 +193,4 @@ if __name__ == "__main__":

 SUMMARIZER_MODEL = "facebook/bart-large-cnn"  # You can replace this with other summarization models
 CACHE_SIZE = 500  # Maximum number of cached summaries
 RSS_FETCH_INTERVAL = timedelta(hours=8)  # Fetch recent news within the last 8 hours
+ARTICLE_LIMIT = 5  # Limit to the last 5 articles
 # News sources
 NEWS_SOURCES = {
+    "Technology": {"NYTimes": "https://rss.nytimes.com/services/xml/rss/nyt/Technology.xml"},
+    "Business": {"Reuters": "https://www.reutersagency.com/feed/?best-topics=business-finance&post_type=best"},
+    "World": {"BBC": "http://feeds.bbci.co.uk/news/world/rss.xml"},
 }
 # Initialize cache
                         })
             except Exception as e:
                 logging.error(f"Failed to fetch from {url}: {e}")
+    # Sort articles by published date (most recent first) and limit to ARTICLE_LIMIT
+    articles = sorted(articles, key=lambda x: x["published"], reverse=True)[:ARTICLE_LIMIT]
     return articles
 def summarize_text(text):
         return "Summary unavailable."
 def summarize_articles(articles):
+    """Summarize the last 5 fetched articles."""
     summaries = []
     for article in articles:
         try: