devmalik7
diff --git a/‎Python/News Headline Scraper/README.md‎
Lines changed: 28 additions & 0 deletions b/‎Python/News Headline Scraper/README.md‎
Lines changed: 28 additions & 0 deletions
diff --git a/‎Python/News Headline Scraper/news_headline_scraper.py‎
Lines changed: 43 additions & 0 deletions b/‎Python/News Headline Scraper/news_headline_scraper.py‎
Lines changed: 43 additions & 0 deletions
@@ -0,0 +1,28 @@
+# News Headline Scraper (Python)
+
+A simple Python script that fetches news headlines from various news outlets using their public RSS feeds and saves them to a JSON file. No API keys are required.
+
+---
+
+## 🚀 Features
+- Saves headlines to JSON with timestamps.
+- Multiple trusted sources: BBC, Reuters, CNN, NYTimes, HackerNews
+- No API key needed (uses official RSS feeds)
+
+---
+## Usage
+
+```bash
+python3 news_headline_scraper.py
+```
+
+Output:
+
+```text
+Fetching: BBC
+Fetching: Reuters
+Fetching: CNN
+Fetching: NYTimes
+Fetching: HackerNews
+Headlines saved to the file
+```
+
+## 🧰 Requirements
+
+Install the dependencies using pip:
+```bash
+pip install feedparser
+```
@@ -0,0 +1,43 @@
+import json
+from datetime import datetime
+import feedparser
+import sys
+
+def fetch_headlines(feed):
+    """Download every RSS feed in *feed* and collect its headlines.
+
+    Args:
+        feed: Mapping of source name to RSS feed URL.
+
+    Returns:
+        Dict mapping each source name to a list of article dicts with the
+        keys "title", "link" and "published". A field that a feed entry
+        does not provide is stored as None instead of raising.
+    """
+    headlines = {}
+    for name, url in feed.items():
+        print(f"Fetching: {name}")
+        # Distinct local name so the `feed` argument is not shadowed.
+        parsed = feedparser.parse(url)
+        if parsed.get("bozo") and not parsed.entries:
+            # NOTE(review): relies on feedparser reporting unreachable or
+            # malformed feeds through its `bozo` flag rather than raising;
+            # surface that here so an empty source is not silent.
+            print(f"Warning: no entries could be read for {name}", file=sys.stderr)
+        headlines[name] = [
+            {
+                "title": entry.get("title"),
+                "link": entry.get("link"),
+                "published": entry.get("published"),
+            }
+            for entry in parsed.entries
+        ]
+    return headlines
+
+
+
+def save_to_json(data, filename="news_headlines.json"):
+    """Write the collected headlines to *filename* as pretty-printed JSON.
+
+    The file holds an object with two keys: "timestamp" (ISO 8601 time of
+    the save, including the local UTC offset) and "sources" (*data* as
+    given).
+
+    Args:
+        data: JSON-serializable headlines, stored under "sources".
+        filename: Path of the output file; it is overwritten if it exists.
+    """
+    # astimezone() attaches the local UTC offset so the stored timestamp is
+    # unambiguous when the file is read on another machine.
+    timestamp = datetime.now().astimezone().isoformat()
+    output = {"timestamp": timestamp, "sources": data}
+    with open(filename, "w", encoding="utf-8") as f:
+        # ensure_ascii=False keeps non-ASCII headline text readable in the file.
+        json.dump(output, f, indent=4, ensure_ascii=False)
+    print("Headlines saved to the file")
+
+if __name__ == "__main__":
+    # Outlets to scrape, keyed by display name; each value is that outlet's RSS URL.
+    rss_sources = {
+        "BBC": "https://feeds.bbci.co.uk/news/rss.xml",
+        "Reuters": "https://feeds.reuters.com/reuters/topNews",
+        "CNN": "http://rss.cnn.com/rss/edition.rss",
+        "NYTimes": "https://rss.nytimes.com/services/xml/rss/nyt/HomePage.xml",
+        "HackerNews": "https://hnrss.org/frontpage",
+    }
+
+    # Fetch every feed, then hand the collected headlines to the JSON writer.
+    save_to_json(fetch_headlines(rss_sources))