Created December 21, 2023 10:56
Generates an RSS feed from an existing `sitemap.xml`.
import xml.etree.ElementTree as ET
import PyRSS2Gen as rss
import datetime
# Build an RSS 2.0 feed (book/feed.xml) with one item per page listed in
# book/sitemap.xml.

# Input sitemap and output feed locations, relative to the working directory.
SITEMAP_PATH = "book/sitemap.xml"
FEED_PATH = "book/feed.xml"

# XML namespace of the standard sitemap protocol. An empty "{}" prefix only
# matches elements that have no namespace, so it is spelled out here.
SITEMAP_NS = {"sm": "http://www.sitemaps.org/schemas/sitemap/0.9"}

# Timestamp layout expected in <lastmod>, e.g. "2023-12-21T10:56:00.000Z".
LASTMOD_FORMAT = "%Y-%m-%dT%H:%M:%S.%fZ"


def page_url(loc):
    """Return the feed link for a sitemap ``<loc>`` value.

    A location ending in "/" has the slash replaced by ".html"; any other
    location is returned unchanged.
    """
    # NOTE(review): assumes ".html" is only appended when a trailing slash
    # was removed - confirm against the published page URLs.
    if loc.endswith("/"):
        return loc[:-1] + ".html"
    return loc


def parse_lastmod(lastmod):
    """Parse a ``<lastmod>`` string into a naive ``datetime``.

    Raises:
        ValueError: if ``lastmod`` does not match ``LASTMOD_FORMAT``.
    """
    return datetime.datetime.strptime(lastmod, LASTMOD_FORMAT)


def site_root(url):
    """Return ``scheme://host/`` for ``url``."""
    from urllib.parse import urlsplit

    parts = urlsplit(url)
    return f"{parts.scheme}://{parts.netloc}/"


def read_sitemap_entries(root):
    """Collect the pages described by a parsed sitemap.

    Args:
        root: the ``<urlset>`` element of the sitemap.

    Returns:
        A list of ``(url, lastmod_text, lastmod_datetime)`` tuples in
        document order. ``<url>`` elements that lack a ``<loc>`` or a
        ``<lastmod>`` are skipped instead of raising ``AttributeError``.

    Raises:
        ValueError: if a ``<lastmod>`` value does not match ``LASTMOD_FORMAT``.
    """
    entries = []
    for url in root.findall("sm:url", SITEMAP_NS):
        loc = (url.findtext("sm:loc", default="", namespaces=SITEMAP_NS) or "").strip()
        lastmod = (url.findtext("sm:lastmod", default="", namespaces=SITEMAP_NS) or "").strip()
        if not loc or not lastmod:
            continue
        entries.append((page_url(loc), lastmod, parse_lastmod(lastmod)))
    return entries


def main():
    """Read ``SITEMAP_PATH`` and write the RSS feed to ``FEED_PATH``."""
    # Parse the sitemap.xml and extract URLs and their metadata
    root = ET.parse(SITEMAP_PATH).getroot()
    entries = read_sitemap_entries(root)

    # Define the RSS feed basic info
    # NOTE(review): the feed link is derived from the first sitemap URL
    # because no explicit site URL is configured - replace with the real
    # site address if it differs.
    rss_feed = rss.RSS2(
        title="Data Engineering Design Patterns (DEDP)",
        link=site_root(entries[0][0]) if entries else "",
        description="Data Engineering Design Patterns Book: Mastering Convergent Evolution",
    )

    # Add one item per page to the RSS feed
    # NOTE(review): the page URL doubles as the item title - confirm.
    for url, lastmod, lastmod_date in entries:
        rss_feed.items.append(
            rss.RSSItem(
                title=url,
                link=url,
                description=f"Updated on {lastmod}",
                pubDate=lastmod_date,
            )
        )

    # Generate the RSS feed. The file encoding and the encoding declared in
    # the XML prolog are kept identical, and the file is always closed.
    with open(FEED_PATH, "w", encoding="utf-8") as feed_file:
        rss_feed.write_xml(feed_file, encoding="utf-8")


if __name__ == "__main__":
    main()
