from scrapy.spiders import XMLFeedSpider


class RssFeedSpider(XMLFeedSpider):
    """Feed spider that turns each ``<item>`` element into a plain dict.

    The spider starts from the single URL in ``start_urls`` and hands every
    node matching ``itertag`` to :meth:`parse_node`.
    """

    name = "rss_feed"
    start_urls = ["https://updates.example.net/rss.xml"]

    # Node iteration settings: iterator type and the tag name to iterate over.
    iterator = "iternodes"
    itertag = "item"

    # (prefix, uri) pairs; the "content" prefix is the one used by the
    # "content:encoded" query in parse_node.
    namespaces = [("content", "http://purl.org/rss/1.0/modules/content/")]

    def parse_node(self, response, node):
        """Yield one dict describing the given feed node.

        Args:
            response: The response the node came from (not used here).
            node: Selector for a single ``itertag`` element; each field is
                read from it with a relative XPath query.

        Yields:
            A dict with the keys ``title``, ``link``, ``pubDate`` and
            ``body_html``, each holding the ``.get()`` result of its query.
        """
        # Output key paired with the relative XPath that feeds it; the order
        # here is the key order of the yielded dict.
        field_queries = (
            ("title", "title/text()"),
            ("link", "link/text()"),
            ("pubDate", "pubDate/text()"),
            ("body_html", "content:encoded/text()"),
        )
        yield {key: node.xpath(query).get() for key, query in field_queries}