from scrapy.spiders import SitemapSpider


class SitemapSeedSpider(SitemapSpider):
    """Seed a crawl of shop.example product pages from the site's sitemap.

    Starts at the root sitemap, follows only the nested product sitemap,
    and hands every URL containing ``/products/`` to :meth:`parse_product`.
    """

    name = "sitemap_seed"
    allowed_domains = ["shop.example"]

    # Entry-point sitemap(s) to download first.
    sitemap_urls = [
        "https://shop.example/sitemap.xml",
    ]

    # Regexes selecting which nested sitemaps to follow.
    # In a raw string a single backslash is what escapes the dot; the previous
    # ``\\.`` meant "literal backslash + any character" and therefore never
    # matched a real URL such as ``.../products.xml``.
    sitemap_follow = [
        r"/products\.xml$",
    ]

    # (URL regex, callback name) pairs: URLs matching the regex are routed to
    # the named method on this spider.
    sitemap_rules = [
        (r"/products/", "parse_product"),
    ]

    def parse_product(self, response):
        """Yield one item holding the text of the page's first ``<h1>``.

        Args:
            response: The downloaded product page.

        Yields:
            dict: ``{"name": <h1 text>}``. The value is whatever
            ``.get()`` returns for the ``h1::text`` selector
            (presumably ``None`` when the page has no ``<h1>`` text —
            confirm against the Scrapy selector docs).
        """
        name = response.css("h1::text").get()
        yield {"name": name}