# Full-text extraction rules for diepresse.com articles.
#
# complete feed:
# https://www.diepresse.com/rss
# or add a category, e.g.:
# https://www.diepresse.com/rss/kultur/kunst

# Article metadata.
title: //div[@class='article']/h1
# The date is the part of the 'articletime' paragraph before the '|' separator.
date: substring-before(//p[@class='articletime'],'|')
author: //div[@class='author']/descendant::a

# Article content: union of the three container variants listed here.
body: //article | //div[@id='articletext'] | //div[@id='article-body']

# Remove elements that repeat the date, authors and title inside the body,
# plus 'fm-relation' blocks.
strip: //div[@class='meta__date']
strip: //div[@class='meta__authors']
strip: //h1[@class='article__title']
strip: //div[contains(@class, 'fm-relation')]

strip_id_or_class: skyline
strip_id_or_class: article__actions
strip_id_or_class: article__byline

# strip generic text images when there is no article photo/image
# (the matched URL prefix is replaced with an empty string)
find_string: https://www.diepresse.com/assets_v2/images/
replace_string:

# 'data-src' sometimes prevents images from loading, replaced with 'src'
find_string: class="figure__image lazyload" data-src=
replace_string: class="figure__image lazyload" src=

# NOTE(review): this find_string has no value and no matching replace_string
# in the visible text - confirm whether the entry is truncated or can be removed.
find_string: