# Content-extraction rules for arxiv-vanity.com paper pages.
# One directive per line; every value below is an XPath 1.0 expression
# unless noted otherwise.

# Primary article body: the <div> whose class list contains the exact
# token "ltx_page_content". The concat/normalize-space idiom pads the class
# attribute with spaces so only a whole class name matches, not a substring
# of a longer one.
body: //div[contains(concat(' ',normalize-space(@class),' '),' ltx_page_content ')]

# Second body rule: any <article> element.
# NOTE(review): presumably used as a fallback when the rule above matches
# nothing - confirm against the consuming parser's handling of repeated
# body directives.
body: //article

# Page title: the <h1> carrying the exact class token "ltx_title".
title: //h1[contains(concat(' ',normalize-space(@class),' '),' ltx_title ')]

# Pruning is switched off for this site (plain yes/no flag, not an XPath).
prune: no

# Sample page for checking these rules.
test_url: https://www.arxiv-vanity.com/papers/2303.13881/