# Site extraction rules: one "directive: XPath" pair per line.
# Comments must sit on their own lines; a directive placed after a "#"
# on the same line is not read as a separate directive.

# Article title
title: //h1

# We can have multiple authors
author: //a[@class='auteur']

# Last modification date (if any)
# NOTE(review): "date" is declared twice on purpose; presumably the
# consumer tries the rules in order - confirm before merging them.
date: //time[@itemprop='dateModified']/@datetime

# Publication date
date: //time[@itemprop='datePublished']/@datetime

# Article body
body: //div[@id='articleBody']

# Remove the insane "conjugaison.lemonde.fr" links:
# NOTE(review): the value of find_string (and any matching replacement
# directive) is not visible in this chunk - confirm it was not lost.
find_string: