# Article content: the <main> element of an <article> inside div#content.
body: //div[@id='content']//article/main
# Author: taken from the content attribute of <meta name="author">.
author: //meta[@name='author']/@content
# Date: taken from the datetime attribute of a <time> element.
date: //time/@datetime

# prevent wallabag from stripping sub-headings:
strip_attr: //h3/@class

# un-link the subheadings
find_string: