wallabag/inc/3rdparty/site_config/standard/dr.dk.txt
2014-07-13 10:15:40 +02:00

9 lines
No EOL
364 B
Text
Executable file

title: //meta[@property='og:title']/@content
author: //div[@class='articleFunctions']//a
date: //meta[@name='pubdate']/@content
# Can you strip elements from the body only? It is required here (`//div[@class='articleContent']/p` breaks for some reason)
body: //div[@class='articleContent']
tidy: no
test_url: http://www.dr.dk/Nyheder/Udland/2011/10/24/150115.htm