2014-07-13 08:15:40 +00:00
|
|
|
# Title: the <h2> element whose `property` attribute equals 'dc:title'.
title: //h2[@property='dc:title']
|
|
|
|
#body: //div[@class='print-content']
|
|
|
|
# Body: the <div> with id 'wysiwyg'. A commented-out alternative in this file
# targets div[@class='print-content'] instead.
body: //div[@id='wysiwyg']
|
|
|
|
# Author (first of two author rules): any <a> whose href contains '/authors'.
# NOTE(review): presumably multiple author rules are tried in file order - confirm against the parser.
author: //a[contains(@href, '/authors')]
|
|
|
|
# Author (second of two author rules): the text before the first '|' in
# div[@class='print-created'].
# NOTE(review): the 'print-' class prefix suggests this matches the print layout only - confirm it still applies.
author: substring-before(//div[@class='print-created'], '|')
|
|
|
|
# Date (first of two date rules): the <span> with class 'article-date'.
date: //span[@class='article-date']
|
|
|
|
# Date (second of two date rules): the text after the first '|' in
# div[@class='print-created'] (the counterpart of the author rule that reads
# the text before the '|').
date: substring-after(//div[@class='print-created'], '|')
|
|
|
|
# NOTE(review): presumably turns off the extractor's automatic pruning of the
# matched body element - confirm against the site-config documentation.
prune: no
|
|
|
|
|
|
|
|
#single_page_link: //ul[contains(@class, 'article-actions-bar')]//a[contains(@href, '/print/article/')]
|
|
|
|
# Single-page link: an <a> inside the <ul> whose class contains
# 'article-actions-bar', with an href containing '?page=full'. A commented-out
# alternative in this file matched hrefs containing '/print/article/' instead.
single_page_link: //ul[contains(@class, 'article-actions-bar')]//a[contains(@href, '?page=full')]
|
|
|
|
|
2013-12-06 09:13:03 +00:00
|
|
|
# Sample article URL on thenation.com.
# NOTE(review): presumably used to exercise the rules in this file - confirm.
test_url: http://www.thenation.com/article/162331/hard-against-time-roy-fisher
|