wallabag/inc/3rdparty/site_config/standard/cbsnews.com.txt
2013-12-06 10:13:03 +01:00

14 lines
471 B
Plaintext

# Extraction rules for cbsnews.com article pages, one "directive: XPath" per line.
# NOTE(review): how the engine evaluates each directive (ordering, fallbacks)
# is not visible in this file - confirm against the site-config parser in use.
# Date candidates: the content attribute of the meta tag named "published",
# and the div whose class is exactly "timeLine".
# Presumably candidates are tried in the order listed - TODO confirm.
date: //meta[@name="published"]/@content
date: //div[@class="timeLine"]
# Title: any h1 that is a descendant of the div with id "contentBody".
title: //div[@id='contentBody']//h1
# Author: a elements directly under a dd of the dl with class "storyBlogByline".
author: //dl[@class="storyBlogByline"]/dd/a
# Body: XPath union of the div with id "storyMediaBox" and every div whose
# class attribute contains the substring "storyText".
body: //div[@id='storyMediaBox'] | //div[contains(@class, 'storyText')]
# Content Pruning
# Strip targets: the "scrollingArrows" div, plus the same "timeLine" div and
# "storyBlogByline" dl that the date/author rules above select from.
# NOTE(review): this relies on date/author being read before stripping is
# applied - verify against the extractor.
strip: //div[@class="scrollingArrows"]
strip: //div[@class="timeLine"]
strip: //dl[@class="storyBlogByline"]
# NOTE(review): presumably disables the extractor's automatic clean-up of the
# selected body, so only the strip rules above remove content - confirm.
prune: no
# Sample article URL; presumably used to check these rules against a real page.
test_url: http://www.cbsnews.com/8301-201_162-57366361/rescued-americans-dad-proud-of-the-u.s/