wallabag/inc/3rdparty/site_config/standard/cbsnews.com.txt
2014-07-13 10:15:40 +02:00

16 lines
496 B
Plaintext
Executable File

# Site config for cbsnews.com: XPath rules locating the date, title, author and
# body of an article page, plus elements to remove from the extracted content.
# NOTE(review): directive semantics noted below follow the Full-Text RSS
# site-config conventions; confirm against the parser bundled with this project.
# Date candidates: the "published" meta tag's content attribute, and the
# visible "timeLine" div. Presumably tried in the order listed; verify.
date: //meta[@name="published"]/@content
date: //div[@class="timeLine"]
# Title: any h1 nested inside the element with id 'contentBody'.
title: //div[@id='contentBody']//h1
# Author: link(s) inside the dd of the "storyBlogByline" definition list.
author: //dl[@class="storyBlogByline"]/dd/a
# Body: union of the 'storyMediaBox' div and every div whose class attribute
# contains 'storyText'.
body: //div[@id='storyMediaBox'] | //div[contains(@class, 'storyText')]
# Content Pruning
# Elements matched by the strip rules are removed from the output. Note that
# the "timeLine" and "storyBlogByline" nodes are the same ones the date/author
# rules above read from, so they are dropped from the body rather than repeated.
strip: //div[@class="scrollingArrows"]
strip: //div[@class="timeLine"]
strip: //dl[@class="storyBlogByline"]
strip: //span[@class='image-credit']
# Presumably disables the extractor's automatic pruning of the matched body,
# leaving only the explicit strip rules above in effect; TODO confirm.
prune: no
# Sample article URL for checking these rules against a real page.
test_url: http://www.cbsnews.com/8301-201_162-57366361/rescued-americans-dad-proud-of-the-u.s/