File: buzzfeed.com.txt

package info (click to toggle)
feedreader 2.10.0-1.1
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 11,580 kB
  • sloc: ansic: 11,948; xml: 879; php: 177; python: 35; sh: 32; makefile: 28
file content (27 lines) | stat: -rw-r--r-- 840 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
# Creator: Greg Leuch <greg@...>
#
# Site config for buzzfeed.com. The extraction rules below key off the
# data-print="..." attributes found in the site's markup.

# The markup can be messy, so the HTML Tidy pre-processing step is turned off.
tidy:no

# The basic template: title, author and date are each selected by their
# data-print attribute.
title: //h1[@data-print='title']
author: //a[@data-print='author']
date: //time[@data-print='date']

# Body candidates: the data-print="body" container (div or section), then an
# <article> whose class list contains the exact token "buzz".
body: //div[@data-print='body']
body: //section[@data-print='body']
body: //article[contains(concat(' ',normalize-space(@class),' '),' buzz ')]

# Rewrite the rel:bf_image_src attribute into a plain src attribute
# (presumably the real image URL of lazy-loaded images -- confirm against
# current markup).
find_string: rel:bf_image_src=
replace_string: src=
# Rename src attributes that hold inline data: URIs so they no longer act as
# the image source (presumably placeholders that would otherwise clash with
# the src attribute produced by the rule above).
find_string: src="data:
replace_string: disabled_src="data:

# Pages whose article:section meta tag is "Advertiser" are flagged as native ads.
native_ad_clue: //meta[@property="article:section" and @content="Advertiser"]

# Remove every element marked data-print="ignore".
# The expression is anchored with // so that it matches anywhere in the
# document; a bare relative "*[...]" would only be tested against the root
# element.
strip: //*[@data-print="ignore"]

# Test URLs.
# Regular article
test_url: http://www.buzzfeed.com/hgrant/35-reasons-why-dogs-hate-the-holidays
# Native ad
test_url: http://www.buzzfeed.com/bravo/ways-to-up-your-online-dating-game
# article DIV
test_url: https://www.buzzfeed.com/charliewarzel/the-terrifying-future-of-fake-news