aboutsummaryrefslogtreecommitdiffhomepage
path: root/reader/scraper/rules.go
blob: d37b08b3ac788a99b0897beca5862dfdcf4ae0b9 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
// Copyright 2017 Frédéric Guillot. All rights reserved.
// Use of this source code is governed by the Apache 2.0
// license that can be found in the LICENSE file.

package scraper

// predefinedRules is the built-in table of scraper rules.
//
// Each key is a website domain and each value is the CSS selector string
// associated with that domain. A value may group several selectors with
// commas (for example ".amorce, .entry"), following normal CSS selector-list
// syntax.
//
// Keep the entries sorted alphabetically by domain when adding new ones.
//
// NOTE(review): how a page's host is matched against these keys (exact match
// vs. suffix/subdomain match) is decided by the lookup code, which is not
// visible here; confirm before adding subdomain-specific entries.
var predefinedRules = map[string]string{
	"cbc.ca":            ".story-content",
	"github.com":        "article.entry-content",
	"igen.fr":           "section.corps",
	"lapresse.ca":       ".amorce, .entry",
	"lemonde.fr":        "div#articleBody",
	"lesjoiesducode.fr": ".blog-post-content img",
	"linux.com":         "div.content, div[property]",
	"medium.com":        ".section-content",
	"opensource.com":    "div[property]",
	"osnews.com":        "div.newscontent1",
	"phoronix.com":      "div.content",
	"techcrunch.com":    "div.article-entry",
	"theregister.co.uk": "#body",
	"wired.com":         "main figure, article",
}