about | summary | refs | log | tree | commit | diff | homepage
path: root/reader/scraper/rules.go
diff options
context:
space:
mode:
author: Frédéric Guillot <fred@miniflux.net>, 2017-12-13 21:30:40 -0800
committer: Frédéric Guillot <fred@miniflux.net>, 2017-12-13 21:30:40 -0800
commit: c6d9eb361454b70406cf6573b284d5e99ba3a2d2 (patch)
tree: b53ce39814d225a8f8f02e2036a314ff1d7a1059 /reader/scraper/rules.go
parent: 827683ab59131ec38ed7cfa268bcaa6dc77d1412 (diff)
Improve content scraper
Diffstat (limited to 'reader/scraper/rules.go')
-rw-r--r-- reader/scraper/rules.go 6
1 file changed, 6 insertions, 0 deletions
diff --git a/reader/scraper/rules.go b/reader/scraper/rules.go
index ae6c4a5..9dc1405 100644
--- a/reader/scraper/rules.go
+++ b/reader/scraper/rules.go
@@ -7,10 +7,16 @@ package scraper
// List of predefined scraper rules (alphabetically sorted)
// domain => CSS selectors
var predefinedRules = map[string]string{
+ "github.com": "article.entry-content",
+ "igen.fr": "section.corps",
"lemonde.fr": "div#articleBody",
"lesjoiesducode.fr": ".blog-post-content img",
"linux.com": "div.content, div[property]",
+ "medium.com": ".section-content",
"opensource.com": "div[property]",
+ "osnews.com": "div.newscontent1",
"phoronix.com": "div.content",
"techcrunch.com": "div.article-entry",
+ "theregister.co.uk": "#body",
+ "wired.com": "main figure, article",
}