Browse Source

Update scraping rules for ilpost.it

Davide Masserut 3 years ago
parent
commit
690d66ce0b
2 changed files with 2 additions and 1 deletion
  1. 1 0
      reader/rewrite/rules.go
  2. 1 1
      reader/scraper/rules.go

+ 1 - 0
reader/rewrite/rules.go

@@ -16,6 +16,7 @@ var predefinedRules = map[string]string{
 	"exocomics.com":          "add_image_title",
 	"framatube.org":          "nl2br,convert_text_link",
 	"happletea.com":          "add_image_title",
+	"ilpost.it":              `remove(".art_tag, #audioPlayerArticle, .author-container, .caption, .ilpostShare, .lastRecents, #mc_embed_signup, p:has(.leggi-anche)")`,
 	"imogenquest.net":        "add_image_title",
 	"lukesurl.com":           "add_image_title",
 	"medium.com":             "fix_medium_images",

+ 1 - 1
reader/scraper/rules.go

@@ -19,7 +19,7 @@ var predefinedRules = map[string]string{
 	"heise.de":             "header .article-content__lead, header .article-image, div.article-layout__content.article-content",
 	"igen.fr":              "section.corps",
 	"ikiwiki.iki.fi":       ".page.group",
-	"ilpost.it":            "#singleBody > :not(#audioPlayerArticle, .ilpostShare, p:has(.leggi-anche))",
+	"ilpost.it":            ".entry-content",
 	"ing.dk":               "section.body",
 	"lapresse.ca":          ".amorce, .entry",
 	"lemonde.fr":           "article",