Update scraping rules for ilpost.it

This commit is contained in:
Davide Masserut 2022-12-19 14:03:16 +01:00 committed by Frédéric Guillot
parent ef312ef770
commit 690d66ce0b
2 changed files with 2 additions and 1 deletion

View file

@@ -16,6 +16,7 @@ var predefinedRules = map[string]string{
 "exocomics.com": "add_image_title",
 "framatube.org": "nl2br,convert_text_link",
 "happletea.com": "add_image_title",
+"ilpost.it": `remove(".art_tag, #audioPlayerArticle, .author-container, .caption, .ilpostShare, .lastRecents, #mc_embed_signup, p:has(.leggi-anche)")`,
 "imogenquest.net": "add_image_title",
 "lukesurl.com": "add_image_title",
 "medium.com": "fix_medium_images",

View file

@@ -19,7 +19,7 @@ var predefinedRules = map[string]string{
 "heise.de": "header .article-content__lead, header .article-image, div.article-layout__content.article-content",
 "igen.fr": "section.corps",
 "ikiwiki.iki.fi": ".page.group",
-"ilpost.it": "#singleBody > :not(#audioPlayerArticle, .ilpostShare, p:has(.leggi-anche))",
+"ilpost.it": ".entry-content",
 "ing.dk": "section.body",
 "lapresse.ca": ".amorce, .entry",
 "lemonde.fr": "article",