rules.go 3.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081
  1. // SPDX-FileCopyrightText: Copyright The Miniflux Authors. All rights reserved.
  2. // SPDX-License-Identifier: Apache-2.0
  3. package rewrite // import "miniflux.app/v2/internal/reader/rewrite"
  4. import "regexp"
  5. // List of predefined rewrite rules (alphabetically sorted)
  6. // Available rules: "add_image_title", "add_youtube_video"
  7. // domain => rule name
  8. var predefinedRules = map[string]string{
  9. "abstrusegoose.com": "add_image_title",
  10. "amazingsuperpowers.com": "add_image_title",
  11. "blog.cloudflare.com": `add_image_title,remove("figure.kg-image-card figure.kg-image + img")`,
  12. "blog.laravel.com": "parse_markdown",
  13. "cowbirdsinlove.com": "add_image_title",
  14. "drawingboardcomic.com": "add_image_title",
  15. "exocomics.com": "add_image_title",
  16. "framatube.org": "nl2br,convert_text_link",
  17. "happletea.com": "add_image_title",
  18. "ilpost.it": `remove(".art_tag, #audioPlayerArticle, .author-container, .caption, .ilpostShare, .lastRecents, #mc_embed_signup, .outbrain_inread, p:has(.leggi-anche), .youtube-overlay")`,
  19. "imogenquest.net": "add_image_title",
  20. "lukesurl.com": "add_image_title",
  21. "medium.com": "fix_medium_images",
  22. "mercworks.net": "add_image_title",
  23. "monkeyuser.com": "add_image_title",
  24. "mrlovenstein.com": "add_image_title",
  25. "nedroid.com": "add_image_title",
  26. "oglaf.com": `replace("media.oglaf.com/story/tt(.+).gif"|"media.oglaf.com/comic/$1.jpg"),add_image_title`,
  27. "optipess.com": "add_image_title",
  28. "peebleslab.com": "add_image_title",
  29. "quantamagazine.org": `add_youtube_video_from_id, remove("h6:not(.byline,.post__title__kicker), #comments, .next-post__content, .footer__section, figure .outer--content, script")`,
  30. "sentfromthemoon.com": "add_image_title",
  31. "thedoghousediaries.com": "add_image_title",
  32. "theverge.com": `add_dynamic_image, remove("div.duet--recirculation--related-list, .hidden")`,
  33. "treelobsters.com": "add_image_title",
  34. "webtoons.com": `add_dynamic_image,replace("webtoon"|"swebtoon")`,
  35. "www.qwantz.com": "add_image_title,add_mailto_subject",
  36. "www.recalbox.com": "parse_markdown",
  37. "xkcd.com": "add_image_title",
  38. "youtube.com": "add_youtube_video",
  39. }
  40. type RefererRule struct {
  41. URLPattern *regexp.Regexp
  42. Referer string
  43. }
  44. // List of predefined referer rules
  45. var PredefinedRefererRules = []RefererRule{
  46. {
  47. URLPattern: regexp.MustCompile(`^https://\w+\.sinaimg\.cn`),
  48. Referer: "https://weibo.com",
  49. },
  50. {
  51. URLPattern: regexp.MustCompile(`^https://i\.pximg\.net`),
  52. Referer: "https://www.pixiv.net",
  53. },
  54. {
  55. URLPattern: regexp.MustCompile(`^https://cdnfile\.sspai\.com`),
  56. Referer: "https://sspai.com",
  57. },
  58. {
  59. URLPattern: regexp.MustCompile(`^https://(?:\w|-)+\.cdninstagram\.com`),
  60. Referer: "https://www.instagram.com",
  61. },
  62. {
  63. URLPattern: regexp.MustCompile(`^https://sp1\.piokok\.com`),
  64. Referer: "https://sp1.piokok.com",
  65. },
  66. }
  67. // GetRefererForURL returns the referer for the given URL if it exists, otherwise an empty string.
  68. func GetRefererForURL(url string) string {
  69. for _, rule := range PredefinedRefererRules {
  70. if rule.URLPattern.MatchString(url) {
  71. return rule.Referer
  72. }
  73. }
  74. return ""
  75. }