rules.go 3.4 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788
  1. // SPDX-FileCopyrightText: Copyright The Miniflux Authors. All rights reserved.
  2. // SPDX-License-Identifier: Apache-2.0
  3. package rewrite // import "miniflux.app/v2/internal/reader/rewrite"
  4. import "regexp"
  // predefinedRules associates a domain with the rewrite rules configured for it.
  //
  // Keys are domain names and are kept in alphabetical order. Each value is a
  // comma-separated list of rule names; some rules carry quoted arguments in
  // parentheses, e.g. remove("<selector>") or replace("<pattern>"|"<replacement>").
  // NOTE(review): how these strings are parsed and applied is decided by code
  // outside this declaration.
  var predefinedRules = map[string]string{
  	"abstrusegoose.com":      "add_image_title",
  	"amazingsuperpowers.com": "add_image_title",
  	"blog.cloudflare.com":    `add_image_title,remove("figure.kg-image-card figure.kg-image + img")`,
  	"cowbirdsinlove.com":     "add_image_title",
  	"drawingboardcomic.com":  "add_image_title",
  	"exocomics.com":          "add_image_title",
  	"framatube.org":          "nl2br,convert_text_link",
  	"happletea.com":          "add_image_title",
  	"ilpost.it":              `remove(".art_tag, #audioPlayerArticle, .author-container, .caption, .ilpostShare, .lastRecents, #mc_embed_signup, .outbrain_inread, p:has(.leggi-anche), .youtube-overlay")`,
  	"imogenquest.net":        "add_image_title",
  	"lukesurl.com":           "add_image_title",
  	"medium.com":             "fix_medium_images",
  	"mercworks.net":          "add_image_title",
  	"monkeyuser.com":         "add_image_title",
  	"mrlovenstein.com":       "add_image_title",
  	"nedroid.com":            "add_image_title",
  	"oglaf.com":              `replace("media.oglaf.com/story/tt(.+).gif"|"media.oglaf.com/comic/$1.jpg"),add_image_title`,
  	"optipess.com":           "add_image_title",
  	"peebleslab.com":         "add_image_title",
  	"quantamagazine.org":     `add_youtube_video_from_id, remove("h6:not(.byline,.post__title__kicker), #comments, .next-post__content, .footer__section, figure .outer--content, script")`,
  	"sentfromthemoon.com":    "add_image_title",
  	"thedoghousediaries.com": "add_image_title",
  	"theverge.com":           `add_dynamic_image, remove("div.duet--recirculation--related-list, .hidden")`,
  	"treelobsters.com":       "add_image_title",
  	"webtoons.com":           `add_dynamic_image,replace("webtoon"|"swebtoon")`,
  	"www.qwantz.com":         "add_image_title,add_mailto_subject",
  	"www.recalbox.com":       "parse_markdown",
  	"xkcd.com":               "add_image_title",
  	"youtube.com":            "add_youtube_video",
  }
  // RefererRule pairs a URL pattern with a referer value.
  type RefererRule struct {
  	// URLPattern is the compiled regular expression that URLs are matched against.
  	URLPattern *regexp.Regexp

  	// Referer is the referer value associated with URLs matching URLPattern.
  	Referer string
  }
  43. // List of predefined referer rules
  44. var PredefinedRefererRules = []RefererRule{
  45. {
  46. URLPattern: regexp.MustCompile(`^https://\w+\.sinaimg\.cn`),
  47. Referer: "https://weibo.com",
  48. },
  49. {
  50. URLPattern: regexp.MustCompile(`^https://i\.pximg\.net`),
  51. Referer: "https://www.pixiv.net",
  52. },
  53. {
  54. URLPattern: regexp.MustCompile(`^https://cdnfile\.sspai\.com`),
  55. Referer: "https://sspai.com",
  56. },
  57. {
  58. URLPattern: regexp.MustCompile(`^https://(?:\w|-)+\.cdninstagram\.com`),
  59. Referer: "https://www.instagram.com",
  60. },
  61. {
  62. URLPattern: regexp.MustCompile(`^https://sp1\.piokok\.com`),
  63. Referer: "https://sp1.piokok.com",
  64. },
  65. {
  66. URLPattern: regexp.MustCompile(`^https://f\.video\.weibocdn\.com`),
  67. Referer: "https://weibo.com",
  68. },
  69. {
  70. URLPattern: regexp.MustCompile(`^https://img\.hellogithub\.com`),
  71. Referer: "https://hellogithub.com",
  72. },
  73. }
  74. // GetRefererForURL returns the referer for the given URL if it exists, otherwise an empty string.
  75. func GetRefererForURL(url string) string {
  76. for _, rule := range PredefinedRefererRules {
  77. if rule.URLPattern.MatchString(url) {
  78. return rule.Referer
  79. }
  80. }
  81. return ""
  82. }