| 12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697 |
- // Copyright 2017 Frédéric Guillot. All rights reserved.
- // Use of this source code is governed by the Apache 2.0
- // license that can be found in the LICENSE file.
- package subscription
- import (
- "bytes"
- "fmt"
- "io"
- "time"
- "github.com/miniflux/miniflux/errors"
- "github.com/miniflux/miniflux/http"
- "github.com/miniflux/miniflux/logger"
- "github.com/miniflux/miniflux/reader/feed"
- "github.com/miniflux/miniflux/timer"
- "github.com/miniflux/miniflux/url"
- "github.com/PuerkitoBio/goquery"
- )
- var (
- errConnectionFailure = "Unable to open this link: %v"
- errUnreadableDoc = "Unable to analyze this page: %v"
- )
- // FindSubscriptions downloads and try to find one or more subscriptions from an URL.
- func FindSubscriptions(websiteURL string) (Subscriptions, error) {
- defer timer.ExecutionTime(time.Now(), fmt.Sprintf("[FindSubscriptions] url=%s", websiteURL))
- client := http.NewClient(websiteURL)
- response, err := client.Get()
- if err != nil {
- return nil, errors.NewLocalizedError(errConnectionFailure, err)
- }
- var buffer bytes.Buffer
- io.Copy(&buffer, response.Body)
- reader := bytes.NewReader(buffer.Bytes())
- if format := feed.DetectFeedFormat(reader); format != feed.FormatUnknown {
- var subscriptions Subscriptions
- subscriptions = append(subscriptions, &Subscription{
- Title: response.EffectiveURL,
- URL: response.EffectiveURL,
- Type: format,
- })
- return subscriptions, nil
- }
- reader.Seek(0, io.SeekStart)
- return parseDocument(response.EffectiveURL, bytes.NewReader(buffer.Bytes()))
- }
- func parseDocument(websiteURL string, data io.Reader) (Subscriptions, error) {
- var subscriptions Subscriptions
- queries := map[string]string{
- "link[type='application/rss+xml']": "rss",
- "link[type='application/atom+xml']": "atom",
- "link[type='application/json']": "json",
- }
- doc, err := goquery.NewDocumentFromReader(data)
- if err != nil {
- return nil, errors.NewLocalizedError(errUnreadableDoc, err)
- }
- for query, kind := range queries {
- doc.Find(query).Each(func(i int, s *goquery.Selection) {
- subscription := new(Subscription)
- subscription.Type = kind
- if title, exists := s.Attr("title"); exists {
- subscription.Title = title
- } else {
- subscription.Title = "Feed"
- }
- if feedURL, exists := s.Attr("href"); exists {
- subscription.URL, _ = url.AbsoluteURL(websiteURL, feedURL)
- }
- if subscription.Title == "" {
- subscription.Title = subscription.URL
- }
- if subscription.URL != "" {
- logger.Debug("[FindSubscriptions] %s", subscription)
- subscriptions = append(subscriptions, subscription)
- }
- })
- }
- return subscriptions, nil
- }
|