4
0

nebula.go 1.8 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364
  1. // SPDX-FileCopyrightText: Copyright The Miniflux Authors. All rights reserved.
  2. // SPDX-License-Identifier: Apache-2.0
  3. package processor // import "miniflux.app/v2/internal/reader/processor"
  4. import (
  5. "errors"
  6. "fmt"
  7. "log/slog"
  8. "net/url"
  9. "strconv"
  10. "github.com/PuerkitoBio/goquery"
  11. "miniflux.app/v2/internal/config"
  12. "miniflux.app/v2/internal/model"
  13. "miniflux.app/v2/internal/proxyrotator"
  14. "miniflux.app/v2/internal/reader/fetcher"
  15. )
  16. func shouldFetchNebulaWatchTime(entry *model.Entry) bool {
  17. if !config.Opts.FetchNebulaWatchTime() {
  18. return false
  19. }
  20. u, err := url.Parse(entry.URL)
  21. if err != nil {
  22. return false
  23. }
  24. return u.Hostname() == "nebula.tv"
  25. }
  26. func fetchNebulaWatchTime(websiteURL string) (int, error) {
  27. requestBuilder := fetcher.NewRequestBuilder()
  28. requestBuilder.WithTimeout(config.Opts.HTTPClientTimeout())
  29. requestBuilder.WithProxyRotator(proxyrotator.ProxyRotatorInstance)
  30. responseHandler := fetcher.NewResponseHandler(requestBuilder.ExecuteRequest(websiteURL))
  31. defer responseHandler.Close()
  32. if localizedError := responseHandler.LocalizedError(); localizedError != nil {
  33. slog.Warn("Unable to fetch Nebula watch time", slog.String("website_url", websiteURL), slog.Any("error", localizedError.Error()))
  34. return 0, localizedError.Error()
  35. }
  36. doc, docErr := goquery.NewDocumentFromReader(responseHandler.Body(config.Opts.HTTPClientMaxBodySize()))
  37. if docErr != nil {
  38. return 0, docErr
  39. }
  40. durs, exists := doc.FindMatcher(goquery.Single(`meta[property="video:duration"]`)).Attr("content")
  41. // durs contains video watch time in seconds
  42. if !exists {
  43. return 0, errors.New("duration has not found")
  44. }
  45. dur, err := strconv.ParseInt(durs, 10, 64)
  46. if err != nil {
  47. return 0, fmt.Errorf("unable to parse duration %s: %v", durs, err)
  48. }
  49. return int(dur / 60), nil
  50. }