atom.go 3.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191
  // Copyright 2017 Frédéric Guillot. All rights reserved.
  // Use of this source code is governed by the Apache 2.0
  // license that can be found in the LICENSE file.
  4. package atom
  5. import (
  6. "encoding/xml"
  7. "log"
  8. "strconv"
  9. "strings"
  10. "time"
  11. "github.com/miniflux/miniflux/helper"
  12. "github.com/miniflux/miniflux/model"
  13. "github.com/miniflux/miniflux/reader/date"
  14. )
  15. type atomFeed struct {
  16. XMLName xml.Name `xml:"http://www.w3.org/2005/Atom feed"`
  17. ID string `xml:"id"`
  18. Title string `xml:"title"`
  19. Author atomAuthor `xml:"author"`
  20. Links []atomLink `xml:"link"`
  21. Entries []atomEntry `xml:"entry"`
  22. }
  23. type atomEntry struct {
  24. ID string `xml:"id"`
  25. Title string `xml:"title"`
  26. Updated string `xml:"updated"`
  27. Links []atomLink `xml:"link"`
  28. Summary string `xml:"summary"`
  29. Content atomContent `xml:"content"`
  30. MediaGroup atomMediaGroup `xml:"http://search.yahoo.com/mrss/ group"`
  31. Author atomAuthor `xml:"author"`
  32. }
  // atomAuthor is the decoding target for an <author> element.
  // Only the <name> and <email> children are captured.
  type atomAuthor struct {
  	Name  string `xml:"name"`
  	Email string `xml:"email"`
  }
  // atomLink is the decoding target for a <link> element. All four fields are
  // read from XML attributes and kept as raw strings.
  type atomLink struct {
  	URL    string `xml:"href,attr"`   // link target
  	Type   string `xml:"type,attr"`   // media type of the target
  	Rel    string `xml:"rel,attr"`    // relation, e.g. "alternate", "self", "enclosure"
  	Length string `xml:"length,attr"` // converted to an integer by getEnclosures
  }
  // atomContent is the decoding target for a <content> element. The body is
  // captured twice so that the caller can pick the representation matching
  // the declared type.
  type atomContent struct {
  	// Type is the value of the type attribute.
  	Type string `xml:"type,attr"`

  	// Data holds the character data found directly inside the element.
  	Data string `xml:",chardata"`

  	// XML holds the raw, unparsed markup found inside the element.
  	XML string `xml:",innerxml"`
  }
  // atomMediaGroup is the decoding target for a <group> element in the
  // http://search.yahoo.com/mrss/ namespace. Only its <description> child
  // (same namespace) is captured.
  type atomMediaGroup struct {
  	Description string `xml:"http://search.yahoo.com/mrss/ description"`
  }
  51. func (a *atomFeed) Transform() *model.Feed {
  52. feed := new(model.Feed)
  53. feed.FeedURL = getRelationURL(a.Links, "self")
  54. feed.SiteURL = getURL(a.Links)
  55. feed.Title = strings.TrimSpace(a.Title)
  56. if feed.Title == "" {
  57. feed.Title = feed.SiteURL
  58. }
  59. for _, entry := range a.Entries {
  60. item := entry.Transform()
  61. if item.Author == "" {
  62. item.Author = getAuthor(a.Author)
  63. }
  64. feed.Entries = append(feed.Entries, item)
  65. }
  66. return feed
  67. }
  68. func (a *atomEntry) Transform() *model.Entry {
  69. entry := new(model.Entry)
  70. entry.URL = getURL(a.Links)
  71. entry.Date = getDate(a)
  72. entry.Author = getAuthor(a.Author)
  73. entry.Hash = getHash(a)
  74. entry.Content = getContent(a)
  75. entry.Title = strings.TrimSpace(a.Title)
  76. entry.Enclosures = getEnclosures(a)
  77. if entry.Title == "" {
  78. entry.Title = entry.URL
  79. }
  80. return entry
  81. }
  82. func getURL(links []atomLink) string {
  83. for _, link := range links {
  84. if strings.ToLower(link.Rel) == "alternate" {
  85. return strings.TrimSpace(link.URL)
  86. }
  87. if link.Rel == "" && link.Type == "" {
  88. return strings.TrimSpace(link.URL)
  89. }
  90. }
  91. return ""
  92. }
  93. func getRelationURL(links []atomLink, relation string) string {
  94. for _, link := range links {
  95. if strings.ToLower(link.Rel) == relation {
  96. return strings.TrimSpace(link.URL)
  97. }
  98. }
  99. return ""
  100. }
  101. func getDate(a *atomEntry) time.Time {
  102. if a.Updated != "" {
  103. result, err := date.Parse(a.Updated)
  104. if err != nil {
  105. log.Println(err)
  106. return time.Now()
  107. }
  108. return result
  109. }
  110. return time.Now()
  111. }
  112. func getContent(a *atomEntry) string {
  113. if a.Content.Type == "html" || a.Content.Type == "text" {
  114. return a.Content.Data
  115. }
  116. if a.Content.Type == "xhtml" {
  117. return a.Content.XML
  118. }
  119. if a.Summary != "" {
  120. return a.Summary
  121. }
  122. if a.MediaGroup.Description != "" {
  123. return a.MediaGroup.Description
  124. }
  125. return ""
  126. }
  127. func getHash(a *atomEntry) string {
  128. for _, value := range []string{a.ID, getURL(a.Links)} {
  129. if value != "" {
  130. return helper.Hash(value)
  131. }
  132. }
  133. return ""
  134. }
  135. func getEnclosures(a *atomEntry) model.EnclosureList {
  136. enclosures := make(model.EnclosureList, 0)
  137. for _, link := range a.Links {
  138. if strings.ToLower(link.Rel) == "enclosure" {
  139. length, _ := strconv.Atoi(link.Length)
  140. enclosures = append(enclosures, &model.Enclosure{URL: link.URL, MimeType: link.Type, Size: length})
  141. }
  142. }
  143. return enclosures
  144. }
  145. func getAuthor(author atomAuthor) string {
  146. if author.Name != "" {
  147. return strings.TrimSpace(author.Name)
  148. }
  149. if author.Email != "" {
  150. return strings.TrimSpace(author.Email)
  151. }
  152. return ""
  153. }