parser_test.go 47 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623
  1. // SPDX-FileCopyrightText: Copyright The Miniflux Authors. All rights reserved.
  2. // SPDX-License-Identifier: Apache-2.0
  3. package rss // import "miniflux.app/v2/internal/reader/rss"
  4. import (
  5. "bytes"
  6. "testing"
  7. "time"
  8. )
  9. func TestParseRss2Sample(t *testing.T) {
  10. data := `
  11. <?xml version="1.0"?>
  12. <rss version="2.0">
  13. <channel>
  14. <title>Liftoff News</title>
  15. <link>http://liftoff.msfc.nasa.gov/</link>
  16. <description>Liftoff to Space Exploration.</description>
  17. <image>
  18. <url>http://liftoff.msfc.nasa.gov/HomePageXtra/MeatBall.gif</url>
  19. <title>NASA</title>
  20. <link>http://liftoff.msfc.nasa.gov/</link>
  21. </image>
  22. <language>en-us</language>
  23. <pubDate>Tue, 10 Jun 2003 04:00:00 GMT</pubDate>
  24. <lastBuildDate>Tue, 10 Jun 2003 09:41:01 GMT</lastBuildDate>
  25. <docs>http://blogs.law.harvard.edu/tech/rss</docs>
  26. <generator>Weblog Editor 2.0</generator>
  27. <managingEditor>editor@example.com</managingEditor>
  28. <webMaster>webmaster@example.com</webMaster>
  29. <item>
  30. <title>Star City</title>
  31. <link>http://liftoff.msfc.nasa.gov/news/2003/news-starcity.asp</link>
  32. <description>How do Americans get ready to work with Russians aboard the International Space Station? They take a crash course in culture, language and protocol at Russia's &lt;a href="http://howe.iki.rssi.ru/GCTC/gctc_e.htm"&gt;Star City&lt;/a&gt;.</description>
  33. <pubDate>Tue, 03 Jun 2003 09:39:21 GMT</pubDate>
  34. <guid>http://liftoff.msfc.nasa.gov/2003/06/03.html#item573</guid>
  35. </item>
  36. <item>
  37. <description>Sky watchers in Europe, Asia, and parts of Alaska and Canada will experience a &lt;a href="http://science.nasa.gov/headlines/y2003/30may_solareclipse.htm"&gt;partial eclipse of the Sun&lt;/a&gt; on Saturday, May 31st.</description>
  38. <pubDate>Fri, 30 May 2003 11:06:42 GMT</pubDate>
  39. <guid>http://liftoff.msfc.nasa.gov/2003/05/30.html#item572</guid>
  40. </item>
  41. <item>
  42. <title>The Engine That Does More</title>
  43. <link>http://liftoff.msfc.nasa.gov/news/2003/news-VASIMR.asp</link>
  44. <description>Before man travels to Mars, NASA hopes to design new engines that will let us fly through the Solar System more quickly. The proposed VASIMR engine would do that.</description>
  45. <pubDate>Tue, 27 May 2003 08:37:32 GMT</pubDate>
  46. <guid>http://liftoff.msfc.nasa.gov/2003/05/27.html#item571</guid>
  47. </item>
  48. <item>
  49. <title>Astronauts' Dirty Laundry</title>
  50. <link>http://liftoff.msfc.nasa.gov/news/2003/news-laundry.asp</link>
  51. <description>Compared to earlier spacecraft, the International Space Station has many luxuries, but laundry facilities are not one of them. Instead, astronauts have other options.</description>
  52. <pubDate>Tue, 20 May 2003 08:56:02 GMT</pubDate>
  53. <guid>http://liftoff.msfc.nasa.gov/2003/05/20.html#item570</guid>
  54. </item>
  55. </channel>
  56. </rss>`
  57. feed, err := Parse("http://liftoff.msfc.nasa.gov/rss.xml", bytes.NewReader([]byte(data)))
  58. if err != nil {
  59. t.Fatal(err)
  60. }
  61. if feed.Title != "Liftoff News" {
  62. t.Errorf("Incorrect title, got: %s", feed.Title)
  63. }
  64. if feed.FeedURL != "http://liftoff.msfc.nasa.gov/rss.xml" {
  65. t.Errorf("Incorrect feed URL, got: %s", feed.FeedURL)
  66. }
  67. if feed.SiteURL != "http://liftoff.msfc.nasa.gov/" {
  68. t.Errorf("Incorrect site URL, got: %s", feed.SiteURL)
  69. }
  70. if feed.IconURL != "http://liftoff.msfc.nasa.gov/HomePageXtra/MeatBall.gif" {
  71. t.Errorf("Incorrect image URL, got: %s", feed.IconURL)
  72. }
  73. if len(feed.Entries) != 4 {
  74. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  75. }
  76. expectedDate := time.Date(2003, time.June, 3, 9, 39, 21, 0, time.UTC)
  77. if !feed.Entries[0].Date.Equal(expectedDate) {
  78. t.Errorf("Incorrect entry date, got: %v, want: %v", feed.Entries[0].Date, expectedDate)
  79. }
  80. if feed.Entries[0].Hash != "5b2b4ac2fe1786ddf0fd2da2f1b07f64e691264f41f2db3ea360f31bb6d9152b" {
  81. t.Errorf("Incorrect entry hash, got: %s", feed.Entries[0].Hash)
  82. }
  83. if feed.Entries[0].URL != "http://liftoff.msfc.nasa.gov/news/2003/news-starcity.asp" {
  84. t.Errorf("Incorrect entry URL, got: %s", feed.Entries[0].URL)
  85. }
  86. if feed.Entries[0].Title != "Star City" {
  87. t.Errorf("Incorrect entry title, got: %s", feed.Entries[0].Title)
  88. }
  89. if feed.Entries[0].Content != `How do Americans get ready to work with Russians aboard the International Space Station? They take a crash course in culture, language and protocol at Russia's <a href="http://howe.iki.rssi.ru/GCTC/gctc_e.htm">Star City</a>.` {
  90. t.Errorf("Incorrect entry content, got: %s", feed.Entries[0].Content)
  91. }
  92. if feed.Entries[1].URL != "http://liftoff.msfc.nasa.gov/2003/05/30.html#item572" {
  93. t.Errorf("Incorrect entry URL, got: %s", feed.Entries[1].URL)
  94. }
  95. }
  96. func TestParseFeedWithoutTitle(t *testing.T) {
  97. data := `<?xml version="1.0" encoding="utf-8"?>
  98. <rss version="2.0">
  99. <channel>
  100. <link>https://example.org/</link>
  101. </channel>
  102. </rss>`
  103. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  104. if err != nil {
  105. t.Fatal(err)
  106. }
  107. if feed.Title != "https://example.org/" {
  108. t.Errorf("Incorrect feed title, got: %s", feed.Title)
  109. }
  110. }
  111. func TestParseEntryWithoutTitleAndDescription(t *testing.T) {
  112. data := `<?xml version="1.0" encoding="utf-8"?>
  113. <rss version="2.0">
  114. <channel>
  115. <link>https://example.org/</link>
  116. <item>
  117. <link>https://example.org/item</link>
  118. </item>
  119. </channel>
  120. </rss>`
  121. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  122. if err != nil {
  123. t.Fatal(err)
  124. }
  125. if feed.Entries[0].Title != "https://example.org/item" {
  126. t.Errorf("Incorrect entry title, got: %s", feed.Entries[0].Title)
  127. }
  128. }
  129. func TestParseEntryWithoutTitleButWithDescription(t *testing.T) {
  130. data := `<?xml version="1.0" encoding="utf-8"?>
  131. <rss version="2.0">
  132. <channel>
  133. <link>https://example.org/</link>
  134. <item>
  135. <link>https://example.org/item</link>
  136. <description>
  137. This is the description
  138. </description>
  139. </item>
  140. </channel>
  141. </rss>`
  142. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  143. if err != nil {
  144. t.Fatal(err)
  145. }
  146. if feed.Entries[0].Title != "This is the description" {
  147. t.Errorf("Incorrect entry title, got: %s", feed.Entries[0].Title)
  148. }
  149. }
  150. func TestParseEntryWithMediaTitle(t *testing.T) {
  151. data := `<?xml version="1.0" encoding="utf-8"?>
  152. <rss version="2.0" xmlns:media="http://search.yahoo.com/mrss/">
  153. <channel>
  154. <link>https://example.org/</link>
  155. <item>
  156. <title>Entry Title</title>
  157. <link>https://example.org/item</link>
  158. <media:title>Media Title</media:title>
  159. </item>
  160. </channel>
  161. </rss>`
  162. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  163. if err != nil {
  164. t.Fatal(err)
  165. }
  166. if feed.Entries[0].Title != "Entry Title" {
  167. t.Errorf("Incorrect entry title, got: %q", feed.Entries[0].Title)
  168. }
  169. }
  170. func TestParseEntryWithDCTitleOnly(t *testing.T) {
  171. data := `<?xml version="1.0" encoding="utf-8"?>
  172. <rss version="2.0" xmlns:media="http://search.yahoo.com/mrss/" xmlns:dc="http://purl.org/dc/elements/1.1/">
  173. <channel>
  174. <link>https://example.org/</link>
  175. <item>
  176. <dc:title>Entry Title</dc:title>
  177. <link>https://example.org/item</link>
  178. </item>
  179. </channel>
  180. </rss>`
  181. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  182. if err != nil {
  183. t.Fatal(err)
  184. }
  185. if feed.Entries[0].Title != "Entry Title" {
  186. t.Errorf("Incorrect entry title, got: %q", feed.Entries[0].Title)
  187. }
  188. }
  189. func TestParseEntryWithoutLink(t *testing.T) {
  190. data := `<?xml version="1.0" encoding="utf-8"?>
  191. <rss version="2.0">
  192. <channel>
  193. <link>https://example.org/</link>
  194. <item>
  195. <guid isPermaLink="false">1234</guid>
  196. </item>
  197. </channel>
  198. </rss>`
  199. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  200. if err != nil {
  201. t.Fatal(err)
  202. }
  203. if feed.Entries[0].URL != "https://example.org/" {
  204. t.Errorf("Incorrect entry link, got: %s", feed.Entries[0].URL)
  205. }
  206. if feed.Entries[0].Hash != "03ac674216f3e15c761ee1a5e255f067953623c8b388b4459e13f978d7c846f4" {
  207. t.Errorf("Incorrect entry hash, got: %s", feed.Entries[0].Hash)
  208. }
  209. }
  210. func TestParseEntryWithOnlyGuidPermalink(t *testing.T) {
  211. data := `<?xml version="1.0" encoding="utf-8"?>
  212. <rss version="2.0">
  213. <channel>
  214. <link>https://example.org/</link>
  215. <item>
  216. <guid isPermaLink="true">https://example.org/some-article.html</guid>
  217. </item>
  218. <item>
  219. <guid>https://example.org/another-article.html</guid>
  220. </item>
  221. </channel>
  222. </rss>`
  223. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  224. if err != nil {
  225. t.Fatal(err)
  226. }
  227. if feed.Entries[0].URL != "https://example.org/some-article.html" {
  228. t.Errorf("Incorrect entry link, got: %s", feed.Entries[0].URL)
  229. }
  230. if feed.Entries[1].URL != "https://example.org/another-article.html" {
  231. t.Errorf("Incorrect entry link, got: %s", feed.Entries[1].URL)
  232. }
  233. }
  234. func TestParseEntryWithAtomLink(t *testing.T) {
  235. data := `<?xml version="1.0" encoding="utf-8"?>
  236. <rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  237. <channel>
  238. <link>https://example.org/</link>
  239. <item>
  240. <title>Test</title>
  241. <atom:link href="https://example.org/item" />
  242. </item>
  243. </channel>
  244. </rss>`
  245. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  246. if err != nil {
  247. t.Fatal(err)
  248. }
  249. if feed.Entries[0].URL != "https://example.org/item" {
  250. t.Errorf("Incorrect entry link, got: %s", feed.Entries[0].URL)
  251. }
  252. }
  253. func TestParseEntryWithMultipleAtomLinks(t *testing.T) {
  254. data := `<?xml version="1.0" encoding="utf-8"?>
  255. <rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  256. <channel>
  257. <link>https://example.org/</link>
  258. <item>
  259. <title>Test</title>
  260. <atom:link rel="payment" href="https://example.org/a" />
  261. <atom:link rel="alternate" href="https://example.org/b" />
  262. </item>
  263. </channel>
  264. </rss>`
  265. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  266. if err != nil {
  267. t.Fatal(err)
  268. }
  269. if feed.Entries[0].URL != "https://example.org/b" {
  270. t.Errorf("Incorrect entry link, got: %s", feed.Entries[0].URL)
  271. }
  272. }
  273. func TestParseFeedURLWithAtomLink(t *testing.T) {
  274. data := `<?xml version="1.0" encoding="utf-8"?>
  275. <rss xmlns:atom="http://www.w3.org/2005/Atom" version="2.0">
  276. <channel>
  277. <title>Example</title>
  278. <link>https://example.org/</link>
  279. <atom:link href="https://example.org/rss" type="application/rss+xml" rel="self"></atom:link>
  280. </channel>
  281. </rss>`
  282. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  283. if err != nil {
  284. t.Fatal(err)
  285. }
  286. if feed.FeedURL != "https://example.org/rss" {
  287. t.Errorf("Incorrect feed URL, got: %s", feed.FeedURL)
  288. }
  289. if feed.SiteURL != "https://example.org/" {
  290. t.Errorf("Incorrect site URL, got: %s", feed.SiteURL)
  291. }
  292. }
  293. func TestParseFeedWithWebmaster(t *testing.T) {
  294. data := `<?xml version="1.0" encoding="utf-8"?>
  295. <rss version="2.0">
  296. <channel>
  297. <title>Example</title>
  298. <link>https://example.org/</link>
  299. <webMaster>webmaster@example.com</webMaster>
  300. <item>
  301. <title>Test</title>
  302. <link>https://example.org/item</link>
  303. </item>
  304. </channel>
  305. </rss>`
  306. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  307. if err != nil {
  308. t.Fatal(err)
  309. }
  310. expected := "webmaster@example.com"
  311. result := feed.Entries[0].Author
  312. if result != expected {
  313. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  314. }
  315. }
  316. func TestParseFeedWithManagingEditor(t *testing.T) {
  317. data := `<?xml version="1.0" encoding="utf-8"?>
  318. <rss version="2.0">
  319. <channel>
  320. <title>Example</title>
  321. <link>https://example.org/</link>
  322. <webMaster>webmaster@example.com</webMaster>
  323. <managingEditor>editor@example.com</managingEditor>
  324. <item>
  325. <title>Test</title>
  326. <link>https://example.org/item</link>
  327. </item>
  328. </channel>
  329. </rss>`
  330. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  331. if err != nil {
  332. t.Fatal(err)
  333. }
  334. expected := "editor@example.com"
  335. result := feed.Entries[0].Author
  336. if result != expected {
  337. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  338. }
  339. }
  340. func TestParseEntryWithAuthorAndInnerHTML(t *testing.T) {
  341. data := `<?xml version="1.0" encoding="utf-8"?>
  342. <rss xmlns:atom="http://www.w3.org/2005/Atom" version="2.0">
  343. <channel>
  344. <title>Example</title>
  345. <link>https://example.org/</link>
  346. <atom:link href="https://example.org/rss" type="application/rss+xml" rel="self"></atom:link>
  347. <item>
  348. <title>Test</title>
  349. <link>https://example.org/item</link>
  350. <author>by <a itemprop="url" class="author" rel="author" href="/author/foobar">Foo Bar</a></author>
  351. </item>
  352. </channel>
  353. </rss>`
  354. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  355. if err != nil {
  356. t.Fatal(err)
  357. }
  358. expected := "by Foo Bar"
  359. result := feed.Entries[0].Author
  360. if result != expected {
  361. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  362. }
  363. }
  364. func TestParseEntryWithAuthorAndCDATA(t *testing.T) {
  365. data := `<?xml version="1.0" encoding="utf-8"?>
  366. <rss xmlns:atom="http://www.w3.org/2005/Atom" version="2.0">
  367. <channel>
  368. <title>Example</title>
  369. <link>https://example.org/</link>
  370. <atom:link href="https://example.org/rss" type="application/rss+xml" rel="self"></atom:link>
  371. <item>
  372. <title>Test</title>
  373. <link>https://example.org/item</link>
  374. <author>
  375. <![CDATA[by Foo Bar]]>
  376. </author>
  377. </item>
  378. </channel>
  379. </rss>`
  380. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  381. if err != nil {
  382. t.Fatal(err)
  383. }
  384. expected := "by Foo Bar"
  385. result := feed.Entries[0].Author
  386. if result != expected {
  387. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  388. }
  389. }
  390. func TestParseEntryWithAtomAuthorEmail(t *testing.T) {
  391. data := `<?xml version="1.0" encoding="utf-8"?>
  392. <rss xmlns:atom="http://www.w3.org/2005/Atom" version="2.0">
  393. <channel>
  394. <title>Example</title>
  395. <link>https://example.org/</link>
  396. <atom:link href="https://example.org/rss" type="application/rss+xml" rel="self"></atom:link>
  397. <item>
  398. <title>Test</title>
  399. <link>https://example.org/item</link>
  400. <atom:author>
  401. <email>author@example.org</email>
  402. </atom:author>
  403. </item>
  404. </channel>
  405. </rss>`
  406. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  407. if err != nil {
  408. t.Fatal(err)
  409. }
  410. expected := "author@example.org"
  411. result := feed.Entries[0].Author
  412. if result != expected {
  413. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  414. }
  415. }
  416. func TestParseEntryWithAtomAuthorName(t *testing.T) {
  417. data := `<?xml version="1.0" encoding="utf-8"?>
  418. <rss xmlns:atom="http://www.w3.org/2005/Atom" version="2.0">
  419. <channel>
  420. <title>Example</title>
  421. <link>https://example.org/</link>
  422. <atom:link href="https://example.org/rss" type="application/rss+xml" rel="self"></atom:link>
  423. <item>
  424. <title>Test</title>
  425. <link>https://example.org/item</link>
  426. <atom:author>
  427. <name>Foo Bar</name>
  428. </atom:author>
  429. </item>
  430. </channel>
  431. </rss>`
  432. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  433. if err != nil {
  434. t.Fatal(err)
  435. }
  436. expected := "Foo Bar"
  437. result := feed.Entries[0].Author
  438. if result != expected {
  439. t.Errorf("Incorrect entry author, got: %q instead of %q", result, expected)
  440. }
  441. }
  442. func TestParseEntryWithDublinCoreAuthor(t *testing.T) {
  443. data := `<?xml version="1.0" encoding="utf-8"?>
  444. <rss version="2.0" xmlns:dc="http://purl.org/dc/elements/1.1/">
  445. <channel>
  446. <title>Example</title>
  447. <link>https://example.org/</link>
  448. <item>
  449. <title>Test</title>
  450. <link>https://example.org/item</link>
  451. <dc:creator>Me (me@example.com)</dc:creator>
  452. </item>
  453. </channel>
  454. </rss>`
  455. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  456. if err != nil {
  457. t.Fatal(err)
  458. }
  459. expected := "Me (me@example.com)"
  460. result := feed.Entries[0].Author
  461. if result != expected {
  462. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  463. }
  464. }
  465. func TestParseEntryWithItunesAuthor(t *testing.T) {
  466. data := `<?xml version="1.0" encoding="utf-8"?>
  467. <rss version="2.0" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd">
  468. <channel>
  469. <title>Example</title>
  470. <link>https://example.org/</link>
  471. <item>
  472. <title>Test</title>
  473. <link>https://example.org/item</link>
  474. <itunes:author>Someone</itunes:author>
  475. </item>
  476. </channel>
  477. </rss>`
  478. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  479. if err != nil {
  480. t.Fatal(err)
  481. }
  482. expected := "Someone"
  483. result := feed.Entries[0].Author
  484. if result != expected {
  485. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  486. }
  487. }
  488. func TestParseFeedWithItunesAuthor(t *testing.T) {
  489. data := `<?xml version="1.0" encoding="utf-8"?>
  490. <rss version="2.0" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd">
  491. <channel>
  492. <title>Example</title>
  493. <link>https://example.org/</link>
  494. <itunes:author>Someone</itunes:author>
  495. <item>
  496. <title>Test</title>
  497. <link>https://example.org/item</link>
  498. </item>
  499. </channel>
  500. </rss>`
  501. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  502. if err != nil {
  503. t.Fatal(err)
  504. }
  505. expected := "Someone"
  506. result := feed.Entries[0].Author
  507. if result != expected {
  508. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  509. }
  510. }
  511. func TestParseFeedWithItunesOwner(t *testing.T) {
  512. data := `<?xml version="1.0" encoding="utf-8"?>
  513. <rss version="2.0" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd">
  514. <channel>
  515. <title>Example</title>
  516. <link>https://example.org/</link>
  517. <itunes:owner>
  518. <itunes:name>John Doe</itunes:name>
  519. <itunes:email>john.doe@example.com</itunes:email>
  520. </itunes:owner>
  521. <item>
  522. <title>Test</title>
  523. <link>https://example.org/item</link>
  524. </item>
  525. </channel>
  526. </rss>`
  527. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  528. if err != nil {
  529. t.Fatal(err)
  530. }
  531. expected := "John Doe"
  532. result := feed.Entries[0].Author
  533. if result != expected {
  534. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  535. }
  536. }
  537. func TestParseFeedWithItunesOwnerEmail(t *testing.T) {
  538. data := `<?xml version="1.0" encoding="utf-8"?>
  539. <rss version="2.0" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd">
  540. <channel>
  541. <title>Example</title>
  542. <link>https://example.org/</link>
  543. <itunes:owner>
  544. <itunes:email>john.doe@example.com</itunes:email>
  545. </itunes:owner>
  546. <item>
  547. <title>Test</title>
  548. <link>https://example.org/item</link>
  549. </item>
  550. </channel>
  551. </rss>`
  552. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  553. if err != nil {
  554. t.Fatal(err)
  555. }
  556. expected := "john.doe@example.com"
  557. result := feed.Entries[0].Author
  558. if result != expected {
  559. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  560. }
  561. }
  562. func TestParseEntryWithGooglePlayAuthor(t *testing.T) {
  563. data := `<?xml version="1.0" encoding="utf-8"?>
  564. <rss version="2.0" xmlns:googleplay="http://www.google.com/schemas/play-podcasts/1.0">
  565. <channel>
  566. <title>Example</title>
  567. <link>https://example.org/</link>
  568. <item>
  569. <title>Test</title>
  570. <link>https://example.org/item</link>
  571. <googleplay:author>Someone</googleplay:author>
  572. </item>
  573. </channel>
  574. </rss>`
  575. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  576. if err != nil {
  577. t.Fatal(err)
  578. }
  579. expected := "Someone"
  580. result := feed.Entries[0].Author
  581. if result != expected {
  582. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  583. }
  584. }
  585. func TestParseFeedWithGooglePlayAuthor(t *testing.T) {
  586. data := `<?xml version="1.0" encoding="utf-8"?>
  587. <rss version="2.0" xmlns:googleplay="http://www.google.com/schemas/play-podcasts/1.0">
  588. <channel>
  589. <title>Example</title>
  590. <link>https://example.org/</link>
  591. <googleplay:author>Someone</googleplay:author>
  592. <item>
  593. <title>Test</title>
  594. <link>https://example.org/item</link>
  595. </item>
  596. </channel>
  597. </rss>`
  598. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  599. if err != nil {
  600. t.Fatal(err)
  601. }
  602. expected := "Someone"
  603. result := feed.Entries[0].Author
  604. if result != expected {
  605. t.Errorf("Incorrect entry author, got %q instead of %q", result, expected)
  606. }
  607. }
  608. func TestParseEntryWithDublinCoreDate(t *testing.T) {
  609. data := `<?xml version="1.0" encoding="utf-8"?>
  610. <rss version="2.0" xmlns:dc="http://purl.org/dc/elements/1.1/">
  611. <channel>
  612. <title>Example</title>
  613. <link>http://example.org/</link>
  614. <item>
  615. <title>Item 1</title>
  616. <link>http://example.org/item1</link>
  617. <description>Description.</description>
  618. <guid isPermaLink="false">UUID</guid>
  619. <dc:date>2002-09-29T23:40:06-05:00</dc:date>
  620. </item>
  621. </channel>
  622. </rss>`
  623. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  624. if err != nil {
  625. t.Fatal(err)
  626. }
  627. location, _ := time.LoadLocation("EST")
  628. expectedDate := time.Date(2002, time.September, 29, 23, 40, 06, 0, location)
  629. if !feed.Entries[0].Date.Equal(expectedDate) {
  630. t.Errorf("Incorrect entry date, got: %v, want: %v", feed.Entries[0].Date, expectedDate)
  631. }
  632. }
  633. func TestParseEntryWithContentEncoded(t *testing.T) {
  634. data := `<?xml version="1.0" encoding="utf-8"?>
  635. <rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
  636. <channel>
  637. <title>Example</title>
  638. <link>http://example.org/</link>
  639. <item>
  640. <title>Item 1</title>
  641. <link>http://example.org/item1</link>
  642. <description>Description.</description>
  643. <guid isPermaLink="false">UUID</guid>
  644. <content:encoded><![CDATA[<p><a href="http://www.example.org/">Example</a>.</p>]]></content:encoded>
  645. </item>
  646. </channel>
  647. </rss>`
  648. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  649. if err != nil {
  650. t.Fatal(err)
  651. }
  652. if feed.Entries[0].Content != `<p><a href="http://www.example.org/">Example</a>.</p>` {
  653. t.Errorf("Incorrect entry content, got: %s", feed.Entries[0].Content)
  654. }
  655. }
  656. func TestParseEntryWithFeedBurnerLink(t *testing.T) {
  657. data := `<?xml version="1.0" encoding="utf-8"?>
  658. <rss version="2.0" xmlns:feedburner="http://rssnamespace.org/feedburner/ext/1.0">
  659. <channel>
  660. <title>Example</title>
  661. <link>http://example.org/</link>
  662. <item>
  663. <title>Item 1</title>
  664. <link>http://example.org/item1</link>
  665. <feedburner:origLink>http://example.org/original</feedburner:origLink>
  666. </item>
  667. </channel>
  668. </rss>`
  669. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  670. if err != nil {
  671. t.Fatal(err)
  672. }
  673. if feed.Entries[0].URL != "http://example.org/original" {
  674. t.Errorf("Incorrect entry content, got: %s", feed.Entries[0].URL)
  675. }
  676. }
  677. func TestParseEntryTitleWithWhitespaces(t *testing.T) {
  678. data := `<?xml version="1.0" encoding="utf-8"?>
  679. <rss version="2.0">
  680. <channel>
  681. <title>Example</title>
  682. <link>http://example.org</link>
  683. <item>
  684. <title>
  685. Some Title
  686. </title>
  687. <link>http://www.example.org/entries/1</link>
  688. <pubDate>Fri, 15 Jul 2005 00:00:00 -0500</pubDate>
  689. </item>
  690. </channel>
  691. </rss>`
  692. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  693. if err != nil {
  694. t.Fatal(err)
  695. }
  696. if feed.Entries[0].Title != "Some Title" {
  697. t.Errorf("Incorrect entry title, got: %s", feed.Entries[0].Title)
  698. }
  699. }
  700. func TestParseEntryWithEnclosures(t *testing.T) {
  701. data := `<?xml version="1.0" encoding="utf-8"?>
  702. <rss version="2.0">
  703. <channel>
  704. <title>My Podcast Feed</title>
  705. <link>http://example.org</link>
  706. <author>some.email@example.org</author>
  707. <item>
  708. <title>Podcasting with RSS</title>
  709. <link>http://www.example.org/entries/1</link>
  710. <description>An overview of RSS podcasting</description>
  711. <pubDate>Fri, 15 Jul 2005 00:00:00 -0500</pubDate>
  712. <guid isPermaLink="true">http://www.example.org/entries/1</guid>
  713. <enclosure url="http://www.example.org/myaudiofile.mp3"
  714. length="12345"
  715. type="audio/mpeg" />
  716. </item>
  717. </channel>
  718. </rss>`
  719. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  720. if err != nil {
  721. t.Fatal(err)
  722. }
  723. if len(feed.Entries) != 1 {
  724. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  725. }
  726. if feed.Entries[0].URL != "http://www.example.org/entries/1" {
  727. t.Errorf("Incorrect entry URL, got: %s", feed.Entries[0].URL)
  728. }
  729. if len(feed.Entries[0].Enclosures) != 1 {
  730. t.Errorf("Incorrect number of enclosures, got: %d", len(feed.Entries[0].Enclosures))
  731. }
  732. if feed.Entries[0].Enclosures[0].URL != "http://www.example.org/myaudiofile.mp3" {
  733. t.Errorf("Incorrect enclosure URL, got: %s", feed.Entries[0].Enclosures[0].URL)
  734. }
  735. if feed.Entries[0].Enclosures[0].MimeType != "audio/mpeg" {
  736. t.Errorf("Incorrect enclosure type, got: %s", feed.Entries[0].Enclosures[0].MimeType)
  737. }
  738. if feed.Entries[0].Enclosures[0].Size != 12345 {
  739. t.Errorf("Incorrect enclosure length, got: %d", feed.Entries[0].Enclosures[0].Size)
  740. }
  741. }
  742. func TestParseEntryWithEmptyEnclosureURL(t *testing.T) {
  743. data := `<?xml version="1.0" encoding="utf-8"?>
  744. <rss version="2.0">
  745. <channel>
  746. <title>My Podcast Feed</title>
  747. <link>http://example.org</link>
  748. <author>some.email@example.org</author>
  749. <item>
  750. <title>Podcasting with RSS</title>
  751. <link>http://www.example.org/entries/1</link>
  752. <description>An overview of RSS podcasting</description>
  753. <pubDate>Fri, 15 Jul 2005 00:00:00 -0500</pubDate>
  754. <guid isPermaLink="true">http://www.example.org/entries/1</guid>
  755. <enclosure url="" length="0"/>
  756. </item>
  757. </channel>
  758. </rss>`
  759. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  760. if err != nil {
  761. t.Fatal(err)
  762. }
  763. if len(feed.Entries) != 1 {
  764. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  765. }
  766. if feed.Entries[0].URL != "http://www.example.org/entries/1" {
  767. t.Errorf("Incorrect entry URL, got: %s", feed.Entries[0].URL)
  768. }
  769. if len(feed.Entries[0].Enclosures) != 0 {
  770. t.Errorf("Incorrect number of enclosures, got: %d", len(feed.Entries[0].Enclosures))
  771. }
  772. }
  773. func TestParseEntryWithFeedBurnerEnclosures(t *testing.T) {
  774. data := `<?xml version="1.0" encoding="utf-8"?>
  775. <rss version="2.0" xmlns:feedburner="http://rssnamespace.org/feedburner/ext/1.0">
  776. <channel>
  777. <title>My Example Feed</title>
  778. <link>http://example.org</link>
  779. <author>some.email@example.org</author>
  780. <item>
  781. <title>Example Item</title>
  782. <link>http://www.example.org/entries/1</link>
  783. <enclosure
  784. url="http://feedproxy.google.com/~r/example/~5/lpMyFSCvubs/File.mp3"
  785. length="76192460"
  786. type="audio/mpeg" />
  787. <feedburner:origEnclosureLink>http://example.org/67ca416c-f22a-4228-a681-68fc9998ec10/File.mp3</feedburner:origEnclosureLink>
  788. </item>
  789. </channel>
  790. </rss>`
  791. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  792. if err != nil {
  793. t.Fatal(err)
  794. }
  795. if len(feed.Entries) != 1 {
  796. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  797. }
  798. if feed.Entries[0].URL != "http://www.example.org/entries/1" {
  799. t.Errorf("Incorrect entry URL, got: %s", feed.Entries[0].URL)
  800. }
  801. if len(feed.Entries[0].Enclosures) != 1 {
  802. t.Errorf("Incorrect number of enclosures, got: %d", len(feed.Entries[0].Enclosures))
  803. }
  804. if feed.Entries[0].Enclosures[0].URL != "http://example.org/67ca416c-f22a-4228-a681-68fc9998ec10/File.mp3" {
  805. t.Errorf("Incorrect enclosure URL, got: %s", feed.Entries[0].Enclosures[0].URL)
  806. }
  807. if feed.Entries[0].Enclosures[0].MimeType != "audio/mpeg" {
  808. t.Errorf("Incorrect enclosure type, got: %s", feed.Entries[0].Enclosures[0].MimeType)
  809. }
  810. if feed.Entries[0].Enclosures[0].Size != 76192460 {
  811. t.Errorf("Incorrect enclosure length, got: %d", feed.Entries[0].Enclosures[0].Size)
  812. }
  813. }
  814. func TestParseEntryWithRelativeURL(t *testing.T) {
  815. data := `<?xml version="1.0" encoding="utf-8"?>
  816. <rss version="2.0">
  817. <channel>
  818. <link>https://example.org/</link>
  819. <item>
  820. <link>item.html</link>
  821. </item>
  822. </channel>
  823. </rss>`
  824. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  825. if err != nil {
  826. t.Fatal(err)
  827. }
  828. if feed.Entries[0].Title != "https://example.org/item.html" {
  829. t.Errorf("Incorrect entry title, got: %s", feed.Entries[0].Title)
  830. }
  831. }
  832. func TestParseEntryWithCommentsURL(t *testing.T) {
  833. data := `<?xml version="1.0" encoding="utf-8"?>
  834. <rss version="2.0" xmlns:slash="http://purl.org/rss/1.0/modules/slash/">
  835. <channel>
  836. <link>https://example.org/</link>
  837. <item>
  838. <title>Item 1</title>
  839. <link>https://example.org/item1</link>
  840. <comments>
  841. https://example.org/comments
  842. </comments>
  843. <slash:comments>42</slash:comments>
  844. </item>
  845. </channel>
  846. </rss>`
  847. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  848. if err != nil {
  849. t.Fatal(err)
  850. }
  851. if feed.Entries[0].CommentsURL != "https://example.org/comments" {
  852. t.Errorf("Incorrect entry comments URL, got: %q", feed.Entries[0].CommentsURL)
  853. }
  854. }
  855. func TestParseEntryWithInvalidCommentsURL(t *testing.T) {
  856. data := `<?xml version="1.0" encoding="utf-8"?>
  857. <rss version="2.0" xmlns:slash="http://purl.org/rss/1.0/modules/slash/">
  858. <channel>
  859. <link>https://example.org/</link>
  860. <item>
  861. <title>Item 1</title>
  862. <link>https://example.org/item1</link>
  863. <comments>
  864. Some text
  865. </comments>
  866. </item>
  867. </channel>
  868. </rss>`
  869. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  870. if err != nil {
  871. t.Fatal(err)
  872. }
  873. if feed.Entries[0].CommentsURL != "" {
  874. t.Errorf("Incorrect entry comments URL, got: %q", feed.Entries[0].CommentsURL)
  875. }
  876. }
  877. func TestParseInvalidXml(t *testing.T) {
  878. data := `garbage`
  879. _, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  880. if err == nil {
  881. t.Error("Parse should returns an error")
  882. }
  883. }
  884. func TestParseFeedTitleWithHTMLEntity(t *testing.T) {
  885. data := `<?xml version="1.0" encoding="utf-8"?>
  886. <rss version="2.0" xmlns:slash="http://purl.org/rss/1.0/modules/slash/">
  887. <channel>
  888. <link>https://example.org/</link>
  889. <title>Example &nbsp; Feed</title>
  890. </channel>
  891. </rss>`
  892. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  893. if err != nil {
  894. t.Fatal(err)
  895. }
  896. if feed.Title != "Example \u00a0 Feed" {
  897. t.Errorf(`Incorrect title, got: %q`, feed.Title)
  898. }
  899. }
  900. func TestParseFeedTitleWithUnicodeEntityAndCdata(t *testing.T) {
  901. data := `<?xml version="1.0" encoding="utf-8"?>
  902. <rss version="2.0" xmlns:slash="http://purl.org/rss/1.0/modules/slash/">
  903. <channel>
  904. <link>https://example.org/</link>
  905. <title><![CDATA[Jenny&#8217;s Newsletter]]></title>
  906. </channel>
  907. </rss>`
  908. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  909. if err != nil {
  910. t.Fatal(err)
  911. }
  912. if feed.Title != `Jenny’s Newsletter` {
  913. t.Errorf(`Incorrect title, got: %q`, feed.Title)
  914. }
  915. }
  916. func TestParseItemTitleWithHTMLEntity(t *testing.T) {
  917. data := `<?xml version="1.0" encoding="utf-8"?>
  918. <rss version="2.0" xmlns:slash="http://purl.org/rss/1.0/modules/slash/">
  919. <channel>
  920. <link>https://example.org/</link>
  921. <title>Example</title>
  922. <item>
  923. <title>&lt;/example&gt;</title>
  924. <link>http://www.example.org/entries/1</link>
  925. </item>
  926. </channel>
  927. </rss>`
  928. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  929. if err != nil {
  930. t.Fatal(err)
  931. }
  932. if feed.Entries[0].Title != "</example>" {
  933. t.Errorf(`Incorrect title, got: %q`, feed.Entries[0].Title)
  934. }
  935. }
  936. func TestParseItemTitleWithNumericCharacterReference(t *testing.T) {
  937. data := `<?xml version="1.0" encoding="utf-8"?>
  938. <rss version="2.0" xmlns:slash="http://purl.org/rss/1.0/modules/slash/">
  939. <channel>
  940. <link>https://example.org/</link>
  941. <title>Example</title>
  942. <item>
  943. <title>&#931; &#xDF;</title>
  944. <link>http://www.example.org/article.html</link>
  945. </item>
  946. </channel>
  947. </rss>`
  948. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  949. if err != nil {
  950. t.Fatal(err)
  951. }
  952. if feed.Entries[0].Title != "Σ ß" {
  953. t.Errorf(`Incorrect title, got: %q`, feed.Entries[0].Title)
  954. }
  955. }
  956. func TestParseItemTitleWithDoubleEncodedEntities(t *testing.T) {
  957. data := `<?xml version="1.0" encoding="utf-8"?>
  958. <rss version="2.0" xmlns:slash="http://purl.org/rss/1.0/modules/slash/">
  959. <channel>
  960. <link>https://example.org/</link>
  961. <title>Example</title>
  962. <item>
  963. <title>&amp;#39;Text&amp;#39;</title>
  964. <link>http://www.example.org/article.html</link>
  965. </item>
  966. </channel>
  967. </rss>`
  968. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  969. if err != nil {
  970. t.Fatal(err)
  971. }
  972. if feed.Entries[0].Title != "'Text'" {
  973. t.Errorf(`Incorrect title, got: %q`, feed.Entries[0].Title)
  974. }
  975. }
  976. func TestParseFeedLinkWithInvalidCharacterEntity(t *testing.T) {
  977. data := `<?xml version="1.0" encoding="utf-8"?>
  978. <rss version="2.0" xmlns:slash="http://purl.org/rss/1.0/modules/slash/">
  979. <channel>
  980. <link>https://example.org/a&b</link>
  981. <title>Example Feed</title>
  982. </channel>
  983. </rss>`
  984. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  985. if err != nil {
  986. t.Fatal(err)
  987. }
  988. if feed.SiteURL != "https://example.org/a&b" {
  989. t.Errorf(`Incorrect url, got: %q`, feed.SiteURL)
  990. }
  991. }
  992. func TestParseEntryWithMediaGroup(t *testing.T) {
  993. data := `<?xml version="1.0" encoding="utf-8"?>
  994. <rss version="2.0" xmlns:media="http://search.yahoo.com/mrss/">
  995. <channel>
  996. <title>My Example Feed</title>
  997. <link>http://example.org</link>
  998. <item>
  999. <title>Example Item</title>
  1000. <link>http://www.example.org/entries/1</link>
  1001. <enclosure type="application/x-bittorrent" url="https://example.org/file3.torrent" length="670053113">
  1002. </enclosure>
  1003. <media:group>
  1004. <media:content type="application/x-bittorrent" url="https://example.org/file1.torrent"></media:content>
  1005. <media:content type="application/x-bittorrent" url="https://example.org/file2.torrent" isDefault="true"></media:content>
  1006. <media:content type="application/x-bittorrent" url="https://example.org/file3.torrent"></media:content>
  1007. <media:content type="application/x-bittorrent" url="https://example.org/file4.torrent"></media:content>
  1008. <media:content type="application/x-bittorrent" url="https://example.org/file5.torrent" fileSize="42"></media:content>
  1009. <media:rating>nonadult</media:rating>
  1010. </media:group>
  1011. <media:thumbnail url="https://example.org/image.jpg" height="122" width="223"></media:thumbnail>
  1012. </item>
  1013. </channel>
  1014. </rss>`
  1015. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1016. if err != nil {
  1017. t.Fatal(err)
  1018. }
  1019. if len(feed.Entries) != 1 {
  1020. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  1021. }
  1022. if len(feed.Entries[0].Enclosures) != 6 {
  1023. t.Fatalf("Incorrect number of enclosures, got: %d", len(feed.Entries[0].Enclosures))
  1024. }
  1025. expectedResults := []struct {
  1026. url string
  1027. mimeType string
  1028. size int64
  1029. }{
  1030. {"https://example.org/image.jpg", "image/*", 0},
  1031. {"https://example.org/file3.torrent", "application/x-bittorrent", 670053113},
  1032. {"https://example.org/file1.torrent", "application/x-bittorrent", 0},
  1033. {"https://example.org/file2.torrent", "application/x-bittorrent", 0},
  1034. {"https://example.org/file4.torrent", "application/x-bittorrent", 0},
  1035. {"https://example.org/file5.torrent", "application/x-bittorrent", 42},
  1036. }
  1037. for index, enclosure := range feed.Entries[0].Enclosures {
  1038. if expectedResults[index].url != enclosure.URL {
  1039. t.Errorf(`Unexpected enclosure URL, got %q instead of %q`, enclosure.URL, expectedResults[index].url)
  1040. }
  1041. if expectedResults[index].mimeType != enclosure.MimeType {
  1042. t.Errorf(`Unexpected enclosure type, got %q instead of %q`, enclosure.MimeType, expectedResults[index].mimeType)
  1043. }
  1044. if expectedResults[index].size != enclosure.Size {
  1045. t.Errorf(`Unexpected enclosure size, got %d instead of %d`, enclosure.Size, expectedResults[index].size)
  1046. }
  1047. }
  1048. }
  1049. func TestParseEntryWithMediaContent(t *testing.T) {
  1050. data := `<?xml version="1.0" encoding="utf-8"?>
  1051. <rss version="2.0" xmlns:media="http://search.yahoo.com/mrss/">
  1052. <channel>
  1053. <title>My Example Feed</title>
  1054. <link>http://example.org</link>
  1055. <item>
  1056. <title>Example Item</title>
  1057. <link>http://www.example.org/entries/1</link>
  1058. <media:thumbnail url="https://example.org/thumbnail.jpg" />
  1059. <media:content url="https://example.org/media1.jpg" medium="image">
  1060. <media:title type="html">Some Title for Media 1</media:title>
  1061. </media:content>
  1062. <media:content url="https://example.org/media2.jpg" medium="image" />
  1063. </item>
  1064. </channel>
  1065. </rss>`
  1066. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1067. if err != nil {
  1068. t.Fatal(err)
  1069. }
  1070. if len(feed.Entries) != 1 {
  1071. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  1072. }
  1073. if len(feed.Entries[0].Enclosures) != 3 {
  1074. t.Fatalf("Incorrect number of enclosures, got: %d", len(feed.Entries[0].Enclosures))
  1075. }
  1076. expectedResults := []struct {
  1077. url string
  1078. mimeType string
  1079. size int64
  1080. }{
  1081. {"https://example.org/thumbnail.jpg", "image/*", 0},
  1082. {"https://example.org/media1.jpg", "image/*", 0},
  1083. {"https://example.org/media2.jpg", "image/*", 0},
  1084. }
  1085. for index, enclosure := range feed.Entries[0].Enclosures {
  1086. if expectedResults[index].url != enclosure.URL {
  1087. t.Errorf(`Unexpected enclosure URL, got %q instead of %q`, enclosure.URL, expectedResults[index].url)
  1088. }
  1089. if expectedResults[index].mimeType != enclosure.MimeType {
  1090. t.Errorf(`Unexpected enclosure type, got %q instead of %q`, enclosure.MimeType, expectedResults[index].mimeType)
  1091. }
  1092. if expectedResults[index].size != enclosure.Size {
  1093. t.Errorf(`Unexpected enclosure size, got %d instead of %d`, enclosure.Size, expectedResults[index].size)
  1094. }
  1095. }
  1096. }
  1097. func TestParseEntryWithMediaPeerLink(t *testing.T) {
  1098. data := `<?xml version="1.0" encoding="utf-8"?>
  1099. <rss version="2.0" xmlns:media="http://search.yahoo.com/mrss/">
  1100. <channel>
  1101. <title>My Example Feed</title>
  1102. <link>http://example.org</link>
  1103. <item>
  1104. <title>Example Item</title>
  1105. <link>http://www.example.org/entries/1</link>
  1106. <media:peerLink type="application/x-bittorrent" href="http://www.example.org/file.torrent" />
  1107. </item>
  1108. </channel>
  1109. </rss>`
  1110. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1111. if err != nil {
  1112. t.Fatal(err)
  1113. }
  1114. if len(feed.Entries) != 1 {
  1115. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  1116. }
  1117. if len(feed.Entries[0].Enclosures) != 1 {
  1118. t.Fatalf("Incorrect number of enclosures, got: %d", len(feed.Entries[0].Enclosures))
  1119. }
  1120. expectedResults := []struct {
  1121. url string
  1122. mimeType string
  1123. size int64
  1124. }{
  1125. {"http://www.example.org/file.torrent", "application/x-bittorrent", 0},
  1126. }
  1127. for index, enclosure := range feed.Entries[0].Enclosures {
  1128. if expectedResults[index].url != enclosure.URL {
  1129. t.Errorf(`Unexpected enclosure URL, got %q instead of %q`, enclosure.URL, expectedResults[index].url)
  1130. }
  1131. if expectedResults[index].mimeType != enclosure.MimeType {
  1132. t.Errorf(`Unexpected enclosure type, got %q instead of %q`, enclosure.MimeType, expectedResults[index].mimeType)
  1133. }
  1134. if expectedResults[index].size != enclosure.Size {
  1135. t.Errorf(`Unexpected enclosure size, got %d instead of %d`, enclosure.Size, expectedResults[index].size)
  1136. }
  1137. }
  1138. }
  1139. func TestEntryDescriptionFromItunesSummary(t *testing.T) {
  1140. data := `<?xml version="1.0" encoding="UTF-8"?>
  1141. <rss version="2.0" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd">
  1142. <channel>
  1143. <title>Podcast Example</title>
  1144. <link>http://www.example.com/index.html</link>
  1145. <item>
  1146. <title>Podcast Episode</title>
  1147. <guid>http://example.com/episode.m4a</guid>
  1148. <pubDate>Tue, 08 Mar 2016 12:00:00 GMT</pubDate>
  1149. <itunes:subtitle>Episode Subtitle</itunes:subtitle>
  1150. <itunes:summary>Episode Summary</itunes:summary>
  1151. </item>
  1152. </channel>
  1153. </rss>`
  1154. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1155. if err != nil {
  1156. t.Fatal(err)
  1157. }
  1158. if len(feed.Entries) != 1 {
  1159. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  1160. }
  1161. expected := "Episode Summary"
  1162. result := feed.Entries[0].Content
  1163. if expected != result {
  1164. t.Errorf(`Unexpected podcast content, got %q instead of %q`, result, expected)
  1165. }
  1166. }
  1167. func TestEntryDescriptionFromItunesSubtitle(t *testing.T) {
  1168. data := `<?xml version="1.0" encoding="UTF-8"?>
  1169. <rss version="2.0" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd">
  1170. <channel>
  1171. <title>Podcast Example</title>
  1172. <link>http://www.example.com/index.html</link>
  1173. <item>
  1174. <title>Podcast Episode</title>
  1175. <guid>http://example.com/episode.m4a</guid>
  1176. <pubDate>Tue, 08 Mar 2016 12:00:00 GMT</pubDate>
  1177. <itunes:subtitle>Episode Subtitle</itunes:subtitle>
  1178. </item>
  1179. </channel>
  1180. </rss>`
  1181. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1182. if err != nil {
  1183. t.Fatal(err)
  1184. }
  1185. if len(feed.Entries) != 1 {
  1186. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  1187. }
  1188. expected := "Episode Subtitle"
  1189. result := feed.Entries[0].Content
  1190. if expected != result {
  1191. t.Errorf(`Unexpected podcast content, got %q instead of %q`, result, expected)
  1192. }
  1193. }
  1194. func TestEntryDescriptionFromGooglePlayDescription(t *testing.T) {
  1195. data := `<?xml version="1.0" encoding="UTF-8"?>
  1196. <rss version="2.0"
  1197. xmlns:googleplay="http://www.google.com/schemas/play-podcasts/1.0"
  1198. xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd">
  1199. <channel>
  1200. <title>Podcast Example</title>
  1201. <link>http://www.example.com/index.html</link>
  1202. <item>
  1203. <title>Podcast Episode</title>
  1204. <guid>http://example.com/episode.m4a</guid>
  1205. <pubDate>Tue, 08 Mar 2016 12:00:00 GMT</pubDate>
  1206. <itunes:subtitle>Episode Subtitle</itunes:subtitle>
  1207. <googleplay:description>Episode Description</googleplay:description>
  1208. </item>
  1209. </channel>
  1210. </rss>`
  1211. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1212. if err != nil {
  1213. t.Fatal(err)
  1214. }
  1215. if len(feed.Entries) != 1 {
  1216. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  1217. }
  1218. expected := "Episode Description"
  1219. result := feed.Entries[0].Content
  1220. if expected != result {
  1221. t.Errorf(`Unexpected podcast content, got %q instead of %q`, result, expected)
  1222. }
  1223. }
  1224. func TestParseEntryWithRSSDescriptionAndMediaDescription(t *testing.T) {
  1225. data := `<?xml version="1.0" encoding="UTF-8"?>
  1226. <rss version="2.0" xmlns:media="http://search.yahoo.com/mrss/">
  1227. <channel>
  1228. <title>Podcast Example</title>
  1229. <link>http://www.example.com/index.html</link>
  1230. <item>
  1231. <title>Entry Title</title>
  1232. <link>http://www.example.com/entries/1</link>
  1233. <description>Entry Description</description>
  1234. <media:description type="plain">Media Description</media:description>
  1235. </item>
  1236. </channel>
  1237. </rss>`
  1238. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1239. if err != nil {
  1240. t.Fatal(err)
  1241. }
  1242. if len(feed.Entries) != 1 {
  1243. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  1244. }
  1245. expected := "Entry Description"
  1246. result := feed.Entries[0].Content
  1247. if expected != result {
  1248. t.Errorf(`Unexpected description, got %q instead of %q`, result, expected)
  1249. }
  1250. }
  1251. func TestParseFeedWithCategories(t *testing.T) {
  1252. data := `<?xml version="1.0" encoding="utf-8"?>
  1253. <rss xmlns:atom="http://www.w3.org/2005/Atom" version="2.0">
  1254. <channel>
  1255. <title>Example</title>
  1256. <link>https://example.org/</link>
  1257. <category>Category 1</category>
  1258. <category><![CDATA[Category 2]]></category>
  1259. <item>
  1260. <title>Test</title>
  1261. <link>https://example.org/item</link>
  1262. </item>
  1263. </channel>
  1264. </rss>`
  1265. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1266. if err != nil {
  1267. t.Fatal(err)
  1268. }
  1269. if len(feed.Entries[0].Tags) != 2 {
  1270. t.Errorf("Incorrect number of tags, got: %d", len(feed.Entries[0].Tags))
  1271. }
  1272. expected := []string{"Category 1", "Category 2"}
  1273. result := feed.Entries[0].Tags
  1274. for i, tag := range result {
  1275. if tag != expected[i] {
  1276. t.Errorf("Incorrect tag, got: %q", tag)
  1277. }
  1278. }
  1279. }
  1280. func TestParseEntryWithCategories(t *testing.T) {
  1281. data := `<?xml version="1.0" encoding="utf-8"?>
  1282. <rss xmlns:atom="http://www.w3.org/2005/Atom" version="2.0">
  1283. <channel>
  1284. <title>Example</title>
  1285. <link>https://example.org/</link>
  1286. <category>Category 3</category>
  1287. <item>
  1288. <title>Test</title>
  1289. <link>https://example.org/item</link>
  1290. <category>Category 1</category>
  1291. <category><![CDATA[Category 2]]></category>
  1292. </item>
  1293. </channel>
  1294. </rss>`
  1295. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1296. if err != nil {
  1297. t.Fatal(err)
  1298. }
  1299. if len(feed.Entries[0].Tags) != 3 {
  1300. t.Errorf("Incorrect number of tags, got: %d", len(feed.Entries[0].Tags))
  1301. }
  1302. expected := []string{"Category 1", "Category 2", "Category 3"}
  1303. result := feed.Entries[0].Tags
  1304. for i, tag := range result {
  1305. if tag != expected[i] {
  1306. t.Errorf("Incorrect tag, got: %q", tag)
  1307. }
  1308. }
  1309. }
  1310. func TestParseFeedWithItunesCategories(t *testing.T) {
  1311. data := `<?xml version="1.0" encoding="utf-8"?>
  1312. <rss xmlns:atom="http://www.w3.org/2005/Atom" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd" version="2.0">
  1313. <channel>
  1314. <title>Example</title>
  1315. <link>https://example.org/</link>
  1316. <itunes:category text="Society &amp; Culture">
  1317. <itunes:category text="Documentary" />
  1318. </itunes:category>
  1319. <itunes:category text="Health">
  1320. <itunes:category text="Mental Health" />
  1321. </itunes:category>
  1322. <item>
  1323. <title>Test</title>
  1324. <link>https://example.org/item</link>
  1325. </item>
  1326. </channel>
  1327. </rss>`
  1328. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1329. if err != nil {
  1330. t.Fatal(err)
  1331. }
  1332. if len(feed.Entries[0].Tags) != 4 {
  1333. t.Errorf("Incorrect number of tags, got: %d", len(feed.Entries[0].Tags))
  1334. }
  1335. expected := []string{"Society & Culture", "Documentary", "Health", "Mental Health"}
  1336. result := feed.Entries[0].Tags
  1337. for i, tag := range result {
  1338. if tag != expected[i] {
  1339. t.Errorf("Incorrect tag, got: %q", tag)
  1340. }
  1341. }
  1342. }
  1343. func TestParseFeedWithGooglePlayCategory(t *testing.T) {
  1344. data := `<?xml version="1.0" encoding="utf-8"?>
  1345. <rss xmlns:atom="http://www.w3.org/2005/Atom" xmlns:gplay="http://www.google.com/schemas/play-podcasts/1.0" version="2.0">
  1346. <channel>
  1347. <title>Example</title>
  1348. <link>https://example.org/</link>
  1349. <gplay:category text="Art"></gplay:category>
  1350. <item>
  1351. <title>Test</title>
  1352. <link>https://example.org/item</link>
  1353. </item>
  1354. </channel>
  1355. </rss>`
  1356. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1357. if err != nil {
  1358. t.Fatal(err)
  1359. }
  1360. if len(feed.Entries[0].Tags) != 1 {
  1361. t.Errorf("Incorrect number of tags, got: %d", len(feed.Entries[0].Tags))
  1362. }
  1363. expected := []string{"Art"}
  1364. result := feed.Entries[0].Tags
  1365. for i, tag := range result {
  1366. if tag != expected[i] {
  1367. t.Errorf("Incorrect tag, got: %q", tag)
  1368. }
  1369. }
  1370. }
  1371. func TestParseFeedWithTTLField(t *testing.T) {
  1372. data := `<?xml version="1.0" encoding="utf-8"?>
  1373. <rss version="2.0">
  1374. <channel>
  1375. <title>Example</title>
  1376. <link>https://example.org/</link>
  1377. <ttl>60</ttl>
  1378. <item>
  1379. <title>Test</title>
  1380. <link>https://example.org/item</link>
  1381. </item>
  1382. </channel>
  1383. </rss>`
  1384. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1385. if err != nil {
  1386. t.Fatal(err)
  1387. }
  1388. if feed.TTL != 60 {
  1389. t.Errorf("Incorrect TTL, got: %d", feed.TTL)
  1390. }
  1391. }
  1392. func TestParseFeedWithIncorrectTTLValue(t *testing.T) {
  1393. data := `<?xml version="1.0" encoding="utf-8"?>
  1394. <rss version="2.0">
  1395. <channel>
  1396. <title>Example</title>
  1397. <link>https://example.org/</link>
  1398. <ttl>invalid</ttl>
  1399. <item>
  1400. <title>Test</title>
  1401. <link>https://example.org/item</link>
  1402. </item>
  1403. </channel>
  1404. </rss>`
  1405. feed, err := Parse("https://example.org/", bytes.NewReader([]byte(data)))
  1406. if err != nil {
  1407. t.Fatal(err)
  1408. }
  1409. if feed.TTL != 0 {
  1410. t.Errorf("Incorrect TTL, got: %d", feed.TTL)
  1411. }
  1412. }