parser_test.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482
  1. // Copyright 2017 Frédéric Guillot. All rights reserved.
  2. // Use of this source code is governed by the Apache 2.0
  3. // license that can be found in the LICENSE file.
  4. package atom
  5. import (
  6. "bytes"
  7. "testing"
  8. "time"
  9. )
  10. func TestParseAtomSample(t *testing.T) {
  11. data := `<?xml version="1.0" encoding="utf-8"?>
  12. <feed xmlns="http://www.w3.org/2005/Atom">
  13. <title>Example Feed</title>
  14. <link href="http://example.org/"/>
  15. <updated>2003-12-13T18:30:02Z</updated>
  16. <author>
  17. <name>John Doe</name>
  18. </author>
  19. <id>urn:uuid:60a76c80-d399-11d9-b93C-0003939e0af6</id>
  20. <entry>
  21. <title>Atom-Powered Robots Run Amok</title>
  22. <link href="http://example.org/2003/12/13/atom03"/>
  23. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  24. <updated>2003-12-13T18:30:02Z</updated>
  25. <summary>Some text.</summary>
  26. </entry>
  27. </feed>`
  28. feed, err := Parse(bytes.NewBufferString(data))
  29. if err != nil {
  30. t.Error(err)
  31. }
  32. if feed.Title != "Example Feed" {
  33. t.Errorf("Incorrect title, got: %s", feed.Title)
  34. }
  35. if feed.FeedURL != "" {
  36. t.Errorf("Incorrect feed URL, got: %s", feed.FeedURL)
  37. }
  38. if feed.SiteURL != "http://example.org/" {
  39. t.Errorf("Incorrect site URL, got: %s", feed.SiteURL)
  40. }
  41. if len(feed.Entries) != 1 {
  42. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  43. }
  44. if !feed.Entries[0].Date.Equal(time.Date(2003, time.December, 13, 18, 30, 2, 0, time.UTC)) {
  45. t.Errorf("Incorrect entry date, got: %v", feed.Entries[0].Date)
  46. }
  47. if feed.Entries[0].Hash != "3841e5cf232f5111fc5841e9eba5f4b26d95e7d7124902e0f7272729d65601a6" {
  48. t.Errorf("Incorrect entry hash, got: %s", feed.Entries[0].Hash)
  49. }
  50. if feed.Entries[0].URL != "http://example.org/2003/12/13/atom03" {
  51. t.Errorf("Incorrect entry URL, got: %s", feed.Entries[0].URL)
  52. }
  53. if feed.Entries[0].Title != "Atom-Powered Robots Run Amok" {
  54. t.Errorf("Incorrect entry title, got: %s", feed.Entries[0].Title)
  55. }
  56. if feed.Entries[0].Content != "Some text." {
  57. t.Errorf("Incorrect entry content, got: %s", feed.Entries[0].Content)
  58. }
  59. if feed.Entries[0].Author != "John Doe" {
  60. t.Errorf("Incorrect entry author, got: %s", feed.Entries[0].Author)
  61. }
  62. }
  63. func TestParseFeedWithoutTitle(t *testing.T) {
  64. data := `<?xml version="1.0" encoding="utf-8"?>
  65. <feed xmlns="http://www.w3.org/2005/Atom">
  66. <link rel="alternate" type="text/html" href="https://example.org/"/>
  67. <link rel="self" type="application/atom+xml" href="https://example.org/feed"/>
  68. <updated>2003-12-13T18:30:02Z</updated>
  69. </feed>`
  70. feed, err := Parse(bytes.NewBufferString(data))
  71. if err != nil {
  72. t.Error(err)
  73. }
  74. if feed.Title != "https://example.org/" {
  75. t.Errorf("Incorrect feed title, got: %s", feed.Title)
  76. }
  77. }
  78. func TestParseEntryWithoutTitle(t *testing.T) {
  79. data := `<?xml version="1.0" encoding="utf-8"?>
  80. <feed xmlns="http://www.w3.org/2005/Atom">
  81. <title>Example Feed</title>
  82. <link href="http://example.org/"/>
  83. <updated>2003-12-13T18:30:02Z</updated>
  84. <author>
  85. <name>John Doe</name>
  86. </author>
  87. <id>urn:uuid:60a76c80-d399-11d9-b93C-0003939e0af6</id>
  88. <entry>
  89. <link href="http://example.org/2003/12/13/atom03"/>
  90. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  91. <updated>2003-12-13T18:30:02Z</updated>
  92. <summary>Some text.</summary>
  93. </entry>
  94. </feed>`
  95. feed, err := Parse(bytes.NewBufferString(data))
  96. if err != nil {
  97. t.Error(err)
  98. }
  99. if feed.Entries[0].Title != "http://example.org/2003/12/13/atom03" {
  100. t.Errorf("Incorrect entry title, got: %s", feed.Entries[0].Title)
  101. }
  102. }
  103. func TestParseFeedURL(t *testing.T) {
  104. data := `<?xml version="1.0" encoding="utf-8"?>
  105. <feed xmlns="http://www.w3.org/2005/Atom">
  106. <title>Example Feed</title>
  107. <link rel="alternate" type="text/html" href="https://example.org/"/>
  108. <link rel="self" type="application/atom+xml" href="https://example.org/feed"/>
  109. <updated>2003-12-13T18:30:02Z</updated>
  110. </feed>`
  111. feed, err := Parse(bytes.NewBufferString(data))
  112. if err != nil {
  113. t.Error(err)
  114. }
  115. if feed.SiteURL != "https://example.org/" {
  116. t.Errorf("Incorrect site URL, got: %s", feed.SiteURL)
  117. }
  118. if feed.FeedURL != "https://example.org/feed" {
  119. t.Errorf("Incorrect feed URL, got: %s", feed.FeedURL)
  120. }
  121. }
  122. func TestParseEntryWithRelativeURL(t *testing.T) {
  123. data := `<?xml version="1.0" encoding="utf-8"?>
  124. <feed xmlns="http://www.w3.org/2005/Atom">
  125. <title>Example Feed</title>
  126. <link href="http://example.org/"/>
  127. <entry>
  128. <title>Test</title>
  129. <link href="something.html"/>
  130. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  131. <updated>2003-12-13T18:30:02Z</updated>
  132. <summary>Some text.</summary>
  133. </entry>
  134. </feed>`
  135. feed, err := Parse(bytes.NewBufferString(data))
  136. if err != nil {
  137. t.Error(err)
  138. }
  139. if feed.Entries[0].URL != "http://example.org/something.html" {
  140. t.Errorf("Incorrect entry URL, got: %s", feed.Entries[0].URL)
  141. }
  142. }
  143. func TestParseEntryTitleWithWhitespaces(t *testing.T) {
  144. data := `<?xml version="1.0" encoding="utf-8"?>
  145. <feed xmlns="http://www.w3.org/2005/Atom">
  146. <title>Example Feed</title>
  147. <link href="http://example.org/"/>
  148. <entry>
  149. <title>
  150. Some Title
  151. </title>
  152. <link href="http://example.org/2003/12/13/atom03"/>
  153. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  154. <updated>2003-12-13T18:30:02Z</updated>
  155. <summary>Some text.</summary>
  156. </entry>
  157. </feed>`
  158. feed, err := Parse(bytes.NewBufferString(data))
  159. if err != nil {
  160. t.Error(err)
  161. }
  162. if feed.Entries[0].Title != "Some Title" {
  163. t.Errorf("Incorrect entry title, got: %s", feed.Entries[0].Title)
  164. }
  165. }
  166. func TestParseEntryTitleWithHTMLAndCDATA(t *testing.T) {
  167. data := `<?xml version="1.0" encoding="utf-8"?>
  168. <feed xmlns="http://www.w3.org/2005/Atom">
  169. <title>Example Feed</title>
  170. <link href="http://example.org/"/>
  171. <entry>
  172. <title type="html"><![CDATA[Test &#8220;Test&#8221;]]></title>
  173. <link href="http://example.org/2003/12/13/atom03"/>
  174. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  175. <updated>2003-12-13T18:30:02Z</updated>
  176. <summary>Some text.</summary>
  177. </entry>
  178. </feed>`
  179. feed, err := Parse(bytes.NewBufferString(data))
  180. if err != nil {
  181. t.Error(err)
  182. }
  183. if feed.Entries[0].Title != "Test “Test”" {
  184. t.Errorf("Incorrect entry title, got: %q", feed.Entries[0].Title)
  185. }
  186. }
  187. func TestParseEntryTitleWithHTML(t *testing.T) {
  188. data := `<?xml version="1.0" encoding="utf-8"?>
  189. <feed xmlns="http://www.w3.org/2005/Atom">
  190. <title>Example Feed</title>
  191. <link href="http://example.org/"/>
  192. <entry>
  193. <title type="html">&lt;code&gt;Test&lt;/code&gt; Test</title>
  194. <link href="http://example.org/2003/12/13/atom03"/>
  195. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  196. <updated>2003-12-13T18:30:02Z</updated>
  197. <summary>Some text.</summary>
  198. </entry>
  199. </feed>`
  200. feed, err := Parse(bytes.NewBufferString(data))
  201. if err != nil {
  202. t.Error(err)
  203. }
  204. if feed.Entries[0].Title != "Test Test" {
  205. t.Errorf("Incorrect entry title, got: %q", feed.Entries[0].Title)
  206. }
  207. }
  208. func TestParseEntryTitleWithXHTML(t *testing.T) {
  209. data := `<?xml version="1.0" encoding="utf-8"?>
  210. <feed xmlns="http://www.w3.org/2005/Atom">
  211. <title>Example Feed</title>
  212. <link href="http://example.org/"/>
  213. <entry>
  214. <title type="xhtml"><code>Test</code> Test</title>
  215. <link href="http://example.org/2003/12/13/atom03"/>
  216. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  217. <updated>2003-12-13T18:30:02Z</updated>
  218. <summary>Some text.</summary>
  219. </entry>
  220. </feed>`
  221. feed, err := Parse(bytes.NewBufferString(data))
  222. if err != nil {
  223. t.Error(err)
  224. }
  225. if feed.Entries[0].Title != "Test Test" {
  226. t.Errorf("Incorrect entry title, got: %q", feed.Entries[0].Title)
  227. }
  228. }
  229. func TestParseEntryWithAuthorName(t *testing.T) {
  230. data := `<?xml version="1.0" encoding="utf-8"?>
  231. <feed xmlns="http://www.w3.org/2005/Atom">
  232. <title>Example Feed</title>
  233. <link href="http://example.org/"/>
  234. <entry>
  235. <link href="http://example.org/2003/12/13/atom03"/>
  236. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  237. <updated>2003-12-13T18:30:02Z</updated>
  238. <summary>Some text.</summary>
  239. <author>
  240. <name>Me</name>
  241. <email>me@localhost</email>
  242. </author>
  243. </entry>
  244. </feed>`
  245. feed, err := Parse(bytes.NewBufferString(data))
  246. if err != nil {
  247. t.Error(err)
  248. }
  249. if feed.Entries[0].Author != "Me" {
  250. t.Errorf("Incorrect entry author, got: %s", feed.Entries[0].Author)
  251. }
  252. }
  253. func TestParseEntryWithoutAuthorName(t *testing.T) {
  254. data := `<?xml version="1.0" encoding="utf-8"?>
  255. <feed xmlns="http://www.w3.org/2005/Atom">
  256. <title>Example Feed</title>
  257. <link href="http://example.org/"/>
  258. <entry>
  259. <link href="http://example.org/2003/12/13/atom03"/>
  260. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  261. <updated>2003-12-13T18:30:02Z</updated>
  262. <summary>Some text.</summary>
  263. <author>
  264. <name/>
  265. <email>me@localhost</email>
  266. </author>
  267. </entry>
  268. </feed>`
  269. feed, err := Parse(bytes.NewBufferString(data))
  270. if err != nil {
  271. t.Error(err)
  272. }
  273. if feed.Entries[0].Author != "me@localhost" {
  274. t.Errorf("Incorrect entry author, got: %s", feed.Entries[0].Author)
  275. }
  276. }
  277. func TestParseEntryWithEnclosures(t *testing.T) {
  278. data := `<?xml version="1.0" encoding="utf-8"?>
  279. <feed xmlns="http://www.w3.org/2005/Atom">
  280. <id>http://www.example.org/myfeed</id>
  281. <title>My Podcast Feed</title>
  282. <updated>2005-07-15T12:00:00Z</updated>
  283. <author>
  284. <name>John Doe</name>
  285. </author>
  286. <link href="http://example.org" />
  287. <link rel="self" href="http://example.org/myfeed" />
  288. <entry>
  289. <id>http://www.example.org/entries/1</id>
  290. <title>Atom 1.0</title>
  291. <updated>2005-07-15T12:00:00Z</updated>
  292. <link href="http://www.example.org/entries/1" />
  293. <summary>An overview of Atom 1.0</summary>
  294. <link rel="enclosure"
  295. type="audio/mpeg"
  296. title="MP3"
  297. href="http://www.example.org/myaudiofile.mp3"
  298. length="1234" />
  299. <link rel="enclosure"
  300. type="application/x-bittorrent"
  301. title="BitTorrent"
  302. href="http://www.example.org/myaudiofile.torrent"
  303. length="4567" />
  304. <content type="xhtml">
  305. <div xmlns="http://www.w3.org/1999/xhtml">
  306. <h1>Show Notes</h1>
  307. <ul>
  308. <li>00:01:00 -- Introduction</li>
  309. <li>00:15:00 -- Talking about Atom 1.0</li>
  310. <li>00:30:00 -- Wrapping up</li>
  311. </ul>
  312. </div>
  313. </content>
  314. </entry>
  315. </feed>`
  316. feed, err := Parse(bytes.NewBufferString(data))
  317. if err != nil {
  318. t.Error(err)
  319. }
  320. if len(feed.Entries) != 1 {
  321. t.Errorf("Incorrect number of entries, got: %d", len(feed.Entries))
  322. }
  323. if feed.Entries[0].URL != "http://www.example.org/entries/1" {
  324. t.Errorf("Incorrect entry URL, got: %s", feed.Entries[0].URL)
  325. }
  326. if len(feed.Entries[0].Enclosures) != 2 {
  327. t.Errorf("Incorrect number of enclosures, got: %d", len(feed.Entries[0].Enclosures))
  328. }
  329. if feed.Entries[0].Enclosures[0].URL != "http://www.example.org/myaudiofile.mp3" {
  330. t.Errorf("Incorrect enclosure URL, got: %s", feed.Entries[0].Enclosures[0].URL)
  331. }
  332. if feed.Entries[0].Enclosures[0].MimeType != "audio/mpeg" {
  333. t.Errorf("Incorrect enclosure type, got: %s", feed.Entries[0].Enclosures[0].MimeType)
  334. }
  335. if feed.Entries[0].Enclosures[0].Size != 1234 {
  336. t.Errorf("Incorrect enclosure length, got: %d", feed.Entries[0].Enclosures[0].Size)
  337. }
  338. if feed.Entries[0].Enclosures[1].URL != "http://www.example.org/myaudiofile.torrent" {
  339. t.Errorf("Incorrect enclosure URL, got: %s", feed.Entries[0].Enclosures[1].URL)
  340. }
  341. if feed.Entries[0].Enclosures[1].MimeType != "application/x-bittorrent" {
  342. t.Errorf("Incorrect enclosure type, got: %s", feed.Entries[0].Enclosures[1].MimeType)
  343. }
  344. if feed.Entries[0].Enclosures[1].Size != 4567 {
  345. t.Errorf("Incorrect enclosure length, got: %d", feed.Entries[0].Enclosures[1].Size)
  346. }
  347. }
  348. func TestParseEntryWithPublished(t *testing.T) {
  349. data := `<?xml version="1.0" encoding="utf-8"?>
  350. <feed xmlns="http://www.w3.org/2005/Atom">
  351. <title>Example Feed</title>
  352. <link href="http://example.org/"/>
  353. <entry>
  354. <link href="http://example.org/2003/12/13/atom03"/>
  355. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  356. <published>2003-12-13T18:30:02Z</published>
  357. <summary>Some text.</summary>
  358. </entry>
  359. </feed>`
  360. feed, err := Parse(bytes.NewBufferString(data))
  361. if err != nil {
  362. t.Error(err)
  363. }
  364. if !feed.Entries[0].Date.Equal(time.Date(2003, time.December, 13, 18, 30, 2, 0, time.UTC)) {
  365. t.Errorf("Incorrect entry date, got: %v", feed.Entries[0].Date)
  366. }
  367. }
  368. func TestParseEntryWithPublishedAndUpdated(t *testing.T) {
  369. data := `<?xml version="1.0" encoding="utf-8"?>
  370. <feed xmlns="http://www.w3.org/2005/Atom">
  371. <title>Example Feed</title>
  372. <link href="http://example.org/"/>
  373. <entry>
  374. <link href="http://example.org/2003/12/13/atom03"/>
  375. <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id>
  376. <published>2002-11-12T18:30:02Z</published>
  377. <updated>2003-12-13T18:30:02Z</updated>
  378. <summary>Some text.</summary>
  379. </entry>
  380. </feed>`
  381. feed, err := Parse(bytes.NewBufferString(data))
  382. if err != nil {
  383. t.Error(err)
  384. }
  385. if !feed.Entries[0].Date.Equal(time.Date(2003, time.December, 13, 18, 30, 2, 0, time.UTC)) {
  386. t.Errorf("Incorrect entry date, got: %v", feed.Entries[0].Date)
  387. }
  388. }
  389. func TestParseInvalidXml(t *testing.T) {
  390. data := `garbage`
  391. _, err := Parse(bytes.NewBufferString(data))
  392. if err == nil {
  393. t.Error("Parse should returns an error")
  394. }
  395. }