Frederic Guillot 28804ca541 Update PicoFeed
2015-07-19 11:19:26 -04:00

311 lines
15 KiB
PHP
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<?php
namespace PicoFeed\Parser;
use PHPUnit_Framework_TestCase;
class Rss20ParserTest extends PHPUnit_Framework_TestCase
{
/**
* @expectedException PicoFeed\Parser\MalformedXmlException
*/
public function testBadInput()
{
$parser = new Rss20('boo');
$parser->execute();
}
public function testGetItemsTree()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertCount(4, $feed->items);
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_feed.xml'));
$feed = $parser->execute();
$this->assertEquals(array(), $feed->items);
}
public function testFindFeedTitle()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('литература на русском языке, либо написанная русскими авторами', $feed->getTitle());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_fallback_on_invalid_feed_values.xml'));
$feed = $parser->execute();
$this->assertEquals('https://en.wikipedia.org/wiki/Category:Russian-language_literature', $feed->getTitle());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_channel.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getTitle());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_feed.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getTitle());
}
public function testFindFeedDescription()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals("Зародилась во второй половине X века, однако до XIX века,\nкогда начался её «золотой век», была практически неизвестна\nв мире.", $feed->getDescription());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_channel.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getDescription());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_feed.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getDescription());
}
public function testFindFeedLogo()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('https://ru.wikipedia.org/static/images/project-logos/ruwiki.png', $feed->getLogo());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_channel.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getLogo());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_feed.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getLogo());
}
public function testFindFeedIcon()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getIcon());
}
public function testFindFeedUrl()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getFeedUrl());
}
public function testFindSiteUrl()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('https://en.wikipedia.org/wiki/Category:Russian-language_literature', $feed->getSiteUrl());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_extra.xml'), '', 'https://feeds.wikipedia.org/category/Russian-language_literature.xml'); // relative url
$feed = $parser->execute();
$this->assertEquals('https://feeds.wikipedia.org/wiki/Category:Russian-language_literature', $feed->getSiteUrl());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_channel.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getSiteUrl());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_feed.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getSiteUrl());
}
public function testFindFeedId()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('https://en.wikipedia.org/wiki/Category:Russian-language_literature', $feed->getId());
}
public function testFindFeedDate()
{
// pubDate
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals(1433451900, $feed->getDate()->getTimestamp());
// lastBuildDate
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_extra.xml'));
$feed = $parser->execute();
$this->assertEquals(1433451900, $feed->getDate()->getTimestamp());
// prefer most recent date and not a particular date element
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_element_preference.xml'));
$feed = $parser->execute();
$this->assertEquals(1433455500, $feed->getDate()->getTimestamp());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_channel.xml'));
$feed = $parser->execute();
$this->assertEquals(time(), $feed->getDate()->getTimestamp(), '', 1);
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_feed.xml'));
$feed = $parser->execute();
$this->assertEquals(time(), $feed->getDate()->getTimestamp(), '', 1);
}
public function testFindFeedLanguage()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('ru', $feed->getLanguage());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_channel.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getTitle());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_feed.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->getTitle());
}
public function testFindItemId()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml')); // <guid>
$feed = $parser->execute();
$this->assertEquals('06e53052cd17cdfb264d9c37d495cc3746ac43f79488c7ce67894e718f674bd5', $feed->items[1]->getId());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml')); // alternate generation
$feed = $parser->execute();
$this->assertEquals('eb6f2d388a77e1f7d067a924970622d630031365fd444abe776d974d95b21990', $feed->items[0]->getId());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_item.xml'));
$feed = $parser->execute();
$this->assertEquals('e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855', $feed->items[0]->getId());
}
public function testFindItemUrl()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('https://en.wikipedia.org/wiki/War_and_Peace', $feed->items[0]->getUrl()); // <rss:link>
$this->assertEquals('https://en.wikipedia.org/wiki/Crime_and_Punishment', $feed->items[1]->getUrl()); // <atom:link>
$this->assertEquals('https://en.wikipedia.org/wiki/Doctor_Zhivago_(novel)', $feed->items[2]->getUrl()); // <feedburner:origLink>
$this->assertEquals('https://guid.wikipedia.org/wiki/A_Hero_of_Our_Time', $feed->items[3]->getUrl()); // <guid>
// relative urls
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_extra.xml'), '', 'https://feeds.wikipedia.org/category/Russian-language_literature.xml');
$feed = $parser->execute();
$this->assertEquals('https://feeds.wikipedia.org/wiki/War_and_Peace', $feed->items[0]->getUrl()); // <rss:link>
$this->assertEquals('https://feeds.wikipedia.org/wiki/Crime_and_Punishment', $feed->items[1]->getUrl()); // <atom:link>
$this->assertEquals('https://feeds.wikipedia.org/wiki/Doctor_Zhivago_(novel)', $feed->items[2]->getUrl()); // <feedburner:origLink>
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_element_preference.xml'));
$feed = $parser->execute();
$this->assertEquals('https://en.wikipedia.org/wiki/War_and_Peace', $feed->items[0]->getUrl()); // <feedburner:origLink> is preferred over <rss:link>, <atom:link>, <guid>
$this->assertEquals('https://en.wikipedia.org/wiki/Crime_and_Punishment', $feed->items[1]->getUrl()); // <rss:link> is preferred over <atom:link>, <guid>
$this->assertEquals('https://en.wikipedia.org/wiki/Doctor_Zhivago_(novel)', $feed->items[2]->getUrl()); // <atom:link> is preferred over <guid>
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_fallback_on_invalid_item_values.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->items[0]->getUrl()); // <guid> is invalid URI
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_item.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->items[0]->getUrl());
}
public function testFindItemTitle()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('Война и мир', $feed->items[0]->getTitle());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_fallback_on_invalid_item_values.xml'));
$feed = $parser->execute();
$this->assertEquals('https://en.wikipedia.org/wiki/Doctor_Zhivago_(novel)', $feed->items[2]->getTitle());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_item.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->items[0]->getTitle());
}
public function testFindItemDate()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals(1433451720, $feed->items[0]->getDate()->getTimestamp()); // item date
$this->assertEquals(1433451900, $feed->items[1]->getDate()->getTimestamp()); // fallback to feed date
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_item.xml'));
$feed = $parser->execute();
$this->assertEquals(time(), $feed->items[0]->getDate()->getTimestamp(), 1);
}
public function testFindItemLanguage()
{
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('bg', $feed->items[0]->getLanguage()); // item language
$this->assertEquals('ru', $feed->items[1]->getLanguage()); // fallback to feed language
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_item.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->items[0]->getLanguage());
}
public function testFindItemAuthor()
{
// items[0] === item author
// items[1] === feed author via empty fallback (channel/managingEditor)
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('Лев Николаевич Толсто́й', $feed->items[0]->getAuthor());
$this->assertEquals('Вики педии - свободной энциклопедии', $feed->items[1]->getAuthor());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_dc.xml'));
$feed = $parser->execute();
$this->assertEquals('Лев Николаевич Толсто́й', $feed->items[0]->getAuthor());
$this->assertEquals('Вики педии - свободной энциклопедии', $feed->items[1]->getAuthor());
// <dc:creator> is preferred over <author>
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_element_preference.xml'));
$feed = $parser->execute();
$this->assertEquals('Лев Николаевич Толсто́й', $feed->items[0]->getAuthor());
$this->assertEquals('Вики педии - свободной энциклопедии', $feed->items[1]->getAuthor());
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_item.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->items[0]->getAuthor());
}
public function testFindItemContent()
{
// items[0] === <description>
// items[1] === <content:encoded>
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$parser->disableContentFiltering();
$feed = $parser->execute();
$this->assertTrue(strpos($feed->items[0]->getContent(), "В наброске предисловия к «Войне и миру» Толстой\nписал, что в 1856 г.") === 0);
$this->assertTrue(strpos($feed->items[1]->getContent(), "<h1>\nИстория создания\n</h1>\n<p>\nОсенью \n<a href=\"/wiki/1865_%D0%B3%D0%BE%D0%B4\"") === 0);
// <content:encoding> is preferred over <description>
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_element_preference.xml'));
$parser->disableContentFiltering();
$feed = $parser->execute();
$this->assertTrue(strpos($feed->items[1]->getContent(), "<h1>\nИстория создания\n</h1>\n<p>\nОсенью \n<a href=\"/wiki/1865_%D0%B3%D0%BE%D0%B4\"") === 0);
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_fallback_on_invalid_item_values.xml'));
$parser->disableContentFiltering();
$feed = $parser->execute();
$this->assertTrue(strpos($feed->items[1]->getContent(), "Осенью 1865 года, потеряв все свои\nденьги в казино") === 0); // <content:encoded> => <description>
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_item.xml'));
$parser->disableContentFiltering();
$feed = $parser->execute();
$this->assertEquals('', $feed->items[0]->getContent());
}
public function testFindItemEnclosure()
{
// Test tests covers the preference of <feedburner:origEnclosureLink> over <enclosure> as well
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20.xml'));
$feed = $parser->execute();
$this->assertEquals('https://upload.wikimedia.org/wikipedia/commons/4/41/War-and-peace_1873.gif', $feed->items[0]->getEnclosureUrl()); // <enclosure>
$this->assertEquals('image/gif', $feed->items[0]->getEnclosureType());
$this->assertEquals('https://upload.wikimedia.org/wikipedia/commons/7/7b/Crime_and_Punishment-1.png', $feed->items[1]->getEnclosureUrl()); // <feedburner:origEnclosureLink>
$parser = new Rss20(file_get_contents('tests/fixtures/rss_20_empty_item.xml'));
$feed = $parser->execute();
$this->assertEquals('', $feed->items[0]->getEnclosureUrl());
$this->assertEquals('', $feed->items[0]->getEnclosureType());
}
}