2014-12-23 21:28:26 -05:00
< ? php
2015-07-19 11:19:26 -04:00
2014-12-23 21:28:26 -05:00
namespace PicoFeed\Parser ;
use PHPUnit_Framework_TestCase ;
class Rss10ParserTest extends PHPUnit_Framework_TestCase
{
/**
* @ expectedException PicoFeed\Parser\MalformedXmlException
*/
public function testBadInput ()
{
$parser = new Rss10 ( 'boo' );
$parser -> execute ();
}
2015-07-19 11:19:26 -04:00
public function testGetItemsTree ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertCount ( 2 , $feed -> items );
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_no_default_namespace.xml' ));
$feed = $parser -> execute ();
$this -> assertCount ( 3 , $feed -> items );
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_prefixed.xml' ));
$feed = $parser -> execute ();
$this -> assertCount ( 1 , $feed -> items );
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_feed.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( array (), $feed -> items );
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
public function testFindFeedTitle ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'литература на русском языке, либо написанная русскими авторами' , $feed -> getTitle ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_no_default_namespace.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'литература на русском языке, либо написанная русскими авторами' , $feed -> getTitle ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_prefixed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'литература на русском языке, либо написанная русскими авторами' , $feed -> getTitle ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_fallback_on_invalid_feed_values.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/Category:Russian-language_literature' , $feed -> getTitle ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_channel.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getTitle ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_feed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getTitle ());
}
public function testFindFeedDescription ()
{
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( " Зародилась во второй половине X века, однако до XIX века, \n когда начался её «золотой век», была практически неизвестна \n в мире. " , $feed -> getDescription ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_no_default_namespace.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( " Зародилась во второй половине X века, однако до XIX века, \n когда начался её «золотой век», была практически неизвестна \n в мире. " , $feed -> getDescription ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_prefixed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( " Зародилась во второй половине X века, однако до XIX века, \n когда начался её «золотой век», была практически неизвестна \n в мире. " , $feed -> getDescription ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_channel.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getDescription ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_feed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getDescription ());
}
public function testFindFeedLogo ()
{
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://ru.wikipedia.org/static/images/project-logos/ruwiki.png' , $feed -> getLogo ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_no_default_namespace.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://ru.wikipedia.org/static/images/project-logos/ruwiki.png' , $feed -> getLogo ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_prefixed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://ru.wikipedia.org/static/images/project-logos/ruwiki.png' , $feed -> getLogo ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_channel.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getLogo ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_feed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getLogo ());
}
public function testFindFeedIcon ()
{
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getIcon ());
}
public function testFindFeedUrl ()
{
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getFeedUrl ());
}
2015-07-19 11:19:26 -04:00
public function testFindSiteUrl ()
{
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/Category:Russian-language_literature' , $feed -> getSiteUrl ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_extra.xml' ), '' , 'https://feeds.wikipedia.org/category/Russian-language_literature.xml' ); // relative url
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://feeds.wikipedia.org/wiki/Category:Russian-language_literature' , $feed -> getSiteUrl ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_no_default_namespace.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/Category:Russian-language_literature' , $feed -> getSiteUrl ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_prefixed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/Category:Russian-language_literature' , $feed -> getSiteUrl ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_channel.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getSiteUrl ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_feed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getSiteUrl ());
}
public function testFindFeedId ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/Category:Russian-language_literature' , $feed -> getId ());
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
public function testFindFeedDate ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 1433451900 , $feed -> getDate () -> getTimestamp ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_no_default_namespace.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 1433451900 , $feed -> getDate () -> getTimestamp ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_prefixed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 1433451900 , $feed -> getDate () -> getTimestamp ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_channel.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( time (), $feed -> getDate () -> getTimestamp (), '' , 1 );
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_feed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( time (), $feed -> getDate () -> getTimestamp (), '' , 1 );
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
public function testFindFeedLanguage ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'ru' , $feed -> getLanguage ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_no_default_namespace.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'ru' , $feed -> getLanguage ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_prefixed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'ru' , $feed -> getLanguage ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_channel.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( '' , $feed -> getTitle ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_feed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> getTitle ());
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
public function testFindItemId ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'eb6f2d388a77e1f7d067a924970622d630031365fd444abe776d974d95b21990' , $feed -> items [ 0 ] -> getId ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_item.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( 'e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855' , $feed -> items [ 0 ] -> getId ());
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
public function testFindItemUrl ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/War_and_Peace' , $feed -> items [ 0 ] -> getUrl ()); // <rss:link>
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/Crime_and_Punishment' , $feed -> items [ 1 ] -> getUrl ()); // <feedburner:origLink>
// relative urls
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_extra.xml' ), '' , 'https://feeds.wikipedia.org/category/Russian-language_literature.xml' );
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( 'https://feeds.wikipedia.org/wiki/War_and_Peace' , $feed -> items [ 0 ] -> getUrl ()); // <rss:link>
$this -> assertEquals ( 'https://feeds.wikipedia.org/wiki/Crime_and_Punishment' , $feed -> items [ 1 ] -> getUrl ()); // <feedburner:origLink>
2014-12-23 21:28:26 -05:00
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_no_default_namespace.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/War_and_Peace' , $feed -> items [ 0 ] -> getUrl ()); // <rss:link>
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_prefixed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/War_and_Peace' , $feed -> items [ 0 ] -> getUrl ()); // <rss:link>
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_element_preference.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/War_and_Peace' , $feed -> items [ 0 ] -> getUrl ()); // <feedburner:origLink> is preferred over <rss:link>
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_item.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> items [ 0 ] -> getUrl ());
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
public function testFindItemTitle ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( 'Война и мир' , $feed -> items [ 0 ] -> getTitle ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_no_default_namespace.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'Война и мир' , $feed -> items [ 0 ] -> getTitle ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_prefixed.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'Война и мир' , $feed -> items [ 0 ] -> getTitle ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_fallback_on_invalid_item_values.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'https://en.wikipedia.org/wiki/Doctor_Zhivago_(novel)' , $feed -> items [ 2 ] -> getTitle ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_item.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> items [ 0 ] -> getTitle ());
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
/*
* TODO : Add test of feed date fallback
*/
public function testFindItemDate ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( 1433451720 , $feed -> items [ 0 ] -> getDate () -> getTimestamp ()); // item date
$this -> assertEquals ( 1433451900 , $feed -> items [ 1 ] -> getDate () -> getTimestamp ()); // fallback to feed date
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_item.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( time (), $feed -> items [ 0 ] -> getDate () -> getTimestamp (), 1 );
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
public function testFindItemLanguage ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( 'bg' , $feed -> items [ 0 ] -> getLanguage ()); // item language
$this -> assertEquals ( 'ru' , $feed -> items [ 1 ] -> getLanguage ()); // fallback to feed language
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_item.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( '' , $feed -> items [ 0 ] -> getAuthor ());
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
public function testFindItemAuthor ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
// items[0] === item author
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( 'Лев Николаевич Толсто́й' , $feed -> items [ 0 ] -> getAuthor ());
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_item.xml' ));
$feed = $parser -> execute ();
$this -> assertEquals ( '' , $feed -> items [ 0 ] -> getAuthor ());
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
public function testFindItemContent ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
// items[0] === <description>
// items[1] === <content:encoded>
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
$parser -> disableContentFiltering ();
$feed = $parser -> execute ();
$this -> assertTrue ( strpos ( $feed -> items [ 0 ] -> getContent (), " В наброске предисловия к «Войне и миру» Толстой\n писал, что в 1856 г . " ) === 0 );
$this -> assertTrue ( strpos ( $feed -> items [ 1 ] -> getContent (), " <h1> \n История создания \n </h1> \n <p> \n Осенью \n <a href= \" /wiki/1865_%D0%B3%D0%BE%D0%B4 \" " ) === 0 );
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_no_default_namespace.xml' ));
$parser -> disableContentFiltering ();
$feed = $parser -> execute ();
$this -> assertTrue ( strpos ( $feed -> items [ 0 ] -> getContent (), " В наброске предисловия к «Войне и миру» Толстой\n писал, что в 1856 г . " ) === 0 );
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_prefixed.xml' ));
$parser -> disableContentFiltering ();
$feed = $parser -> execute ();
$this -> assertTrue ( strpos ( $feed -> items [ 0 ] -> getContent (), " В наброске предисловия к «Войне и миру» Толстой\n писал, что в 1856 г . " ) === 0 );
// <content:encoding> is preferred over <description>
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_element_preference.xml' ));
$parser -> disableContentFiltering ();
$feed = $parser -> execute ();
$this -> assertTrue ( strpos ( $feed -> items [ 1 ] -> getContent (), " <h1> \n История создания \n </h1> \n <p> \n Осенью \n <a href= \" /wiki/1865_%D0%B3%D0%BE%D0%B4 \" " ) === 0 );
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_fallback_on_invalid_item_values.xml' ));
$parser -> disableContentFiltering ();
$feed = $parser -> execute ();
$this -> assertTrue ( strpos ( $feed -> items [ 1 ] -> getContent (), " Осенью 1865 года, потеряв все свои \n деньги в казино " ) === 0 ); // <content:encoded> => <description>
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10_empty_item.xml' ));
$parser -> disableContentFiltering ();
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( '' , $feed -> items [ 0 ] -> getContent ());
2014-12-23 21:28:26 -05:00
}
2015-07-19 11:19:26 -04:00
public function testFindItemEnclosure ()
2014-12-23 21:28:26 -05:00
{
2015-07-19 11:19:26 -04:00
$parser = new Rss10 ( file_get_contents ( 'tests/fixtures/rss_10.xml' ));
2014-12-23 21:28:26 -05:00
$feed = $parser -> execute ();
2015-07-19 11:19:26 -04:00
$this -> assertEquals ( '' , $feed -> items [ 0 ] -> getEnclosureUrl ());
$this -> assertEquals ( '' , $feed -> items [ 0 ] -> getEnclosureType ());
2014-12-23 21:28:26 -05:00
}
}