Add new grabber rules

This commit is contained in:
Frédéric Guillot 2013-09-18 22:48:29 -04:00
parent 9e437c1a93
commit d29653f121
7 changed files with 78 additions and 2 deletions

View File

@ -278,6 +278,8 @@ It would be awesome for everybody :)
- Original theme By Frederic Guillot - Original theme By Frederic Guillot
- Midnight By Luca Marra - Midnight By Luca Marra
- Green by Maxime (aka EpocDotFr) - Green by Maxime (aka EpocDotFr)
- Bootstrap 3 (Light) By Silvus
- Bootswatch Cyborg By Silvus
### Coding standards for contributors ### Coding standards for contributors
@ -336,20 +338,25 @@ Don't forget to send a pull request or a ticket to share your contribution with
- *.blog.lemonde.fr - *.blog.lemonde.fr
- *.blog.nytimes.com - *.blog.nytimes.com
- *.nytimes.com - *.nytimes.com
- *.slate.com - *.slate.com
- *.theguardian.com
- *.wikipedia.org - *.wikipedia.org
- *.wired.com
- *.wsj.com - *.wsj.com
- github.com - github.com
- lifehacker.com - lifehacker.com
- plus.google.com
- rue89.com - rue89.com
- smallhousebliss.com - smallhousebliss.com
- techcrunch.com - techcrunch.com
- www.bbc.co.uk - www.bbc.co.uk
- www.businessweek.com
- www.cnn.com - www.cnn.com
- www.egscomics.com - www.egscomics.com
- www.forbes.com - www.forbes.com
- www.lemonde.fr - www.lemonde.fr
- www.lepoint.fr
- www.npr.org
- www.numerama.com - www.numerama.com
- www.slate.fr - www.slate.fr
- www.theguardian.com

View File

@ -5,5 +5,6 @@ return array(
'//div[@id="article-wrapper"]', '//div[@id="article-wrapper"]',
), ),
'strip' => array( 'strip' => array(
'//*[contains(@class, "promo")]',
), ),
); );

19
vendor/PicoFeed/Rules/.wired.com.php vendored Normal file
View File

@ -0,0 +1,19 @@
<?php
// Grabber rules for wired.com pages (vendor/PicoFeed/Rules/.wired.com.php).
// The file returns a single array; every 'body' and 'strip' entry is an XPath expression.
// NOTE(review): presumably 'body' selects the article content and 'strip' lists nodes
// to remove from it -- confirm against the grabber code that loads these rules.
return array(
// Sample article URL for this rule set (presumably used to try the rules out).
'test_url' => 'http://www.wired.com/gamelife/2013/09/ouya-free-the-games/',
'body' => array(
// Exact match: only a <div> whose class attribute is exactly "entry".
'//div[@class="entry"]',
),
'strip' => array(
// Inline scripts and stylesheets.
'//script',
'//style',
'//*[@id="linker_widget"]',
// contains() is a substring test, so these match any class attribute
// that includes the given text anywhere, not just a whole class token.
'//*[contains(@class, "bio")]',
'//*[contains(@class, "entry-footer")]',
'//*[contains(@class, "mobify_backtotop_link")]',
'//*[contains(@class, "gallery-navigation")]',
'//*[contains(@class, "gallery-thumbnail")]',
// Images whose URL contains "1x1" (presumably tracking pixels -- TODO confirm).
'//img[contains(@src, "1x1")]',
// Links whose target contains "creativecommons" (presumably license notices).
'//a[contains(@href, "creativecommons")]',
),
);

View File

@ -0,0 +1,7 @@
<?php
// Grabber rules for Google+ posts (the test URL below is on plus.google.com).
// The file returns a single array; the 'body' entry is an XPath expression.
// NOTE(review): presumably 'body' selects the post content -- confirm against
// the grabber code that loads these rules.
return array(
// Sample post URL for this rule set (presumably used to try the rules out).
'test_url' => 'https://plus.google.com/+LarryPage/posts/Lh8SKC6sED1',
'body' => array(
// Direct <div> children of the role="article" container whose class contains "eE".
// NOTE(review): "eE" looks like a generated class name and contains() is a
// substring test, so this selector may be fragile -- verify on live pages.
'//div[@role="article"]/div[contains(@class, "eE")]',
),
);

View File

@ -0,0 +1,11 @@
<?php
// Grabber rules for Businessweek articles (the test URL below is on www.businessweek.com).
// The file returns a single array; every 'body' and 'strip' entry is an XPath expression.
// NOTE(review): presumably 'body' selects the article content and 'strip' lists nodes
// to remove from it -- confirm against the grabber code that loads these rules.
return array(
// Sample article URL for this rule set (presumably used to try the rules out).
'test_url' => 'http://www.businessweek.com/articles/2013-09-18/elon-musks-hyperloop-will-work-says-some-very-smart-software',
'body' => array(
// Two separate containers are listed: the lead graphic and the article text.
'//div[@id="lead_graphic"]',
'//div[@id="article_body"]',
),
'strip' => array(
// Any element whose class attribute contains "related_item" (substring match).
'//*[contains(@class, "related_item")]',
),
);

View File

@ -0,0 +1,16 @@
<?php
// Grabber rules for Le Point articles (the test URL below is on www.lepoint.fr).
// The file returns a single array; every 'body' and 'strip' entry is an XPath expression.
// NOTE(review): presumably 'body' selects the article content and 'strip' lists nodes
// to remove from it -- confirm against the grabber code that loads these rules.
return array(
// Sample article URL for this rule set (presumably used to try the rules out).
'test_url' => 'http://www.lepoint.fr/c-est-arrive-aujourd-hui/19-septembre-1783-pour-la-premiere-fois-un-mouton-un-canard-et-un-coq-s-envoient-en-l-air-devant-louis-xvi-18-09-2012-1507704_494.php',
'body' => array(
// Every <article> element in the document.
'//article',
),
'strip' => array(
// Inline scripts and stylesheets.
'//script',
'//style',
// contains() is a substring test on the whole class attribute.
'//*[contains(@class, "info_article")]',
'//*[contains(@class, "fildariane_titre")]',
'//*[contains(@class, "entete2_article")]',
'//*[contains(@class, "signature_article")]',
// Any element whose id contains "share" anywhere (substring match on @id).
'//*[contains(@id, "share")]',
)
);

15
vendor/PicoFeed/Rules/www.npr.org.php vendored Normal file
View File

@ -0,0 +1,15 @@
<?php
// Grabber rules for NPR stories (vendor/PicoFeed/Rules/www.npr.org.php).
// The file returns a single array; every 'body' and 'strip' entry is an XPath expression.
// NOTE(review): presumably 'body' selects the article content and 'strip' lists nodes
// to remove from it -- confirm against the grabber code that loads these rules.
return array(
// Sample story URL for this rule set (presumably used to try the rules out).
'test_url' => 'http://www.npr.org/blogs/thesalt/2013/09/17/223345977/auto-brewery-syndrome-apparently-you-can-make-beer-in-your-gut',
'body' => array(
'//div[@id="storytext"]',
),
'strip' => array(
// Inline scripts and stylesheets.
'//script',
'//style',
// These three compare the full class attribute: an element matches only when
// its class string is exactly the quoted value (e.g. exactly "bucket img").
'//*[@class="bucket img"]',
'//*[@class="creditwrap"]',
'//*[@class="captionwrap"]',
// Substring match, unlike the exact comparisons above.
'//*[contains(@class, "enlargebtn")]',
),
);