<?php

/*
 * Grabber rule set, returned as a plain nested array to whatever includes
 * this file. The file declares no symbols and has no side effects.
 *
 * Shape:
 *   'grabber' => array(
 *       <pattern> => array(
 *           'test_url' => string,          // sample page (a BBC News article)
 *           'body'     => list of XPath expressions,
 *           'strip'    => list of XPath expressions,
 *       ),
 *   )
 *
 * NOTE(review): the meaning of each key is inferred from its name only.
 * 'body' presumably selects the article container and 'strip' presumably
 * lists nodes to drop from it; confirm against the code that loads this file.
 *
 * Long array() syntax is kept on purpose so the file parses on the same PHP
 * versions as before.
 */
return array(
    'grabber' => array(
        // '%'-delimited pattern whose `.*` matches any input.
        // NOTE(review): presumably matched against the URL path; confirm.
        '%.*%' => array(
            'test_url' => 'http://www.bbc.co.uk/news/world-middle-east-23911833',

            // Candidate content containers. The first entry is an XPath
            // union (`|`) of two alternative <div> selectors.
            'body' => array(
                '//div[@class="story-body__inner"] | //div[@class="article"]',
                '//div[@class="indPost"]',
            ),

            // Selectors using @class="..." require the class attribute to
            // equal that exact string; the contains(@class, ...) forms match
            // any class attribute that includes the given substring.
            'strip' => array(
                '//form',
                '//div[@id="headline"]',
                '//*[@class="warning"]',
                '//span[@class="off-screen"]',
                '//span[@class="story-image-copyright"]',
                '//ul[@class="story-body__unordered-list"]',
                '//div[@class="ad_wrapper"]',
                '//div[@id="article-sidebar"]',
                '//div[@class="data-table-outer"]',
                '//*[@class="story-date"]',
                '//*[@class="story-header"]',
                '//figure[contains(@class,"has-caption")]',
                '//*[@class="story-related"]',
                '//*[contains(@class, "byline")]',
                '//p[contains(@class, "media-message")]',
                '//*[contains(@class, "story-feature")]',
                '//*[@id="video-carousel-container"]',
                '//*[@id="also-related-links"]',
                '//*[contains(@class, "share") or contains(@class, "hidden") or contains(@class, "hyper")]',
            ),
        ),
    ),
);