<?php

// Content-grabber rule set; the target site (thenewslens.com) is taken from
// the test_url below.
// NOTE(review): the code that consumes this array is not visible from this
// file, so the remarks on how each key is used are inferred from the key
// names and should be confirmed against the consumer.
return array(
    'grabber' => array(
        // Key is a regular expression delimited by `%`; `.*` matches any
        // string, so this single rule presumably applies to every URL of
        // the site.
        '%.*%' => array(
            // Sample article URL, presumably used to exercise this rule.
            'test_url' => 'http://international.thenewslens.com/post/255032/',

            // XPath expressions that presumably select the article content
            // to keep.
            'body' => array(
                '//div[@class="article-section"]',
            ),

            // XPath expressions that presumably select nodes to remove from
            // the selected content.
            'strip' => array(
                // contains() is a substring test, so this matches any div
                // whose class attribute contains "ad-" anywhere in it.
                '//div[contains(@class,"ad-")]',
                '//div[@class="article-title-box"]',
                '//div[@class="function-box"]',
                // Matches every <span> that is a direct child of a <p>.
                '//p/span',
                '//aside',
                '//footer',
                '//div[@class="article-infoBot-box"]',
                '//div[contains(@class,"standard-container")]',
            ),
        ),
    ),
);