2015-10-18 23:31:23 +02:00
|
|
|
<?php
|
2015-10-20 04:49:30 +02:00
|
|
|
|
2015-10-18 23:31:23 +02:00
|
|
|
// Content-grabber rule set. Including this file yields a single nested array;
// all keys and selector strings below are consumed verbatim by the caller.
return [
    'grabber' => [
        // The key is written as a '%'-delimited pattern. Presumably the consumer
        // matches it against the article URL/path, in which case '.*' applies
        // this rule to every page — TODO confirm against the rule loader.
        '%.*%' => [
            // Sample article URL; looks intended for exercising this rule — confirm.
            'test_url' => 'http://arstechnica.com/tech-policy/2015/09/judge-warners-2m-happy-birthday-copyright-is-bogus/',

            // XPath expressions, presumably selecting the nodes kept as article content.
            'body' => [
                '//header/h2',
                '//section[@id="article-guts"]',
                '//div[@class="superscroll-content show"]',
                '//div[@class="gallery"]',
            ],

            // XPath for the numbered page links; presumably used to follow
            // multi-page articles — verify against the consumer.
            'next_page' => '//span[@class="numbers"]/a',

            // XPath expressions, presumably selecting nodes removed from the
            // extracted content (captions, metadata, credits, asides, expanders).
            'strip' => [
                '//figcaption',
                '//div[@class="post-meta"]',
                '//div[@class="gallery-image-credit"]',
                '//aside',
                '//div[@class="article-expander"]',
            ],
        ],
    ],
];
|