24 lines
756 B
PHP
Raw Normal View History

2015-10-18 17:31:23 -04:00
<?php

// Scraping rule set for arstechnica.com articles. The file evaluates to a
// single nested array, handed back to whatever include/require loads it.
// NOTE(review): how each key is interpreted depends on the consuming grabber,
// which is not visible here; the per-key notes below are assumptions to confirm.
return array(
    'grabber' => array(
        // Rule key; presumably a regex (with "%" delimiters) matched against
        // the article URL, in which case ".*" applies the rule to every path.
        '%.*%' => array(
            // Sample article, presumably used to exercise this rule in tests.
            'test_url' => 'http://arstechnica.com/tech-policy/2015/09/judge-warners-2m-happy-birthday-copyright-is-bogus/',
            // XPath expressions, presumably selecting the nodes kept as content.
            'body' => array(
                '//header/h2',
                '//section[@id="article-guts"]',
                '//div[@class="superscroll-content show"]',
                '//div[@class="gallery"]',
            ),
            // XPath for pagination links, presumably followed for multi-page articles.
            'next_page' => '//span[@class="numbers"]/a',
            // XPath expressions, presumably for nodes removed from the selected content.
            'strip' => array(
                '//figcaption',
                '//div[@class="post-meta"]',
                '//div[@class="gallery-image-credit"]',
                '//aside',
                '//div[@class="article-expander"]',
            ),
        ),
    ),
);