19 lines
551 B
PHP
19 lines
551 B
PHP
<?php

/*
 * Content-grabber rule set, handed back to whichever script includes this file.
 *
 * Layout: 'grabber' maps a pattern string to a single rule. Each rule holds a
 * sample URL ('test_url') and two lists of XPath expressions ('body', 'strip').
 *
 * NOTE(review): the code that consumes this array is not visible here.
 * Presumably 'body' selects the nodes to keep and 'strip' the nodes to remove
 * from them -- confirm against the loader before relying on that.
 */
return array(
    'grabber' => array(
        // Looks like a regular expression delimited by "%" (".*" matches any
        // input) -- presumably tested against the article URL; TODO confirm.
        '%.*%' => array(
            // Sample article address associated with this rule.
            'test_url' => 'http://www.themoscowtimes.com/business/article/535500.html',

            // XPath expressions for the lead-image and article-text containers.
            'body' => array(
                '//div[@class="article_main_img"]',
                '//div[@class="article_text"]',
            ),

            // XPath expressions for the footer block, bold runs inside
            // paragraphs, in-paragraph links whose href contains
            // "/article.php?id=", and the Disqus wrapper.
            'strip' => array(
                '//div[@class="articlebottom"]',
                '//p/b',
                '//p/a[contains(@href, "/article.php?id=")]',
                '//div[@class="disqus_wrap"]',
            ),
        ),
    ),
);