Example #1
0
<?php

/**
 * Created by PhpStorm.
 * User: yakov
 * Date: 05.06.16
 * Time: 12:19
 */
require __DIR__ . '/../vendor/autoload.php';
// Demo: fetch one Wikipedia article and print a few fields pulled out by
// CSS-like selectors. Each result key maps to a list of matches.
// NOTE(review): the "|src" / "|innertext" suffixes presumably pick an attribute
// or the inner markup of the matched node - confirm against the HyperParser docs.
$selectors = [
    'name' => '#firstHeading',
    'img' => '.image img|src',
    'bio' => '#mw-content-text p|innertext',
    'tags' => '#mw-normal-catlinks a',
];
$articleUrl = 'https://en.wikipedia.org/wiki/Adam_Smith';
$wikiParser = new \jakulov\HyperParser\Parser();
$article = $wikiParser->parseUrl($articleUrl, $selectors);

// Only the first match of each selector is shown for the scalar fields.
$heading = $article['name'][0];
echo "Name: {$heading}" . PHP_EOL;

$photo = $article['img'][0];
echo "Photo: {$photo}" . PHP_EOL . PHP_EOL;

// The bio is returned with markup, so tags are stripped before printing.
$plainBio = strip_tags($article['bio'][0]);
echo "Bio: {$plainBio}" . PHP_EOL . PHP_EOL;

echo '===================== ' . PHP_EOL;

// The first "tags" match is dropped
// (presumably the "Categories" label link rather than a real category - verify).
$categories = array_slice($article['tags'], 1);
echo 'Tags: ' . implode(', ', $categories) . PHP_EOL . PHP_EOL;
Example #2
0
<?php

/**
 * Created by PhpStorm.
 * User: yakov
 * Date: 05.06.16
 * Time: 15:30
 */
require __DIR__ . '/../vendor/autoload.php';
// Demo: read the front page of lenta.ru, collect the links from the
// ".b-yellow-box" block, then parse every linked page in one bulk call.
$parser = new \jakulov\HyperParser\Parser();
$url1 = 'http://lenta.ru';
$pattern1 = ['links' => '.b-yellow-box .item a|href'];
$data1 = $parser->parseUrl($url1, $pattern1);

// Guard against a failed fetch or a selector that matched nothing, so the
// loop below never iterates over an undefined index.
$links = (isset($data1['links']) && is_array($data1['links'])) ? $data1['links'] : [];

$urls = [];
foreach ($links as $link) {
    if (!$link) {
        continue;
    }
    if (preg_match('#^https?://#i', $link)) {
        // Already absolute: prefixing the site root would corrupt it
        // (e.g. "http://lenta.ruhttps://other.site/...").
        $urls[] = $link;
    } elseif (strpos($link, '//') === 0) {
        // Protocol-relative href: reuse the scheme of the base URL.
        $urls[] = parse_url($url1, PHP_URL_SCHEME) . ':' . $link;
    } else {
        // Site-relative href: join with exactly one slash between the parts.
        $urls[] = rtrim($url1, '/') . '/' . ltrim($link, '/');
    }
}

$pattern2 = ['title' => 'title', 'img' => '.b-topic__title-image img|src', 'text' => '.b-text|innertext'];
// NOTE(review): the meaning of the third argument (false) is not visible here -
// confirm against Parser::bulkParse before changing it.
$data2 = $parser->bulkParse($urls, $pattern2, false);
foreach ($data2 as $url => $news) {
    if (is_array($news)) {
        echo PHP_EOL . '==============' . PHP_EOL;
        echo $url . PHP_EOL;
        echo 'Title: ' . $news['title'][0] . PHP_EOL;
        echo 'IMG: ' . $news['img'][0] . PHP_EOL . PHP_EOL;
        echo 'Text: ' . $news['text'][0] . PHP_EOL . PHP_EOL;
    } else {
        echo 'ERROR: ' . $news . PHP_EOL . PHP_EOL;