Esempio n. 1
0
    $cc->displayError($e->getMessage());
}
// Take the URL argument, run it through Helper::addSchema(), and let
// Net_URL2 produce the normalized form used for the rest of the script.
$urlObj = new \Net_URL2(Helper::addSchema($res->args['url']));
$url = $urlObj->getNormalizedURL();

// Abort with exit status 2 when Helper::isUrlAllowed() rejects the normalized URL.
if (!Helper::isUrlAllowed($url)) {
    Log::error("Domain is not allowed; not crawling");
    exit(2);
}
try {
    // Build a map of action name => handler object for every requested action.
    $actions = array();
    foreach ($res->args['actions'] as $action) {
        switch ($action) {
            case 'crawl':
                // The crawler is configured from the showLinksOnly option before use.
                $crawler = new Crawler();
                $crawler->setShowLinksOnly($res->options['showLinksOnly']);
                $actions[$action] = $crawler;
                break;
            case 'index':
                $actions[$action] = new Indexer();
                break;
            // Any other action name adds nothing to $actions.
        }
    }
    // Hand the normalized URL, the action handlers and the "force" option
    // to the fetcher.
    $fetcher = new Fetcher();
    $retrieved = $fetcher->fetch($url, $actions, $res->options['force']);
    if ($retrieved === false) {
        // fetch() returned exactly false: end the script with exit status 0.
        // NOTE(review): presumably this means there is nothing to process
        // (e.g. unchanged document) -- confirm against Fetcher::fetch().
        exit(0);
    }
    // Initialised to false before the per-action loop that follows.
    // NOTE(review): presumably set by that loop -- its body is not visible here.
    $update = false;
    foreach ($actions as $key => $action) {
        Log::info("step: {$key}");