/**
 * Spider: builds the URL list for the page located at $url.
 *
 * The page content is obtained from _getHtmlFromUrl(), handed to
 * _filterUrl(), and that result is passed together with $url to
 * _reviseUrl(). Presumably this extracts the links found in the page and
 * resolves them against $url -- confirm against those helpers.
 *
 * @param string $url
 * @return array|null The value produced by _reviseUrl() when it is truthy;
 *                    null when either the fetched content or that value is falsy.
 */
function spider($url)
{
    $pageHtml = _getHtmlFromUrl($url);

    // Nothing usable was fetched: bail out with null, as callers expect.
    if (!$pageHtml) {
        return;
    }

    $links = _reviseUrl($url, _filterUrl($pageHtml));

    // A falsy result (e.g. an empty list) is reported as null, not returned as-is.
    if (!$links) {
        return;
    }

    return $links;
}
/**
 * Crawler: builds the URL list for the resource located at $url.
 *
 * The content is obtained from _getUrlContent(), handed to _filterUrl(),
 * and that result is passed together with $url to _reviseUrl().
 * Presumably this extracts the links found in the content and resolves
 * them against $url -- confirm against those helpers.
 *
 * @param string $url
 * @return array|null The value produced by _reviseUrl() when it is truthy;
 *                    null when either the fetched content or that value is falsy.
 */
function crawler($url)
{
    $body = _getUrlContent($url);

    // Nothing usable was fetched: bail out with null, as callers expect.
    if (!$body) {
        return;
    }

    $links = _reviseUrl($url, _filterUrl($body));

    // A falsy result (e.g. an empty list) is reported as null, not returned as-is.
    if (!$links) {
        return;
    }

    return $links;
}
/**
 * Crawler: fetches $url, stores the fetched content, and builds its URL list.
 *
 * The content is obtained from _curl_get_file_contents() and is always
 * handed to _save() together with $id and $url -- even when the fetch
 * produced a falsy value. Only then is the content passed to _filterUrl(),
 * whose result goes with $url to _reviseUrl(). Presumably this extracts
 * the links found in the content and resolves them against $url --
 * confirm against those helpers.
 *
 * @param mixed  $id  Identifier forwarded unchanged to _save().
 * @param string $url
 * @return array|null The value produced by _reviseUrl() when it is truthy
 *                    (presumably an array of URLs -- confirm); null when either
 *                    the fetched content or that value is falsy.
 */
function crawler($id, $url)
{
    $body = _curl_get_file_contents($url);

    // Persisting happens before the emptiness check, so failed fetches are saved too.
    _save($id, $url, $body);

    if (!$body) {
        return;
    }

    $links = _reviseUrl($url, _filterUrl($body));

    // A falsy result (e.g. an empty list) is reported as null, not returned as-is.
    if (!$links) {
        return;
    }

    return $links;
}