/**
 * Scrape the detail page referenced by $data['ourl'] and persist the result.
 *
 * Works on $data by reference: sets 'keyword', 'utime', 'intro' and 'vols',
 * removes 'purl', and strips the global $_root prefix from 'ourl'. The record
 * is then either merged into an existing article (matched by name) or
 * inserted as a new one.
 *
 * The script is terminated with exit when the page cannot be fetched or when
 * addArticle() reports failure.
 *
 * @param array $data Record being built; 'ourl' is read unconditionally,
 *                    'purl' and 'name' are read if present.
 *
 * @return int|false|null 0 when getArticlePlayData() returns nothing,
 *                        false when the name is empty or no volumes were parsed,
 *                        6 when an existing article was found and
 *                        addArticleVols() was called,
 *                        null after a successful addArticle().
 */
function getinfodetail(&$data)
{
    global $_root;

    echo $data['ourl'], "\n";

    // The page is used exactly as getHtml() returns it; no charset conversion.
    $html = getHtml($data['ourl']);
    if (!$html) {
        echo "获取html失败";
        exit;
    }

    $data['keyword'] = '';
    $data['utime'] = time();

    // The synopsis is carried in the txt attribute of <span class="more">.
    $intro = '';
    if (preg_match('#<span class="more" txt="([^"]+)"\\s*>#Uis', $html, $match)) {
        $intro = $match[1];
    }

    $intro = strip_tags($intro);
    // Drop HTML entities such as &nbsp;
    $intro = preg_replace('#&\\S+;#Uis', '', $intro);
    // Measure and cut with the same explicit encoding so the 300-character
    // limit does not depend on mb_internal_encoding.
    if (mb_strlen($intro, 'utf-8') > 300) {
        $intro = mb_substr($intro, 0, 300, 'utf-8');
    }
    $intro = str_replace('?', '', $intro);
    $intro = trim($intro);
    // Collapse runs of line breaks into a single one.
    $intro = preg_replace("#(\r\n)+#is", "\r\n", $intro);
    $intro = preg_replace("#\n+#is", "\n", $intro);
    $data['intro'] = $intro;

    // 'purl' may not have been supplied by the caller; avoid an undefined-index notice.
    $purl = isset($data['purl']) ? $data['purl'] : null;
    $playhtml = getArticlePlayData($purl);
    if (empty($playhtml)) {
        echo "\n++ Ourl:{$data['ourl']} Purl:{$purl} playdata vols decode error!++\n";
        return 0;
    }

    $data['vols'] = getParseVideoInfo($playhtml);
    unset($data['purl']);

    if (empty($data['name']) || empty($data['vols'])) {
        echo "抓取失败 {$data['ourl']} \r\n";
        return false;
    }

    $data['ourl'] = str_replace($_root, '', $data['ourl']);

    // If an article with this name already exists, only push the volumes to it.
    $aid = checkArticleByOname($data['name']);
    if ($aid) {
        $vdata = array('name' => $data['name'], 'vols' => $data['vols']);
        $aid = addArticleVols($vdata);
        echo "{$aid}已存在更新!\r\n";
        return 6;
    }

    $aid = addArticle($data);
    if (!$aid) {
        // Dump the record for diagnosis and stop the whole run.
        var_dump($data);
        echo "\r\n添加失败! {$data['ourl']} \r\n";
        exit;
    }

    echo "添加成功! {$aid} \r\n";
}
continue; } // check local exists $check = $m->checkid97vid($ovid); if ($check) { echo "\n=== {$ovid} already exists! ====\n"; continue; } $infoUrl = sprintf('%svideos/play/mid/%d.html', $_root, $ovid); $title = trim($titlePool[$uk]); $sourceUrl = sprintf('%svideos/resource/id/%d', $_root, $ovid); $data = getinfodetail($sourceUrl); $data['name'] = $title; $data['ourl'] = $ovid; $data['thum'] = $picPool[$uk]; $vinfo = getParseVideoInfo($uv); $data['vols'] = $vinfo; //var_dump($data);exit; if (empty($vinfo)) { echo "\n==== Get Parse Info Failed Ourl: {$infoUrl} Purl: {$sourceUrl} Page: {$start_page} =====\n"; if (stripos($uv, '/resource/id/') !== false) { continue; } exit; } $aid = checkArticleByOname($data['name']); if ($aid) { $vdata = array('name' => $data['name'], 'vols' => $data['vols']); $aid = addArticleVols($vdata); echo "{$aid}已存在更新! ovid: {$ovid} Page: {$start_page} \r\n"; $m->addid97vid($ovid);
/**
 * Scrape a GBK-encoded detail page referenced by $data['ourl'] and persist it.
 *
 * Works on $data by reference: sets 'keyword', 'utime', 'intro' and 'vols',
 * temporarily sets and then removes 'purl', and strips the global $_root
 * prefix from 'ourl'. The record is then either merged into an existing
 * article (matched by name) or inserted as a new one.
 *
 * The script is terminated with exit when the page cannot be fetched or
 * converted, or when addArticle() reports failure.
 *
 * @param array $data Record being built; 'ourl' is read unconditionally,
 *                    'name' is read if present.
 *
 * @return int|false|null 0 when getArticlePlayData() returns nothing,
 *                        false when the name is empty or no volumes were parsed,
 *                        6 when an existing article was found and
 *                        addArticleVols() was called,
 *                        null after a successful addArticle().
 */
function getinfodetail(&$data)
{
    global $_root;

    echo $data['ourl'], "\n";

    // Only convert when something was actually fetched, so a failed fetch
    // (false/null) is never handed to mb_convert_encoding(). A failed
    // conversion is still caught by the check below.
    $raw = getHtml($data['ourl']);
    $html = $raw ? mb_convert_encoding($raw, "UTF-8", "GBK") : '';
    if (!$html) {
        echo "获取html失败";
        exit;
    }

    $data['keyword'] = '';
    $data['utime'] = time();

    // The synopsis sits in the styled <div> following the "剧情介绍:" heading.
    $intro = '';
    if (preg_match('#剧情介绍:</h2>\\s*</div>\\s*<div style="[^"]+">(.+)<p>#Uis', $html, $introMatch)) {
        $intro = $introMatch[1];
    }

    $intro = strip_tags($intro);
    // Drop HTML entities such as &nbsp;
    $intro = preg_replace('#&\\S+;#Uis', '', $intro);
    // Measure and cut with the same explicit encoding so the 300-character
    // limit does not depend on mb_internal_encoding.
    if (mb_strlen($intro, 'utf-8') > 300) {
        $intro = mb_substr($intro, 0, 300, 'utf-8');
    }
    $intro = str_replace('?', '', $intro);
    $intro = trim($intro);
    // Collapse runs of line breaks and of whitespace.
    $intro = preg_replace("#(\r\n)+#is", "\r\n", $intro);
    $intro = preg_replace("#\n+#is", "\n", $intro);
    $intro = preg_replace('#\\s\\s+#is', ' ', $intro);

    // iconv() returns false if it meets an invalid byte sequence, which used
    // to wipe the whole intro. Fall back to an mbstring round-trip, which
    // substitutes '?' for bad sequences; those are stripped right below.
    $converted = @iconv("UTF-8", "UTF-8//TRANSLIT", $intro);
    if ($converted === false) {
        $converted = mb_convert_encoding($intro, "UTF-8", "UTF-8");
    }
    $intro = str_replace('?', '', $converted);
    $data['intro'] = $intro;

    // Locate the link to the first player page; null when the page has none.
    preg_match('#<li><a title=\'[^\']+\' href=\'(/.+/player-0-0\\.html)\' target="_blank">.+</a></li>#Uis', $html, $linkMatch);
    $data['purl'] = isset($linkMatch[1]) ? $linkMatch[1] : null;

    $playhtml = getArticlePlayData($data['purl']);
    if (empty($playhtml)) {
        echo "\n++ Ourl:{$data['ourl']} Purl:{$data['purl']} playdata vols decode error!++\n";
        return 0;
    }

    $data['vols'] = getParseVideoInfo($playhtml);
    unset($data['purl']);

    if (empty($data['name']) || empty($data['vols'])) {
        echo "抓取失败 {$data['ourl']} \r\n";
        return false;
    }

    $data['ourl'] = str_replace($_root, '', $data['ourl']);

    // If an article with this name already exists, only push the volumes to it.
    $aid = checkArticleByOname($data['name']);
    if ($aid) {
        $vdata = array('name' => $data['name'], 'vols' => $data['vols']);
        $aid = addArticleVols($vdata);
        echo "{$aid}已存在更新!\r\n";
        return 6;
    }

    $aid = addArticle($data);
    if (!$aid) {
        // Dump the record for diagnosis and stop the whole run.
        var_dump($data);
        echo "\r\n添加失败! {$data['ourl']} \r\n";
        exit;
    }

    echo "添加成功! {$aid} \r\n";
}