phpdigGetSiteFromUrl($id_connect, trim(str_replace("\n\r\t", '', $urlFileLine)), $linksper, $linksper_flag, $limit, $limit_flag, $usetable); } } } $common_words = phpdigComWords("{$relative_script_path}/includes/common_words.txt"); //connect to distant ftp for text content (if constants are defined) $ftp_id = phpdigFtpConnect(); //mode url : test new or existing site if ($from_shell_flag == 2 && isset($url) && $url && $url != 'http://' && $url != 'https://' && (!$respider_mode || $respider_mode == 'site')) { extract(phpdigGetSiteFromUrl($id_connect, trim($url), $linksper, $linksper_flag, $limit, $limit_flag, $usetable)); } elseif (isset($url) && !empty($url) && $url != 'http://' && $url != 'https://' && (!$respider_mode || $respider_mode == 'site')) { $urlsBox = preg_split("/[\r\n]+/", $url); $urlsBox_cnt = count($urlsBox); for ($i = 0; $i < $urlsBox_cnt; $i++) { if (ereg('^http[s]?://[a-zA-Z0-9.-]+', trim($urlsBox[$i]))) { phpdigGetSiteFromUrl($id_connect, trim(str_replace("\n\r\t", '', $urlsBox[$i])), $linksper, $linksper_flag, $limit, $limit_flag, $usetable); } } } //retrieve list of urls if ($site_id) { $site_id = (int) $site_id; $where_site = "WHERE site_id={$site_id}"; } else { $where_site = ''; } if (isset($urlsFile) || isset($urlsBox)) { $query = "SELECT DISTINCT(" . PHPDIG_DB_PREFIX . "sites.site_id)," . PHPDIG_DB_PREFIX . "sites.site_url," . PHPDIG_DB_PREFIX . "sites.username as user," . PHPDIG_DB_PREFIX . "sites.password as pass," . PHPDIG_DB_PREFIX . "sites.port FROM " . PHPDIG_DB_PREFIX . "sites," . PHPDIG_DB_PREFIX . "tempspider WHERE " . PHPDIG_DB_PREFIX . "sites.site_id = " . PHPDIG_DB_PREFIX . "tempspider.site_id"; } elseif ($site_id || $from_shell_flag == 1) { $query = "SELECT site_id,site_url,username as user,password as pass,port FROM " . PHPDIG_DB_PREFIX . "sites {$where_site}"; } else {
function phpdigSpiderAddSite($id_connect, $url, $linksper, $linksper_flag, $limit, $limit_flag, $usetable) { $pu = parse_url($url); settype($pu['path'], 'string'); settype($pu['query'], 'string'); settype($pu['port'], 'integer'); if ($pu['port'] == 0 || $pu['port'] == 80) { $pu['port'] = ''; } else { settype($pu['port'], 'integer'); } $url = $pu['scheme'] . "://" . $pu['host'] . "/"; if (!$pu['port']) { $where_port = "and (port IS NULL OR port = 0)"; } else { $where_port = "and port='" . $pu['port'] . "'"; } $query = "SELECT site_id FROM " . PHPDIG_DB_PREFIX . "sites WHERE site_url = '{$url}' {$where_port}"; $result = mysql_query($query, $id_connect); if (mysql_num_rows($result) > 0) { list($site_id) = mysql_fetch_row($result); $query = "DELETE FROM " . PHPDIG_DB_PREFIX . "tempspider WHERE site_id = {$site_id} AND file = '" . $pu['query'] . "' and path = '" . $pu['path'] . "'"; mysql_query($query, $id_connect); $added_site['site_id'] = "zzz"; return $added_site['site_id']; } else { $added_site = phpdigGetSiteFromUrl($id_connect, $url, $linksper, $linksper_flag, $limit, $limit_flag, $usetable); if (is_array($added_site)) { $query = "SELECT site_id,site_url,username as user,password as pass,port,locked FROM " . PHPDIG_DB_PREFIX . "sites where site_id=" . $added_site['site_id']; $added_site = phpdigMySelect($id_connect, $query); if (is_array($added_site)) { return $added_site[0]; } } } }