/**
 * Constructor.
 *
 * Takes no arguments. The Sphinx host, port and index list, as well as the
 * HTTPCWS (Chinese word segmentation) endpoint, are read from the "config"
 * entry stored in Yaf_Registry.
 */
function __construct()
{
    $registryConfig = Yaf_Registry::get("config");

    // Sphinx connection settings.
    $sphinxSettings = $registryConfig->get('sphinx')->toArray();
    $this->host = $sphinxSettings['host'];
    $this->port = $sphinxSettings['port'];
    $this->indexes = $sphinxSettings['indexes'];

    $client = new SphinxClient();
    $client->SetServer($this->host, $this->port);
    // Connection timeout, in seconds.
    $client->SetConnectTimeout(5);
    // Result set layout: TRUE returns a plain array, FALSE a PHP hash.
    $client->SetArrayResult(false);
    // Maximum search time, in milliseconds.
    $client->SetMaxQueryTime(5000);
    // Matching mode.
    $client->SetMatchMode(SPH_MATCH_EXTENDED2);
    // Weight/ranking mode (see SetRankingMode in the Sphinx documentation).
    $client->SetRankingMode(SPH_RANK_PROXIMITY_BM25);
    // Sort order: weight first, then document id, both descending.
    $client->SetSortMode(SPH_SORT_EXTENDED, '@weight DESC,@id DESC');
    $this->sphinx = $client;

    // Chinese word segmentation: base URL of the HTTPCWS server interface.
    $segmenter = $registryConfig->get('httpcws')->toArray();
    $this->httpcws_url = sprintf('http://%s:%s/?w=', $segmenter['host'], $segmenter['port']);
}
/**
 * Initialise the search engine client.
 *
 * Loads the 'Help_SphinxClient' core helper, builds a SphinxClient pointed
 * at SPHINX_HOST:SPHINX_PORT and stores it in $this->_sphinx.
 */
private function _initSphinx()
{
    $this->_loadCore('Help_SphinxClient');

    $client = new SphinxClient();
    $client->SetServer(SPHINX_HOST, SPHINX_PORT);

    // Connection timeout.
    $client->SetConnectTimeout(5);

    // NOTE(review): the original comment calls this the "maximum timeout";
    // the Sphinx API takes this value in milliseconds, so 10 looks very low - confirm.
    $client->SetMaxQueryTime(10);

    // Matching mode.
    $client->SetMatchMode(SPH_MATCH_ANY);
    $client->SetArrayResult(true);

    $this->_sphinx = $client;
}
/**
 * Initialise the search engine client.
 *
 * Imports '@.Util.SphinxClient', builds a SphinxClient using the
 * SPHINX_HOST / SPHINX_PORT values returned by C() and stores it in
 * $this->_sphinx.
 */
private function _initSphinx()
{
    import('@.Util.SphinxClient');

    $engine = new SphinxClient();
    $engine->SetServer(C('SPHINX_HOST'), C('SPHINX_PORT'));

    // Connection timeout.
    $engine->SetConnectTimeout(5);

    // NOTE(review): the original comment calls this the "maximum timeout";
    // the Sphinx API takes this value in milliseconds, so 10 looks very low - confirm.
    $engine->SetMaxQueryTime(10);

    // Matching mode.
    $engine->SetMatchMode(SPH_MATCH_ANY);

    // Return matches as an array.
    $engine->SetArrayResult(true);

    $this->_sphinx = $engine;
}
/**
 * Full-text search over the 'plancake_tasks' index, restricted to the
 * logged-in user's tasks.
 *
 * A failed Sphinx query is reported through sfErrorNotifier::alert() and
 * then treated as "no matches".
 *
 * @param string $query
 * @return mixed result of PcTaskPeer::retrieveByPKs() for the matched ids
 *               (the original docblock says "array of integers - taskIds";
 *               NOTE(review): verify against PcTaskPeer)
 */
public static function searchTasks($query)
{
    $authorId = PcUserPeer::getLoggedInUser()->getId();

    $sphinx = new SphinxClient();
    // The SetServer() call is disabled in the original and stays disabled here:
    // $sphinx->SetServer (sfConfig::get('app_sphinx_host'), sfConfig::get('app_sphinx_port'));
    $sphinx->SetFilter("author_id", array($authorId));
    $sphinx->SetConnectTimeout(1);
    $sphinx->SetMatchMode(SPH_MATCH_ANY);
    $sphinx->SetSortMode(SPH_SORT_RELEVANCE);
    $sphinx->SetRankingMode(SPH_RANK_PROXIMITY_BM25);
    $sphinx->SetArrayResult(true);
    $sphinx->SetFieldWeights(array('description' => 10, 'note' => 6));
    $sphinx->setLimits(0, 100);

    $escapedQuery = $sphinx->EscapeString($query);
    $results = $sphinx->query($escapedQuery, 'plancake_tasks');

    if ($results === false) {
        sfErrorNotifier::alert("Sphinx Error - " . $sphinx->GetLastError());
    }

    $taskIds = array();
    $hasMatches = isset($results['matches']) && count($results['matches']);
    if ($hasMatches) {
        foreach ($results['matches'] as $hit) {
            $taskIds[] = $hit['id'];
        }
    }

    return PcTaskPeer::retrieveByPKs($taskIds);
}
/**
 * Search hook: runs $search against SPHINX_INDEX for the current session
 * user and turns the matching ref_id attributes into a SQL condition.
 *
 * @param string $search Sphinx query (extended2 syntax).
 * @return array Two elements: the SQL fragment ("ref_id IN (...)", or
 *               "ref_id = -1" when nothing matched or the query failed) and
 *               an empty array.
 */
function hook_search($search)
{
    $offset = 0;
    $limit = 500;

    $sphinxClient = new SphinxClient();

    // SPHINX_SERVER is "host:port"; fall back to the standard searchd port
    // when the port part is missing instead of reading an undefined offset.
    $sphinxpair = explode(":", SPHINX_SERVER, 2);
    $sphinxport = isset($sphinxpair[1]) ? (int) $sphinxpair[1] : 9312;
    $sphinxClient->SetServer($sphinxpair[0], $sphinxport);

    $sphinxClient->SetConnectTimeout(1);
    $sphinxClient->SetFieldWeights(array('title' => 70, 'content' => 30, 'feed_title' => 20));
    $sphinxClient->SetMatchMode(SPH_MATCH_EXTENDED2);
    $sphinxClient->SetRankingMode(SPH_RANK_PROXIMITY_BM25);
    $sphinxClient->SetLimits($offset, $limit, 1000);
    $sphinxClient->SetArrayResult(false);
    $sphinxClient->SetFilter('owner_uid', array($_SESSION['uid']));

    $result = $sphinxClient->Query($search, SPHINX_INDEX);

    // Query() returns false on failure and may omit 'matches' when nothing
    // was found, so check before iterating.
    $ids = array();
    if (is_array($result) && isset($result['matches']) && is_array($result['matches'])) {
        foreach ($result['matches'] as $match) {
            // Cast to int: the values are interpolated into SQL below.
            $ids[] = (int) $match['attrs']['ref_id'];
        }
    }

    // Test the array, not the joined string: a lone id of 0 joins to "0",
    // which is falsy and used to be mistaken for "no results".
    if (count($ids) > 0) {
        $id_list = join(",", $ids);
        return array("ref_id IN ({$id_list})", array());
    }

    return array("ref_id = -1", array());
}
/**
 * Constructor.
 *
 * Reads keyword, type and page from $this->data and prepares a SphinxClient
 * (phrase matching, 10 results per page) in $this->sphinx.
 */
public function __construct()
{
    parent::__construct();

    // Search keyword, passed through t().
    $this->keyword = t($this->data['keyword']);

    // Search type: integer value of data['type'], or 1 when it is falsy.
    if ($this->data['type']) {
        $this->type = intval($this->data['type']);
    } else {
        $this->type = 1;
    }

    // Current page number; anything below 1 becomes 1.
    $currentPage = max(1, intval($this->data['page']));

    // Page size.
    $perPage = 10;

    // Sphinx is used for the search itself.
    $client = new SphinxClient();

    // Server address.
    $client->SetServer(self::SPHINX_HOST, self::SPHINX_PORT);

    // Return matches as an array.
    $client->SetArrayResult(true);

    // Offset and size of the requested page; at most 1000 matches are kept.
    $client->SetLimits(($currentPage - 1) * $perPage, $perPage, 1000);

    // Maximum search time.
    // NOTE(review): the Sphinx API takes milliseconds here; 3 looks very low - confirm.
    $client->SetMaxQueryTime(3);

    // Matching mode.
    $client->setMatchMode(SPH_MATCH_PHRASE);

    $this->sphinx = $client;
}
/**
 * Constructor.
 *
 * Creates the InfohashModel and a SphinxClient configured from the
 * 'app.sphinx.host' / 'app.sphinx.port' configuration values.
 */
public function __construct()
{
    parent::__construct();

    $this->infohash_model = new InfohashModel();

    $client = new SphinxClient();
    $client->SetServer(
        Config::get('app.sphinx.host'),
        Config::get('app.sphinx.port')
    );
    // Return matches as a plain array.
    $client->SetArrayResult(true);

    $this->sphinx = $client;
}
/**
 * Constructor.
 *
 * Builds two identically configured Sphinx clients (one for searching, one
 * for suggestions) and tries to open a PDO MySQL connection to
 * $rt_host:$rt_port. When that connection cannot be established,
 * $this->rt_conn is left as null instead of letting the exception escape.
 *
 * @param Application $app
 * @param string $host    Sphinx server host.
 * @param int    $port    Sphinx server port.
 * @param string $rt_host Host for the PDO MySQL connection.
 * @param int    $rt_port Port for the PDO MySQL connection.
 */
public function __construct(Application $app, $host, $port, $rt_host, $rt_port)
{
    $this->app = $app;

    // Both clients share the same settings, so build them in one pass.
    foreach (array('sphinx', 'suggestionClient') as $property) {
        $client = new \SphinxClient();
        $client->SetServer($host, $port);
        $client->SetArrayResult(true);
        $client->SetConnectTimeout(1);
        $this->{$property} = $client;
    }

    $dsn = sprintf('mysql:host=%s;port=%s;', $rt_host, $rt_port);
    try {
        $this->rt_conn = @new \PDO($dsn);
        $this->rt_conn->setAttribute(\PDO::ATTR_ERRMODE, \PDO::ERRMODE_EXCEPTION);
    } catch (\PDOException $connectionError) {
        // Connection is optional: carry on without it.
        $this->rt_conn = null;
    }

    return $this;
}
/**
 * Build a SphinxClient for the local searchd instance.
 *
 * Loads the bundled sphinxapi.php (2.1.9) and returns a client pointed at
 * 127.0.0.1:9312 with a 20 second connect timeout, array results, weights
 * (1000, 1) and extended match mode.
 *
 * @return SphinxClient
 */
private function _getSphinxClient()
{
    require_once SCRIPT_BASE . 'lib/sphinx-2.1.9/sphinxapi.php';

    $client = new SphinxClient();

    // Connection.
    $client->SetServer('127.0.0.1', 9312);
    $client->SetConnectTimeout(20);

    // Matching and weighting.
    $client->SetMatchMode(SPH_MATCH_EXTENDED);
    $client->SetWeights(array(1000, 1));

    // Result layout.
    $client->SetArrayResult(true);

    return $client;
}
/**
 * __construct()
 *
 * Constructor. Runs the parent constructor, then applies this class's
 * defaults: server SPH_HOST:9312, extended2 matching, word-count ranking,
 * array results, and the limits held in $this->offset / $this->limit.
 */
public function __construct()
{
    parent::__construct();

    // Connection.
    parent::SetServer(SPH_HOST, 9312);

    // Result layout.
    parent::SetArrayResult(TRUE);

    // Matching and ranking.
    parent::SetMatchMode(SPH_MATCH_EXTENDED2);
    parent::SetRankingMode(SPH_RANK_WORDCOUNT);

    // Disabled in the original and left disabled here:
    //   parent::SetServer("localhost",9312);
    //   parent::SetConnectTimeout(10);
    //   parent::SetFieldWeights($this->weights);
    //   parent::SetSortMode(SPH_SORT_EXTENDED, '@weight desc');

    $this->SetLimits($this->offset, $this->limit);
}
/**
 * Put $this->sphinxClient back into a known baseline state.
 *
 * Clears filters, group-by and overrides, then re-applies the defaults used
 * by this class: limits 0/20, array results, no field or index weights, no
 * id range, extended2 matching, no ranking, relevance sort and "*" select.
 */
protected function resetClient()
{
    $client = $this->sphinxClient;

    // Drop per-query state.
    $client->ResetFilters();
    $client->ResetGroupBy();
    $client->ResetOverrides();

    // Paging and result layout.
    $client->SetLimits(0, 20);
    $client->SetArrayResult(true);

    // Weights and id range back to "unset".
    $client->SetFieldWeights(array());
    $client->SetIDRange(0, 0);
    $client->SetIndexWeights(array());

    // Matching, ranking, sorting and selected columns.
    $client->SetMatchMode(SPH_MATCH_EXTENDED2);
    $client->SetRankingMode(SPH_RANK_NONE);
    $client->SetSortMode(SPH_SORT_RELEVANCE, "");
    $client->SetSelect("*");
}
/**
 * Suggest a replacement for $keyword using the "suggest" trigram index.
 *
 * The keyword is turned into trigrams (BuildTrigrams), matched against the
 * index with a length window of +/- LENGTH_THRESHOLD, and the top TOP_COUNT
 * candidates are then filtered by Levenshtein distance.
 *
 * @param string $keyword
 * @return string|false false when the query failed or produced no matches;
 *                      otherwise the first candidate within
 *                      LEVENSHTEIN_THRESHOLD, or $keyword itself when no
 *                      candidate is close enough.
 */
function MakeSuggestion($keyword)
{
    $trigrams = BuildTrigrams($keyword);
    $query = "\"{$trigrams}\"/1";
    // Byte length, matching the byte-based levenshtein() used below.
    $len = strlen($keyword);
    $delta = LENGTH_THRESHOLD;

    $cl = new SphinxClient();
    $cl->SetMatchMode(SPH_MATCH_EXTENDED2);
    $cl->SetRankingMode(SPH_RANK_WORDCOUNT);
    $cl->SetFilterRange("len", $len - $delta, $len + $delta);
    $cl->SetSelect("*, @weight+{$delta}-abs(len-{$len}) AS myrank");
    $cl->SetSortMode(SPH_SORT_EXTENDED, "myrank DESC, freq DESC");
    $cl->SetArrayResult(true);

    // pull top-N best trigram matches and run them through Levenshtein
    $cl->SetLimits(0, TOP_COUNT);
    $res = $cl->Query($query, "suggest");

    // empty() also covers a result without a 'matches' key.
    if (!$res || empty($res["matches"])) {
        return false;
    }

    if (SUGGEST_DEBUG) {
        print "--- DEBUG START ---\n";
        foreach ($res["matches"] as $match) {
            $w = $match["attrs"]["keyword"];
            $myrank = isset($match["attrs"]["myrank"]) ? $match["attrs"]["myrank"] : null;
            if ($myrank) {
                $myrank = ", myrank={$myrank}";
            }
            // FIXME? add costs?
            // FIXME! levenshtein() is byte-based and does not work with UTF-8.
            $levdist = levenshtein($keyword, $w);
            // The array keys must be quoted inside {...}: unquoted they are
            // read as constants, which is a fatal Error on PHP 8.
            print "id={$match['id']}, weight={$match['weight']}, freq={$match['attrs']['freq']}{$myrank}, word={$w}, levdist={$levdist}\n";
        }
        print "--- DEBUG END ---\n";
    }

    // further restrict trigram matches with a sane Levenshtein distance limit
    foreach ($res["matches"] as $match) {
        $suggested = $match["attrs"]["keyword"];
        if (levenshtein($keyword, $suggested) <= LEVENSHTEIN_THRESHOLD) {
            return $suggested;
        }
    }

    return $keyword;
}
/**
 * Query all Sphinx indexes ("*") for $keyword with optional attribute filters.
 *
 * @param string $keyword      Search text.
 * @param int    $offset       Offset of the first match to return.
 * @param int    $limit        Number of matches to return. Values <= 0 are
 *                             not passed to SetLimits() (Sphinx rejects a
 *                             non-positive limit), so the client's own
 *                             default limit applies.
 * @param array  $searchParams Optional keys, each applied only when truthy:
 *                             'provice_sid', 'city_sid', 'piccode' (exact
 *                             filters), 'recent' (createtime within the last
 *                             30 days), 'searchtype' (truthy = match all
 *                             words, otherwise match any word).
 * @return mixed Whatever SphinxClient::Query() returns.
 */
public function getResultByTag($keyword = "", $offset = 0, $limit = 0, $searchParams = array())
{
    $sphinx = $this->config->item('sphinx');

    $cl = new SphinxClient();
    // Note the host used here.
    $cl->SetServer($sphinx['ip'], $sphinx['port']);
    $cl->SetConnectTimeout($sphinx['timeout']);
    $cl->SetArrayResult(true);
    // $cl->SetIDRange(89,90); // filter by ID

    // Exact-value attribute filters, each applied only when a truthy value was supplied.
    foreach (array('provice_sid', 'city_sid', 'piccode') as $attribute) {
        if (isset($searchParams[$attribute]) && $searchParams[$attribute]) {
            $cl->setFilter($attribute, array($searchParams[$attribute]));
        }
    }

    if (isset($searchParams['recent']) && $searchParams['recent']) {
        // Last 30 days.
        $now = time();
        $cl->SetFilterRange('createtime', $now - 86400 * 30, $now);
    }

    // Exact (all words) versus fuzzy (any word).
    if (isset($searchParams['searchtype']) && $searchParams['searchtype']) {
        $searchtype = SPH_MATCH_ALL;
    } else {
        $searchtype = SPH_MATCH_ANY;
    }

    // SetLimits() requires limit > 0; the default $limit of 0 used to be
    // passed straight through.
    if ($limit > 0) {
        $cl->SetLimits($offset, $limit);
    }

    $cl->SetMatchMode($searchtype);
    $cl->SetSortMode(SPH_SORT_EXTENDED, "@weight desc,@id desc");

    $index = "*";
    $query = $cl->Query($keyword, $index);
    $cl->close();

    return $query;
}
/**
 * Sphinx search: looks up the 'search' request parameter in all indexes,
 * loads the matching rows from the documents table, highlights the search
 * text in title/content and renders the 'sphinx.search' view.
 *
 * A failed query or a query without matches renders an empty result
 * (total 0, time 0) instead of raising undefined-offset errors.
 */
public function sphinxSearch(Request $request, \SphinxClient $sphinx)
{
    $search = $request->get('search');

    // Sphinx host and port (SphinxQL equivalent: mysql -h 127.0.0.1 -P 9306).
    $sphinx->SetServer('127.0.0.1', 9312);
    // Matching mode: SPH_MATCH_ALL (match all query words).
    $sphinx->SetMatchMode(SPH_MATCH_ALL);
    // Return matches as an array.
    $sphinx->SetArrayResult(true);
    // Offset, number of results to return, maximum number of matches.
    $sphinx->SetLimits(0, 20, 1000);
    // Maximum search time.
    $sphinx->SetMaxQueryTime(10);
    // '*' searches every index; a comma-separated list such as
    // 'email,diary' would restrict the search to those indexes.
    $result = $sphinx->query($search, '*');
    // Close the query connection.
    $sphinx->close();

    // 0 is always present so the IN (...) list below is never empty.
    $ids = [0];
    // query() returns false on failure and may omit 'matches' when nothing was found.
    if (!empty($result['matches']) && is_array($result['matches'])) {
        foreach ($result['matches'] as $match) {
            // Cast to int: the ids are interpolated into the SQL below.
            $ids[] = (int) $match['id'];
        }
    }
    $ids = implode(',', array_unique($ids));

    $list = DB::select("SELECT * from documents WHERE id IN ({$ids})");

    // Highlight only when there is something to highlight; an empty needle
    // changes nothing and a null needle is deprecated in str_replace().
    if ($search !== null && $search !== '' && !empty($list)) {
        $highlighted = '<span style="color: red;">' . $search . '</span>';
        foreach ($list as $row) {
            $row->content = str_replace($search, $highlighted, $row->content);
            $row->title = str_replace($search, $highlighted, $row->title);
        }
    }

    return view('/sphinx.search')->with('data', array(
        'total' => !empty($result['total']) ? $result['total'] : 0,
        'time' => !empty($result['time']) ? $result['time'] : 0,
        'list' => $list,
    ));
}
/**
 * Run $search_str against every index on the local searchd and return the
 * attributes of each match, keyed by document id.
 *
 * Multi-value attributes are rendered as "(a,b,c)" and timestamp attributes
 * as "Y-m-d H:i:s" strings; everything else is returned as-is.
 *
 * @param string $search_str Query text (SPH_MATCH_ALL).
 * @return array|null doc id => (attribute name => value); null when the
 *                    query failed or returned no 'matches' entry.
 */
function do_query($search_str)
{
    $host = "localhost";
    $port = 9312;
    $index = "*";
    $limit = 20;

    $cl = new SphinxClient();
    $cl->SetServer($host, $port);
    $cl->SetConnectTimeout(1);
    $cl->SetArrayResult(true);
    $cl->SetWeights(array(100, 1));
    $cl->SetMatchMode(SPH_MATCH_ALL);
    $cl->SetSelect("*");
    $cl->SetLimits(0, $limit, $limit > 1000 ? $limit : 1000);
    $cl->SetRankingMode(SPH_RANK_PROXIMITY_BM25);

    $res = $cl->Query($search_str, $index);

    // Query() returns false on failure; 'matches' can be absent.
    if (!is_array($res) || !isset($res["matches"]) || !is_array($res["matches"])) {
        return null;
    }

    $results = array();
    foreach ($res["matches"] as $docinfo) {
        $attr_array = array();
        foreach ($res["attrs"] as $attrname => $attrtype) {
            $value = $docinfo["attrs"][$attrname];
            if ($attrtype == SPH_ATTR_MULTI || $attrtype == SPH_ATTR_MULTI64) {
                $value = "(" . join(",", $value) . ")";
            } elseif ($attrtype == SPH_ATTR_TIMESTAMP) {
                $value = date("Y-m-d H:i:s", $value);
            }
            $attr_array[$attrname] = $value;
        }
        // The key must be the quoted string 'id'; unquoted it is read as a
        // constant, which is a fatal Error on PHP 8.
        $results[$docinfo['id']] = $attr_array;
    }

    return $results;
}
/**
 * Find the level-1 categories that match $keywords.
 *
 * Searches every index for documents with status = 1, grouped by
 * level_1_category_id and ordered by group size (largest first).
 *
 * @param string $keywords Query text (extended syntax).
 * @return array List of the 'attrs' arrays of the grouped matches; empty
 *               when the query failed or nothing matched.
 */
function getCategory($keywords)
{
    $client = new SphinxClient();
    $client->SetServer(SPHINX_SERVER, SPHINX_PORT);
    $client->SetConnectTimeout(1);
    $client->SetWeights(array(100, 1));
    $client->SetMatchMode(SPH_MATCH_EXTENDED);
    $client->SetRankingMode(SPH_RANK_PROXIMITY_BM25);
    $client->SetArrayResult(true);
    $client->SetFilter('status', array('1'));
    $client->SetGroupBy("level_1_category_id", SPH_GROUPBY_ATTR, "@count DESC");

    $response = $client->Query($keywords, '*');

    $categories = array();
    if (!$response || !isset($response["matches"]) || !is_array($response["matches"])) {
        return $categories;
    }

    foreach ($response["matches"] as $match) {
        $categories[] = $match["attrs"];
    }

    return $categories;
}
/**
 * Full-text search.
 *
 * Queries the shop index configured under 'fullindexer' and turns the
 * matched document ids into a query condition on store.store_id.
 *
 * @param string $search_txt Search text.
 * @return array Empty when $search_txt is ''; otherwise
 *               array('store.store_id' => array('in', <matched ids>)),
 *               where the id list is empty if nothing matched or the query
 *               failed.
 */
private function full_search($search_txt)
{
    $conf = C('fullindexer');
    uk86_import('libraries.sphinx');

    $cl = new SphinxClient();
    $cl->SetServer($conf['host'], $conf['port']);
    $cl->SetConnectTimeout(1);
    $cl->SetArrayResult(true);
    $cl->SetRankingMode($conf['rankingmode'] ? $conf['rankingmode'] : 0);
    $cl->setLimits(0, $conf['querylimit']);
    $cl->setMatchMode($conf['matchmode']);

    // Status filtering and sorting could be done through the full-text index,
    // but the index would have to be rebuilt frequently or the results become
    // inaccurate, so this is left to the database for now (slower).
    // $cl->SetFilter('store_state',array(1),false);
    // if ($_GET['key'] == 'store_credit'){
    //     $order = $_GET['order'] == 'desc' ? SPH_SORT_ATTR_DESC : SPH_SORT_ATTR_ASC;
    //     $cl->SetSortMode($order,'store_sort');
    // }

    $res = $cl->Query($search_txt, $conf['index_shop']);

    // Initialise both variables: previously they were undefined when the
    // query had no matches or the search text was empty.
    $matchs_id = array();
    $condition = array();

    if ($res && isset($res['matches']) && is_array($res['matches'])) {
        foreach ($res['matches'] as $value) {
            $matchs_id[] = $value['id'];
        }
    }

    if ($search_txt != '') {
        $condition['store.store_id'] = array('in', $matchs_id);
    }

    return $condition;
}
<?php
// Minimal Sphinx check: runs the query 'sphinxse' against every index on
// the local searchd and dumps the matches.
require "sphinxapi.php";

$client = new SphinxClient();

// Connection.
$client->SetServer('127.0.0.1', 9312);
$client->SetConnectTimeout(1);

// Matching and ranking.
$client->SetMatchMode(SPH_MATCH_EXTENDED2);
$client->SetRankingMode(SPH_RANK_WORDCOUNT);

// Result layout.
$client->SetArrayResult(true);

// Disabled in the original and left disabled here:
//   $cl->SetWeights ( array ( 100, 1 ) );
//   $cl->SetSortMode ( SPH_SORT_EXTENDED, '@weight DESC' );
//   $cl->SetSortMode ( SPH_SORT_EXPR, $sortexpr );
//   $cl->SetFieldWeights(array('title'=>10,'content'=>1));

$response = $client->Query('sphinxse', "*");
print_r($response['matches']);
/**
 * Run one Coreseek/Sphinx query and return the RunQueries() result.
 *
 * The server address always comes from entry 1 of the coreseek
 * configuration (cached in memcache under 'coreseek_config'); the $host and
 * $port arguments are accepted for compatibility but overwritten, exactly
 * as before.
 *
 * @param string       $index    Index name(s) to search.
 * @param string       $words    Query text.
 * @param array|string $wheres   Optional list of filters, each an array
 *                               with 'field', 'value' and 'status' (passed
 *                               as SetFilter()'s exclude flag); '' for none.
 * @param string       $orderby  Extended-mode sort clause.
 * @param int          $firstRow Offset of the first match.
 * @param int          $listRows Number of matches to return.
 * @param int          $timeout  Connect timeout.
 * @param string       $host     Ignored (see above).
 * @param int          $port     Ignored (see above).
 * @return mixed Result of SphinxClient::RunQueries().
 */
function CsGetData($index = '*', $words = '卫浴', $wheres = '', $orderby = 'id desc', $firstRow = 0, $listRows = 10, $timeout = 1, $host = 'localhost', $port = 9312)
{
    // require_once: a plain require redeclares SphinxClient (fatal error)
    // the second time this function is called in one request.
    require_once C('INTERFACE_PATH') . 'coreseek/api/sphinxapi.php';

    $mem = new Memcache();
    $mem->connect('localhost', 11211);

    $mem_key = 'coreseek_config';
    $config = $mem->get($mem_key);
    if (!$config) {
        $config = (require C('ROOT_SITE_DIR') . 'coreseek_config.php');
        // Expiry values above 30 days are treated by memcached as absolute
        // Unix timestamps, so a bare 86400 * 365 is already in the past and
        // the entry never sticks. Use an absolute timestamp one year ahead.
        $mem->set($mem_key, $config, 0, time() + 86400 * 365);
    }

    // The original chose between two identical branches based on an hour
    // check that can never be true (5 < H < 6); entry 1 is always used.
    $host = $config[1]['host'];
    $port = $config[1]['port'];

    $cl = new SphinxClient();
    $cl->SetServer($host, $port);
    $cl->SetArrayResult(true);
    $cl->SetConnectTimeout($timeout);

    if ($wheres) {
        foreach ($wheres as $where) {
            $cl->SetFilter($where['field'], array($where['value']), $where['status']);
        }
    }

    $cl->SetSortMode(SPH_SORT_EXTENDED, $orderby);
    $cl->SetLimits($firstRow, $listRows);
    $cl->AddQuery($words, $index);

    return $cl->RunQueries();
}
/**
 * Search SPHINX_INDEX for $query on behalf of the current session user.
 *
 * @param string $query  Sphinx query (extended2 syntax).
 * @param int    $offset Offset of the first match.
 * @param int    $limit  Number of matches to return.
 * @return array List of the 'ref_id' attribute of every match; empty when
 *               the query failed or nothing matched.
 */
function sphinx_search($query, $offset = 0, $limit = 30)
{
    require_once 'lib/sphinxapi.php';

    $sphinxClient = new SphinxClient();
    $sphinxClient->SetServer('localhost', 9312);
    $sphinxClient->SetConnectTimeout(1);
    $sphinxClient->SetFieldWeights(array('title' => 70, 'content' => 30, 'feed_title' => 20));
    $sphinxClient->SetMatchMode(SPH_MATCH_EXTENDED2);
    $sphinxClient->SetRankingMode(SPH_RANK_PROXIMITY_BM25);
    $sphinxClient->SetLimits($offset, $limit, 1000);
    $sphinxClient->SetArrayResult(false);
    $sphinxClient->SetFilter('owner_uid', array($_SESSION['uid']));

    $result = $sphinxClient->Query($query, SPHINX_INDEX);

    $ids = array();

    // Query() returns false on failure and may omit 'matches' when nothing
    // was found; check before dereferencing.
    if (is_array($result) && isset($result['matches']) && is_array($result['matches'])) {
        foreach ($result['matches'] as $match) {
            $ids[] = $match['attrs']['ref_id'];
        }
    }

    return $ids;
}
/**
 * Create a fresh SphinxClient and reset the page size.
 *
 * The client points at the server named by the 'sf_sphinx_server' setting
 * on port 3312, with a 1 second connect timeout and array results. As a
 * side effect $this->limit is set to 15.
 *
 * @return SphinxClient
 */
private function resetSphinxClient()
{
    // The original also read the Propel configuration and its DSN here, but
    // never used either value; that lookup has been removed.
    $cl = new SphinxClient();
    $cl->SetServer(sfConfig::get('sf_sphinx_server'), 3312);
    $cl->SetConnectTimeout(1);
    $cl->SetArrayResult(true);

    $this->limit = 15;

    return $cl;
}
/**
 * Does an index search via Sphinx and returns the results
 *
 * If a class named <this class>_hook provides a callable method of the same
 * name, the whole call is delegated to it.
 *
 * @param string $type Search type. Handled types: author, title, series, subject, callnum, tags, reviews, keyword (default)
 * @param string $term Search term/phrase
 * @param int $limit Number of results to return
 * @param int $offset Where to begin result set -- for pagination purposes
 * @param string $sort_opt Sort option (newest, oldest, catalog_newest, catalog_oldest, title, author, top_rated, popular_week, popular_month, popular_year, popular_total, atoz, ztoa). Anything else sorts by weight boosted by hold_count_total
 * @param array $format_array Material codes to filter on; 'all' entries are ignored
 * @param array $location_array Location codes to filter on; 'all' entries are ignored
 * @param array $facet_args String-keyed array of facet parameters. Keys read below: facet_year, facet_decade, facet_lexile, facet_series, facet_lang, age
 * @param boolean $override_search_filter When TRUE, the locum.ini 'no_search' location exclusion is skipped
 * @param mixed $limit_available When truthy, the value to filter 'branches' on
 * @param boolean $show_inactive When FALSE, records with active = 0 are excluded
 * @return array String-keyed result set (term, type, num_hits, facets and, when applicable, results, suggestion, changed)
 */
public function search($type, $term, $limit, $offset, $sort_opt = NULL, $format_array = array(), $location_array = array(), $facet_args = array(), $override_search_filter = FALSE, $limit_available = FALSE, $show_inactive = FALSE)
{
    if (is_callable(array(__CLASS__ . '_hook', __FUNCTION__))) {
        // Plain dynamic instantiation instead of eval().
        $hook_class = __CLASS__ . '_hook';
        $hook = new $hook_class;
        // $show_inactive is now forwarded too; it used to be dropped.
        return $hook->{__FUNCTION__}($type, $term, $limit, $offset, $sort_opt, $format_array, $location_array, $facet_args, $override_search_filter, $limit_available, $show_inactive);
    }

    require_once $this->locum_config['sphinx_config']['api_path'] . '/sphinxapi.php';
    // NOTE(review): $db is not used anywhere in this method; kept because
    // removing the connect call could change side effects - confirm and drop.
    $db =& MDB2::connect($this->dsn);

    // Locals that were previously only assigned on some code paths.
    $final_result_set = array();
    $forcedchange = '';
    $term_prestrip = '';

    $term_arr = explode('?', trim(preg_replace('/\\//', ' ', $term)));
    $term = trim($term_arr[0]);

    if ($term == '*' || $term == '**') {
        $term = '';
    } else {
        $term_prestrip = $term;
        //$term = preg_replace('/[^A-Za-z0-9*\- ]/iD', '', $term);
        $term = preg_replace('/\\*\\*/', '*', $term); //fix for how iii used to do wildcards
    }
    $final_result_set['term'] = $term;
    $final_result_set['type'] = trim($type);

    $cl = new SphinxClient();
    $cl->SetServer($this->locum_config['sphinx_config']['server_addr'], (int) $this->locum_config['sphinx_config']['server_port']);

    // Defaults to 'keyword', non-boolean
    $bool = FALSE;
    $cl->SetMatchMode(SPH_MATCH_ALL);

    if (!$term) {
        // Searches for everything (usually for browsing purposes--Hot/New Items, etc..)
        $cl->SetMatchMode(SPH_MATCH_EXTENDED2);
    } else {
        $picturebook = array('picturebook', 'picture book');
        $picbk_search = '(@callnum ^E)';
        $term = str_ireplace($picturebook, $picbk_search, $term);

        if ($type == 'keyword') {
            // Custom fiction and non-fiction search
            $nonfic_search = ' (@callnum "0*" | @callnum "1*" | @callnum "2*" | @callnum "3*" | @callnum "4*" | @callnum "5*" | @callnum "6*" | @callnum "7*" | @callnum "8*" | @callnum "9*")';
            $fiction_search = ' (@title fiction | @subjects fiction | @callnum mystery | @callnum fantasy | @callnum fiction | @callnum western | @callnum romance)';
            // All three checks are case-insensitive, matching the
            // str_ireplace() calls. With the former case-sensitive strpos(),
            // "Non-fiction" skipped the non-fiction branch and was then
            // treated as a fiction search.
            if (stripos($term, 'nonfiction') !== FALSE) {
                $term = '@@relaxed ' . str_ireplace('nonfiction', '', $term) . $nonfic_search;
            } elseif (stripos($term, 'non-fiction') !== FALSE) {
                $term = '@@relaxed ' . str_ireplace('non-fiction', '', $term) . $nonfic_search;
            } elseif (stripos($term, 'fiction') !== FALSE) {
                $term = '@@relaxed ' . str_ireplace('fiction', '', $term) . $fiction_search;
            }
        }

        // Is it a boolean search?
        if (preg_match("/ \\| /i", $term) || preg_match("/ \\-/i", $term) || preg_match("/ \\!/i", $term)) {
            $cl->SetMatchMode(SPH_MATCH_BOOLEAN);
            $bool = TRUE;
        }
        if (preg_match("/ OR /i", $term)) {
            $cl->SetMatchMode(SPH_MATCH_BOOLEAN);
            $term = preg_replace('/ OR /i', ' | ', $term);
            $bool = TRUE;
        }

        // Is it a phrase search?
        if (preg_match("/\"/i", $term) || preg_match("/\\@/i", $term)) {
            $cl->SetMatchMode(SPH_MATCH_EXTENDED2);
            $bool = TRUE;
        }
    }

    // Set up for the various search types
    switch ($type) {
        case 'author':
            $cl->SetFieldWeights(array('author' => 50, 'addl_author' => 30));
            $idx = 'bib_items_author';
            break;
        case 'title':
            $cl->SetFieldWeights(array('title' => 50, 'title_medium' => 50, 'series' => 30));
            $idx = 'bib_items_title';
            break;
        case 'series':
            $cl->SetFieldWeights(array('title' => 5, 'series' => 80));
            $idx = 'bib_items_title';
            break;
        case 'subject':
            $idx = 'bib_items_subject';
            break;
        case 'callnum':
            $cl->SetFieldWeights(array('callnum' => 100));
            $idx = 'bib_items_callnum';
            //$cl->SetMatchMode(SPH_MATCH_ANY);
            break;
        case 'tags':
            $cl->SetFieldWeights(array('tag_idx' => 100));
            $idx = 'bib_items_tags';
            //$cl->SetMatchMode(SPH_MATCH_PHRASE);
            break;
        case 'reviews':
            $cl->SetFieldWeights(array('review_idx' => 100));
            $idx = 'bib_items_reviews';
            break;
        case 'keyword':
        default:
            $cl->SetFieldWeights(array('title' => 400, 'title_medium' => 30, 'author' => 70, 'addl_author' => 40, 'tag_idx' => 25, 'series' => 25, 'review_idx' => 10, 'notes' => 10, 'subjects' => 5));
            $idx = 'bib_items_keyword';
            break;
    }

    // Filter out the records we don't want shown, per locum.ini
    if (!$override_search_filter) {
        if (trim($this->locum_config['location_limits']['no_search'])) {
            $cfg_filter_vals = array();
            $cfg_filter_arr = $this->csv_parser($this->locum_config['location_limits']['no_search']);
            foreach ($cfg_filter_arr as $cfg_filter) {
                $cfg_filter_vals[] = $this->string_poly($cfg_filter);
            }
            if (count($cfg_filter_vals)) {
                $cl->SetFilter('loc_code', $cfg_filter_vals, TRUE);
            }
        }
    }

    // Sort order. Default is relevance boosted by total hold count.
    switch ($sort_opt) {
        case 'newest':
            $cl->SetSortMode(SPH_SORT_EXTENDED, 'pub_year DESC, @relevance DESC');
            break;
        case 'oldest':
            $cl->SetSortMode(SPH_SORT_EXTENDED, 'pub_year ASC, @relevance DESC');
            break;
        case 'catalog_newest':
            $cl->SetSortMode(SPH_SORT_EXTENDED, 'bib_created DESC, @relevance DESC');
            break;
        case 'catalog_oldest':
            $cl->SetSortMode(SPH_SORT_EXTENDED, 'bib_created ASC, @relevance DESC');
            break;
        case 'title':
            $cl->SetSortMode(SPH_SORT_ATTR_ASC, 'title_ord');
            break;
        case 'author':
            $cl->SetSortMode(SPH_SORT_EXTENDED, 'author_null ASC, author_ord ASC');
            break;
        case 'top_rated':
            $cl->SetSortMode(SPH_SORT_ATTR_DESC, 'rating_idx');
            break;
        case 'popular_week':
            $cl->SetSortMode(SPH_SORT_ATTR_DESC, 'hold_count_week');
            break;
        case 'popular_month':
            $cl->SetSortMode(SPH_SORT_ATTR_DESC, 'hold_count_month');
            break;
        case 'popular_year':
            $cl->SetSortMode(SPH_SORT_ATTR_DESC, 'hold_count_year');
            break;
        case 'popular_total':
            $cl->SetSortMode(SPH_SORT_ATTR_DESC, 'hold_count_total');
            break;
        case 'atoz':
            $cl->SetSortMode(SPH_SORT_ATTR_ASC, 'title_ord');
            break;
        case 'ztoa':
            $cl->SetSortMode(SPH_SORT_ATTR_DESC, 'title_ord');
            break;
        default:
            $cl->SetSortMode(SPH_SORT_EXPR, "@weight + (hold_count_total)*0.02");
            break;
    }

    // Filter by material types
    if (is_array($format_array)) {
        // Initialised up front: count() on an undefined variable is a
        // TypeError on PHP 8 when every entry is 'all' or the list is empty.
        $filter_arr_mat = array();
        foreach ($format_array as $format) {
            if (strtolower($format) != 'all') {
                $filter_arr_mat[] = $this->string_poly(trim($format));
            }
        }
        if (count($filter_arr_mat)) {
            $cl->SetFilter('mat_code', $filter_arr_mat);
        }
    }

    // Filter by location
    if (is_array($location_array) && count($location_array)) {
        $filter_arr_loc = array();
        foreach ($location_array as $location) {
            if (strtolower($location) != 'all') {
                $filter_arr_loc[] = $this->string_poly(trim($location));
            }
        }
        if (count($filter_arr_loc)) {
            $cl->SetFilter('loc_code', $filter_arr_loc);
        }
    }

    // Facet filters. !empty() is used throughout because $facet_args
    // defaults to an empty array, so none of these keys is guaranteed.

    // Filter by pub_year
    if (!empty($facet_args['facet_year'])) {
        if (strpos($facet_args['facet_year'][0], '-') !== FALSE) {
            // "min-max" range; a missing or zero bound falls back to 1 / 9999.
            $min_year = 1;
            $max_year = 9999;
            $args = explode('-', $facet_args['facet_year'][0]);
            $min_arg = (int) $args[0];
            $max_arg = (int) $args[1];
            if ($min_arg && $min_arg > $min_year) {
                $min_year = $min_arg;
            }
            if ($max_arg && $max_arg < $max_year) {
                $max_year = $max_arg;
            }
            $cl->setFilterRange('pub_year', $min_year, $max_year);
        } else {
            $cl->SetFilter('pub_year', $facet_args['facet_year']);
        }
    }

    // Filter by pub_decade
    if (!empty($facet_args['facet_decade'])) {
        $cl->SetFilter('pub_decade', $facet_args['facet_decade']);
    }

    // Filter by lexile
    if (!empty($facet_args['facet_lexile'])) {
        $cl->SetFilter('lexile', $facet_args['facet_lexile']);
    }

    // Filter by Series
    if (!empty($facet_args['facet_series']) && is_array($facet_args['facet_series'])) {
        foreach ($facet_args['facet_series'] as &$facet_series) {
            $facet_series = $this->string_poly($facet_series);
        }
        unset($facet_series); // break the reference left behind by foreach
        $cl->SetFilter('series_attr', $facet_args['facet_series']);
    }

    // Filter by Language
    if (!empty($facet_args['facet_lang']) && is_array($facet_args['facet_lang'])) {
        foreach ($facet_args['facet_lang'] as &$facet_lang) {
            $facet_lang = $this->string_poly($facet_lang);
        }
        unset($facet_lang); // break the reference left behind by foreach
        $cl->SetFilter('lang', $facet_args['facet_lang']);
    }

    // Filter inactive records
    if (!$show_inactive) {
        $cl->SetFilter('active', array('0'), TRUE);
    }

    // Filter by age
    if (!empty($facet_args['age']) && is_array($facet_args['age'])) {
        foreach ($facet_args['age'] as $age_facet) {
            $cl->SetFilter('ages', array($this->string_poly($age_facet)));
        }
    }

    // Filter by availability
    if ($limit_available) {
        $cl->SetFilter('branches', array($this->string_poly($limit_available)));
    }

    $cl->SetRankingMode(SPH_RANK_SPH04);

    $proximity_check = $cl->Query($term, $idx); // Quick check on number of results

    // If original match didn't return any results, try a proximity search
    if (empty($proximity_check['matches']) && $bool == FALSE && $term != "*" && $type != "tags") {
        $term = '"' . $term . '"/1';
        $cl->SetMatchMode(SPH_MATCH_EXTENDED);
        $forcedchange = 'yes';
    }

    // Paging/browsing through the result set.
    $sort_limit = 2000;
    if ($offset + $limit > $sort_limit) {
        $sort_limit = $offset + $limit;
    }
    $cl->SetLimits((int) $offset, (int) $limit, (int) $sort_limit);

    // And finally.... we search. (Query 0 of the batch is the result page.)
    $cl->AddQuery($term, $idx);

    // CREATE FACETS
    $cl->SetLimits(0, 1000); // Up to 1000 facets
    $cl->SetArrayResult(TRUE); // Allow duplicate documents in result, for facet grouping

    $cl->SetGroupBy('pub_year', SPH_GROUPBY_ATTR);
    $cl->AddQuery($term, $idx);
    $cl->ResetGroupBy();

    $cl->SetGroupBy('pub_decade', SPH_GROUPBY_ATTR);
    $cl->AddQuery($term, $idx);
    $cl->ResetGroupBy();

    $cl->SetGroupBy('mat_code', SPH_GROUPBY_ATTR, '@count desc');
    $cl->AddQuery($term, $idx);
    $cl->ResetGroupBy();

    $cl->SetGroupBy('branches', SPH_GROUPBY_ATTR, '@count desc');
    $cl->AddQuery($term, $idx);
    $cl->ResetGroupBy();

    $cl->SetGroupBy('ages', SPH_GROUPBY_ATTR, '@count desc');
    $cl->AddQuery($term, $idx);
    $cl->ResetGroupBy();

    $cl->SetGroupBy('lang', SPH_GROUPBY_ATTR, '@count desc');
    $cl->AddQuery($term, $idx);
    $cl->ResetGroupBy();

    $cl->SetGroupBy('series_attr', SPH_GROUPBY_ATTR, '@count desc');
    $cl->AddQuery($term, $idx);
    $cl->ResetGroupBy();

    $cl->SetGroupBy('lexile', SPH_GROUPBY_ATTR);
    $cl->AddQuery($term, $idx);
    $cl->ResetGroupBy();

    $results = $cl->RunQueries();

    // Include descriptors
    $final_result_set['num_hits'] = $results[0]['total_found'];
    if ($results[0]['total'] <= $this->locum_config['api_config']['suggestion_threshold'] || $forcedchange == 'yes') {
        if ($this->locum_config['api_config']['use_yahoo_suggest'] == TRUE) {
            $final_result_set['suggestion'] = $this->yahoo_suggest($term_prestrip);
        }
    }

    // Pull full records out of Couch
    if ($final_result_set['num_hits']) {
        $bib_hits = array();
        // 'matches' can be absent even when total_found is non-zero
        // (for example an offset past the end of the result set).
        if (!empty($results[0]['matches'])) {
            foreach ($results[0]['matches'] as $match) {
                $bib_hits[] = (string) $match['id'];
            }
        }
        $final_result_set['results'] = $this->get_bib_items_arr($bib_hits);
        foreach ($final_result_set['results'] as &$result) {
            $result = $result['value'];
            if ($result['bnum']) {
                // Get availability (Only cached)
                $result['status'] = $this->get_item_status($result['bnum'], FALSE, TRUE);
            }
        }
        unset($result); // break the reference left behind by foreach
    }

    $final_result_set['facets'] = $this->sphinx_facetizer($results);
    if ($forcedchange == 'yes') {
        $final_result_set['changed'] = 'yes';
    }

    return $final_result_set;
}
case 'MD5_16': $keyToSearch = substr(md5($getKey), 8, 16); break; case 'MD5_32': $keyToSearch = md5($getKey); break; case 'Normal': $keyToSearch = $getKey; break; default: ShowError('ಥ_ಥ,出错啦!!!', 'javascript:closeWindow()', '关闭'); } $sp = new SphinxClient(); $sp->SetServer('10.211.55.14', 9312); //设置spinx的服务器地址和端口 $sp->SetArrayResult(true); //设置 显示结果集方式 $sp->SetLimits(0, 1000); //同sql语句中的LIMIT $sp->SetSortMode(SPH_SORT_RELEVANCE); //设置默认按照相关性排序 $sp->SetMatchMode($mod); if ($keyToSearch != " ") { // 如果关键字为空 不执行 否则程序出错 $result = $sp->Query($keyToSearch, "*"); } //执行搜索 $count = $result['total']; //计算一共多少页 // $pn=(ceil($count / 10)); if (is_array($result['matches'])) {
/**
 * Renders the "manage content category" form.
 *
 * Resolves the selected source category to its level-1/2/3 ids, counts the
 * items that match the keyword (via Sphinx) and/or the source category,
 * builds the source and destination category drop-down lists and hands
 * everything to the "ManageContentCategory" template.
 *
 * Request parameters read: searchKeyword, sourceCategories, desCategories.
 */
function draw()
{
    global $display;

    //$tbl_source = "category_bk";
    $tbl_source = "category";

    $keywords = AZLib::getParam('searchKeyword');
    $src_catid = (int) Url::get('sourceCategories');
    $src_l1_catid = 0;
    $src_l2_catid = 0;
    $src_l3_catid = 0;

    if ($src_catid) {
        // Validate the source category and work out which level it sits on.
        $src_cat = DB::select("{$tbl_source}", "id={$src_catid}");
        if ($src_cat) {
            if ($src_cat['parent_id']) {
                // Fetch the PARENT row. The previous code re-selected the
                // category itself, so every child category looked like level 3.
                $src_cat_parent = DB::select("{$tbl_source}", "id=" . (int) $src_cat['parent_id']);
                if ($src_cat_parent && $src_cat_parent['parent_id']) {
                    // Level-3 category: the parent has a parent of its own.
                    $src_l1_catid = (int) $src_cat_parent['parent_id'];
                    $src_l2_catid = (int) $src_cat['parent_id'];
                    $src_l3_catid = $src_catid;
                } else {
                    // Level-2 category (also used when the parent row is missing).
                    $src_l1_catid = (int) $src_cat['parent_id'];
                    $src_l2_catid = $src_catid;
                }
            } else {
                // Level-1 category.
                $src_l1_catid = $src_catid;
            }
        }
    }

    $des_catid = (int) AZLib::getParam('desCategories');
    $total = 0;

    if ($keywords) {
        // Keyword search through Sphinx.
        $cl = new SphinxClient();
        $cl->SetServer(SPHINX_SERVER, SPHINX_PORT);
        $cl->SetConnectTimeout(1);
        // Use the public API instead of writing the client's private fields.
        $cl->SetLimits(0, 50000, 50000);
        $cl->SetWeights(array(100, 1));
        $cl->SetMatchMode(SPH_MATCH_ALL);
        if ($src_l2_catid) {
            $cl->SetFilter('category_id', array($src_catid));
        } elseif ($src_l1_catid) {
            $cl->SetFilter('level_1_catid', array($src_catid));
        }
        //$cl->SetLimits( $offset , $limit, 10000 );
        $cl->SetRankingMode(SPH_RANK_PROXIMITY_BM25);
        $cl->SetArrayResult(true);
        $res = $cl->Query($keywords, SPHINX_INDEX);

        if ($res && isset($res["matches"]) && is_array($res["matches"])) {
            $matchedIds = array();
            foreach ($res["matches"] as $match) {
                $matchedIds[] = $match['id'];
            }
            $itemIDs = implode(',', $matchedIds);

            if ($itemIDs != '') {
                // Re-count against the database to get the exact number of rows.
                $sql = 'SELECT count(*) AS totalItem FROM item WHERE id IN(' . $itemIDs . ')';
                if ($src_catid) {
                    if ($src_l3_catid) {
                        // Keyword search restricted to a level-3 category.
                        $sql .= ' AND category_id = ' . $src_l3_catid;
                    } elseif ($src_l2_catid) {
                        // Keyword search restricted to a level-2 category.
                        $sql .= ' AND level_2_catid = ' . $src_l2_catid;
                    } elseif ($src_l1_catid) {
                        $sql .= ' AND level_1_catid = ' . $src_l1_catid;
                    }
                }
                if ($des_catid) {
                    $sql .= ' AND category_id != ' . $des_catid;
                }
                $re = DB::Query($sql);
                if ($re) {
                    $row = mysql_fetch_assoc($re);
                    $total += (int) $row['totalItem'];
                }
                $display->add('itemids', $itemIDs);
            }
        }
    } elseif ($src_catid) {
        // No keyword: count everything inside the selected source category.
        $sql = "SELECT count(*) AS itemTotal FROM item";
        if ($src_l3_catid) {
            $sql .= ' WHERE category_id = ' . $src_l3_catid;
        } elseif ($src_l2_catid) {
            // NOTE(review): was `level_3_category_id`; aligned with the column the
            // keyword query above uses for level-2 ids - confirm against the schema.
            $sql .= ' WHERE level_2_catid = ' . $src_l2_catid;
        } elseif ($src_l1_catid) {
            $sql .= ' WHERE level_1_catid = ' . $src_l1_catid;
        }
        $re = DB::query($sql);
        if ($re) {
            $row = mysql_fetch_assoc($re);
            $total = $row['itemTotal'];
        }
    }

    $this->beginForm();

    // Build the source category list (levels 1 and 2 only).
    $cat_search_name = '';
    $re = DB::query("SELECT id,name,parent_id ,position,status FROM {$tbl_source} ORDER BY parent_id,position");
    $all_cats = array();
    $all_subcats = array();
    if ($re) {
        while ($cat = mysql_fetch_assoc($re)) {
            if ($cat['parent_id']) {
                // Keep only children whose parent is an already-seen top-level category.
                if (isset($all_cats[$cat['parent_id']]) && $all_cats[$cat['parent_id']]['parent_id'] == 0) {
                    $all_subcats[$cat['parent_id']][$cat['id']] = $cat;
                }
            } else {
                if (!isset($all_subcats[$cat['id']])) {
                    $all_subcats[$cat['id']] = array();
                }
            }
            $all_cats[$cat['id']] = $cat;
        }
    }

    $all_top_cat = array();
    $all_top_cat[0] = 'Tất cả các danh mục';
    foreach ($all_subcats as $topid => $subcats) {
        if ($src_catid && $src_catid == $topid) {
            $cat_search_name = $all_cats[$topid]['name'];
        }
        if ($all_cats[$topid]['status'] == 'HIDE') {
            $all_cats[$topid]['name'] .= ' (ẨN)';
        }
        $all_top_cat[$topid] = $all_cats[$topid]['name'];
        foreach ($subcats as $subcat) {
            if ($src_catid && $src_catid == $subcat['id']) {
                $cat_search_name = $subcat['name'];
            }
            if ($subcat['status'] == 'HIDE') {
                $subcat['name'] .= ' (ẨN)';
            }
            $all_top_cat[$subcat['id']] = " - " . $subcat['name'];
        }
    }
    //print_r($all_top_cat);
    $display->add('msg', $this->showFormSuccesMessages(1));
    $display->add('sourceCategories', $all_top_cat);

    // Build the destination category list (levels 1, 2 and 3).
    $re = DB::query("SELECT id,name,parent_id,status,position FROM category ORDER BY parent_id,position");
    $all_cats = array();
    $all_subcats = array();
    $level1_cats = array();
    $level2_cats = array();
    $level3_cats = array();
    if ($re) {
        while ($cat = mysql_fetch_assoc($re)) {
            if ($cat['parent_id']) {
                // Level-2 or level-3 category.
                if (isset($all_cats[$cat['parent_id']]) && $all_cats[$cat['parent_id']]['parent_id'] == 0) {
                    // Level 2: the parent is a top-level category.
                    $all_subcats[$cat['parent_id']][$cat['id']] = $cat;
                    $cat['max'] = 0;
                    // Track the highest child position seen under the parent.
                    if ($cat['position'] > $level1_cats[$cat['parent_id']]['max']) {
                        $level1_cats[$cat['parent_id']]['max'] = $cat['position'];
                    }
                    $level2_cats[$cat['id']] = $cat;
                } else {
                    // Level 3: indexed as [level-1 id][level-2 id][own id].
                    if ($cat['position'] > $level2_cats[$cat['parent_id']]['max']) {
                        $level2_cats[$cat['parent_id']]['max'] = $cat['position'];
                    }
                    $level3_cats[$all_cats[$cat['parent_id']]['parent_id']][$cat['parent_id']][$cat['id']] = $cat;
                }
            } else {
                $cat['max'] = 0;
                $level1_cats[$cat['id']] = $cat;
                if (!isset($all_subcats[$cat['id']])) {
                    $all_subcats[$cat['id']] = array();
                }
            }
            $all_cats[$cat['id']] = $cat;
        }
    }

    $all_top_cat = array();
    $categories = array();
    foreach ($all_subcats as $topid => $subcats) {
        if ($all_cats[$topid]['status'] == 'HIDE') {
            $all_cats[$topid]['name'] .= ' (ẨN)';
        }
        $categories[$topid] = $all_cats[$topid];
        $all_top_cat[$topid] = $all_cats[$topid]['name'];
        foreach ($subcats as $subcat) {
            if ($subcat['status'] == 'HIDE') {
                $subcat['name'] .= ' (ẨN)';
            }
            $all_top_cat[$subcat['id']] = " - " . $subcat['name'];
            $categories[$subcat['id']] = $subcat;
            // A non-zero 'max' means at least one level-3 child was recorded.
            if (isset($level2_cats[$subcat['id']]) && $level2_cats[$subcat['id']]['max']) {
                $subcatsl3 = $level3_cats[$subcat['parent_id']][$subcat['id']];
                foreach ($subcatsl3 as $subcatl3) {
                    if ($subcatl3['status'] == 'HIDE') {
                        $subcatl3['name'] .= ' (ẨN)';
                    }
                    $all_top_cat[$subcatl3['id']] = " + " . $subcatl3['name'];
                    // Expose the full ancestry as "level-2 id,level-1 id" in the JSON.
                    $subcatl3['parent_id'] .= ',' . $subcat['parent_id'];
                    $categories[$subcatl3['id']] = $subcatl3;
                }
            }
        }
    }

    $display->add('desCategories', $all_top_cat);
    $display->add('desJSONCategories', json_encode($categories));
    $display->add("allrecord", $total);
    $display->add('keywords', $keywords);
    $display->add('cat_search_id', $src_catid);
    $display->add('cat_search_name', $cat_search_name);
    $display->add('category_id', $des_catid);
    $display->output("ManageContentCategory");
    $this->endForm();
}
/**
 * Search-and-download page.
 *
 * Adds the breadcrumb for the requested media type, runs the user's query
 * against Sphinx (restricted to published files the current user's level and
 * group may see), loads the matching Files records and publishes the result
 * window and pagination data to the view.
 */
function actionIndex()
{
    $this->_pathway->addStep('检索下载');

    // Breadcrumb label for each known media type code; the codes are compared
    // loosely, in ascending order. Anything else is normalised to 0.
    $crumbByType = array(
        1 => '视频资料',
        2 => '音频资料',
        3 => '图片资料',
        4 => '富媒体资料',
    );
    $type = $this->_context->type;
    $recognised = false;
    foreach ($crumbByType as $code => $crumb) {
        if ($type == $code) {
            $this->_pathway->addStep($crumb);
            $recognised = true;
            break;
        }
    }
    if (!$recognised) {
        $type = 0;
    }
    $this->_view['type'] = $type;

    // Sphinx client library and connection settings come from the app ini.
    require Q::ini('appini/search/sphinxApi');
    $host = Q::ini('appini/search/sphinxHost');
    $port = Q::ini('appini/search/sphinxPort');
    $limit = Q::ini('appini/search/sphinxLimit');

    $currentUser = $this->_view['currentUser'];
    $level = $currentUser['level_id'];
    $group_id = $currentUser['group_id'];

    $page = intval($this->_context->page);
    if ($page < 1) {
        $page = 1;
    }
    $firstRow = ($page - 1) * $limit;

    $query = $this->_context->query;
    $this->_view['query'] = $query;

    $s = new SphinxClient();
    $s->SetServer($host, $port);
    $s->SetConnectTimeout(10);
    $s->SetWeights(array(100, 1));
    if ($type >= 1 && $type <= 4) {
        $s->SetFilter('type', array($type));
    }
    // Status codes: 0 new, 1 awaiting review, 2 published, 3 rejected, 4 deleted.
    $s->SetFilter('status', array(2));
    $s->SetFilterRange('level', 0, $level);
    $s->SetLimits($firstRow, $limit, 1000);
    $s->SetArrayResult(true);
    // Extended match mode: the query uses Sphinx's own query language.
    $s->SetMatchMode(SPH_MATCH_EXTENDED);
    $s->SetSortMode(SPH_SORT_EXPR, '@id');

    $result = $s->Query("{$query} @groups '(,{$group_id},)|(all)'");
    if (!$result) {
        return;
    }

    // Load the matched file records.
    if (isset($result['matches'])) {
        $ids = array();
        foreach ($result['matches'] as $match) {
            $ids[] = $match['id'];
        }
        $this->_view['files'] = Files::find('id in (?)', $ids)->order('id desc')->getAll();
    }

    // 1-based window of rows shown on this page, clamped to the total.
    if ($firstRow + 1 > $result['total']) {
        $result['start'] = $result['total'];
    } else {
        $result['start'] = $firstRow + 1;
    }
    if ($result['start'] + $limit - 1 > $result['total']) {
        $result['end'] = $result['total'];
    } else {
        $result['end'] = $result['start'] + $limit - 1;
    }
    $this->_view['result'] = $result;

    // Pagination controls.
    $pagination = array();
    $pagination['record_count'] = $result['total'];
    $pagination['page_count'] = ceil($result['total'] / $limit);
    $pagination['first'] = 1;
    $pagination['last'] = $pagination['page_count'];
    if ($pagination['last'] < $pagination['first']) {
        $pagination['last'] = $pagination['first'];
    }

    // Pull an out-of-range page number back inside [first, last].
    if ($page >= $pagination['page_count'] + 1) {
        $page = $pagination['last'];
    }
    if ($page < 1) {
        $page = $pagination['first'];
    }

    $pagination['next'] = $page < $pagination['last'] - 1 ? $page + 1 : $pagination['last'];
    $pagination['prev'] = $page > 1 ? $page - 1 : $pagination['first'];
    $pagination['current'] = $page;
    $pagination['page_size'] = $limit;
    $pagination['page_base'] = 1;
    $this->_view['pagination'] = $pagination;
}
//$sphinx_index = 'media'; //Sphinx 搜索 header("content-type:application/json"); require_once '../tools/db.php'; require_once '../tools/main.php'; include_once "../tools/sphinxapi.php"; if (isset($_REQUEST["number"]) && intval($_REQUEST["number"]) > 9) { $number = $_REQUEST["number"]; } else { $number = 9; } $pageNum = isset($_REQUEST["page"]) ? intval($_REQUEST["page"]) : 0; $mdb = new MeekroDB(DB_HOST, DB_USERNAME, DB_PASSWORD, DB_TABLE_NAME, DB_PORT, DB_CHARSET); $sphinx = new SphinxClient(); $sphinx->SetServer(SPHINX_HOST, SPHINX_PORT); $sphinx->SetArrayResult(true); $sphinx->SetLimits($pageNum * $number, $number, 5000); $sphinx->SetMaxQueryTime(10); $sphinx->SetMatchMode(SPH_MATCH_EXTENDED2); $sphinx->SetFilter('enabled', array(1)); if (isset($_REQUEST["type"])) { $r1 = $mdb->queryFirstRow("SELECT id, name FROM media_type WHERE name=%s", $_REQUEST["type"]); $type = $r1["id"]; //set type if ($type == "") { echo json_encode(array("result" => null, "status" => false, "error" => "请求的类型不存在")); exit; } $sphinx->SetFilter('type', array($type)); } if (isset($_REQUEST['language'])) {
/**
 * Keyword search page.
 *
 * Runs the "kw" argument against every Sphinx index, sorted according to
 * "px" (1 = ctime, 2 = length, 3 = click; anything else falls back to ctime),
 * loads the film records for the requested page (15 per page) and renders
 * "<tpl>/search.html".
 *
 * View variables set: sjresults, total_found, time, results, page, pages,
 * px, arr.
 */
function search()
{
    spAddViewFunction('kred', 'SearchReplaceKw');

    $perPage = 15;
    $kw = urldecode($this->spArgs("kw", ""));
    // Anything that is not a positive integer is treated as page 1.
    $page = max(1, (int) $this->spArgs("page", "1"));
    $px = $this->spArgs("px", "1");

    $cl = new SphinxClient();
    $cl->SetServer('127.0.0.1', 9312);
    $cl->SetArrayResult(true);
    $cl->SetLimits(0, 150000);

    if ($px == "2") {
        $sortBy = "length DESC";
    } elseif ($px == "3") {
        $sortBy = "click DESC";
    } else {
        // "1" and every unknown value sort by creation time.
        $sortBy = "ctime DESC";
    }
    $cl->SetSortMode(SPH_SORT_EXTENDED, $sortBy);

    // Query() returns false on failure; treat that as an empty result set
    // instead of indexing into a boolean.
    $res = $cl->Query("{$kw}", "*");
    if (!is_array($res)) {
        $res = array();
    }
    $total_found = isset($res['total_found']) ? (int) $res['total_found'] : 0;
    $time = isset($res['time']) ? $res['time'] : null;
    $matches = (isset($res['matches']) && is_array($res['matches'])) ? $res['matches'] : array();

    // ceil(), not floor(): a trailing partial page must be reachable too.
    $pages = (int) ceil($total_found / $perPage);

    $dbfilm = spClass('dbfilm');

    // Load exactly the matches that belong to this page. Slicing avoids the
    // earlier off-by-one loops, which overlapped pages and looked up
    // non-existent match slots with an empty id.
    $arr = array();
    foreach (array_slice($matches, ($page - 1) * $perPage, $perPage) as $match) {
        $arr[] = $dbfilm->find(array("id" => (string) $match['id']));
    }

    // The old code assigned an undefined variable here; keep the view
    // property defined for templates that reference it.
    $this->sjresults = null;
    $this->total_found = $total_found;
    $this->time = $time;
    $this->results = $kw;
    $this->page = $page;
    $this->pages = $pages;
    $this->px = $px;
    $this->arr = $arr;

    // NOTE(review): "tpl" comes from the request and is interpolated into the
    // template path unchecked - consider restricting it to a whitelist.
    $tpl = $this->spArgs("tpl", "template");
    $this->display("{$tpl}/search.html");
}
/**
 * Filter by abbreviations.
 *
 * AJAX endpoint: cleans the search string, looks the words up in the Sphinx
 * "publication" index (first requiring all words, then falling back to any
 * word) and renders the enabled matches as a list of id/name pairs.
 * Events are returned when the "type" query parameter is "event";
 * publications are returned for every other value.
 *
 * Earlier revisions also built highlight, drug, standards and bookmark data
 * here; none of it reached the rendered template, so it is no longer computed.
 *
 * @Route("/ajax/abbr/{string}", name="ajax_abbr", defaults = {"string" = null})
 *
 * @param Request     $request Current request; reads string, type, order, page and p.
 * @param string|null $string  Search string from the route, if any.
 *
 * @return mixed Whatever render() returns for the JSON (or error) template.
 */
public function letterForAbbriviature(Request $request, $string = null)
{
    if (!$string) {
        $string = $request->query->get('string');
    }
    $type = $request->query->has('type') ? $request->query->get('type') : 'publication';
    $order = $request->query->get('order', '') == 'relevant' ? 'relevant' : 'created';
    //$order = $request->query->get('order', '') == 'created' ? 'created' : 'relevant';
    $page = $request->query->has('page') ? $request->query->get('page') : $request->query->get('p', 1);
    $page = intval($page);

    # strip everything except letters and whitespace, then collapse whitespace
    $string = preg_replace('/[^a-zа-я\\s]/iu', ' ', $string);
    $string = preg_replace('/\\s+/iu', ' ', $string);

    if ($page < 1) {
        throw $this->createNotFoundException('Incorrect page number: ' . $page);
    }

    # remove characters that are not allowed in the query
    $string = preg_replace('/[^a-zа-я0-9-, :\\.\\(\\)]/iu', '', $string);
    $string = preg_replace('/[,:\\.\\(\\)]/', ' ', $string);

    # make sure there is something to search for
    if (mb_strlen(trim($string), 'utf-8') < 2) {
        return $this->render('EvrikaMainBundle:Search:search_error.html.twig');
    }

    # stem the words unless the string contains capitals (likely proper names)
    if (!preg_match('/[A-Z]/', $string) && !preg_match('/[А-Я]/u', $string)) {
        $string = $this->get('evrika.lingua_stem')->stem_string($string);
    }

    # split into words, dropping empty pieces: an empty piece would turn into
    # a bare "*" token in the Sphinx query
    $words = preg_split('/\\s+/u', trim($string), -1, PREG_SPLIT_NO_EMPTY);
    if (empty($words)) {
        return $this->render('EvrikaMainBundle:Search:search_error.html.twig');
    }

    # Sphinx client; searchd must be listening on port 9312
    $s = new \SphinxClient();
    $s->SetServer("localhost", 9312);
    //$s->SetRankingMode(SPH_RANK_PROXIMITY);
    $s->SetMatchMode(SPH_MATCH_EXTENDED2);
    $s->SetArrayResult(true);
    $s->SetLimits(($page - 1) * self::SEARCH_PER_PAGE, self::SEARCH_PER_PAGE);

    if ($order == 'created') {
        $s->setSortMode(SPH_SORT_EXTENDED, 'created DESC');
    } else {
        $s->SetFieldWeights(array('title' => 10, 'shortText' => 3, 'body' => 1));
        # The mode must be the SPH_SORT_EXTENDED constant; it used to be passed
        # as a quoted string, which is not a valid sort mode.
        # NOTE(review): confirm the index really has a "mydate" attribute.
        $s->SetSortMode(SPH_SORT_EXTENDED, '@weight desc, mydate desc, @id asc');
    }

    # every word gets a trailing wildcard; "&" requires all words, "|" any word
    $queryAll = implode('* &', $words) . '*';
    $queryAny = implode('* |', $words) . '*';

    $isEvent = $type == 'event';
    $sphinxType = $isEvent ? 'event' : 'publication';

    # Only the search that feeds the response is executed. Each search builds
    # its own all-words query, so the any-word fallback of one type can no
    # longer leak into the first attempt of the other.
    $found = $s->Query("@(title,shortText,body) {$queryAll} & @type={$sphinxType}", 'publication');
    if (!isset($found['matches'])) {
        # nothing matched every word - retry with any of the words
        $found = $s->Query("@(title,shortText,body) {$queryAny} & @type={$sphinxType}", 'publication');
    }

    # surface a Sphinx error as a 404, as before
    $error = $s->GetLastError();
    if (!empty($error)) {
        throw $this->createNotFoundException($error);
    }

    # load the enabled entities for the ids returned by Sphinx
    $return = array();
    if (!empty($found['matches'])) {
        $em = $this->getDoctrine()->getManager();
        $repository = $em->getRepository($isEvent ? 'EvrikaMainBundle:Event' : 'EvrikaMainBundle:Publication');
        foreach ($found['matches'] as $match) {
            # event documents are indexed with their id shifted by 1000000
            $entityId = $isEvent ? $match['id'] - 1000000 : $match['id'];
            $entity = $repository->findEnabledById($entityId);
            if ($entity) {
                $return[] = array('id' => $entity->getId(), 'name' => $entity->getTitle());
            }
        }
    }

    return $this->render('EvrikaMainBundle:Abbreviation:ajax.json.twig', array('data' => $return));
}
/**
 * Site search page.
 *
 * Without a "q" parameter the plain search form is shown. Otherwise the
 * keyword is cleaned, stored in the search-history cookie and looked up
 * either through Sphinx (when enabled in the module config) or through a
 * MySQL full-text / LIKE query on the Search table. Each hit is then
 * replaced by its full record from the model's own table, the keyword
 * statistics are updated, optional related searches are loaded and the
 * "search" template is rendered.
 *
 * Request parameters read: q, time (day|week|month|year), modelid, catid and
 * the page parameter named by C("VAR_PAGE").
 */
public function index()
{
    C('TOKEN_ON', false);
    $seo = seo();
    $this->assign("seo", $seo);

    if (!isset($_GET['q'])) {
        $this->display();
        return;
    }

    G('search');

    // Keyword
    $q = Input::forSearch(safe_replace($this->_get("q")));
    $q = htmlspecialchars(strip_tags($q));
    // Time range
    $time = $this->_get("time");
    // Model
    $mid = (int) $this->_get("modelid");
    // Category
    $catid = (int) $this->_get("catid");
    // Sort order
    $order = array("adddate" => "DESC", "searchid" => "DESC");
    // Search history
    $shistory = cookie("shistory");
    if (!$shistory) {
        $shistory = array();
    }
    $model = F("Model");
    $category = F("Category");

    if (trim($_GET['q']) == '') {
        header('Location: ' . U("Search/Index/index"));
        exit;
    }

    // Add the keyword to the history (10 most recent distinct entries).
    array_unshift($shistory, $q);
    $shistory = array_slice(array_unique($shistory), 0, 10);
    cookie("shistory", $shistory);

    $where = array();
    // Rows per page
    $pagesize = $this->config['pagesize'] ? $this->config['pagesize'] : 10;
    // Cache lifetime
    $cachetime = (int) $this->config['cachetime'];

    // Time filter: length of each supported window in seconds.
    $timeWindows = array(
        'day' => 86400,
        'week' => 604800,
        'month' => 2592000,
        'year' => 31536000,
    );
    $hasTimeFilter = is_string($time) && isset($timeWindows[$time]);
    if ($hasTimeFilter) {
        $search_time = time() - $timeWindows[$time];
        $where['adddate'] = array("GT", $search_time);
    } else {
        $search_time = 0;
    }

    // Available data sources
    $this->config['modelid'] = $this->config['modelid'] ? $this->config['modelid'] : array();

    // Model filter. The comparison stays loose on purpose: the configured ids
    // may be stored as strings.
    $filterByModel = $mid && in_array($mid, $this->config['modelid']);
    if ($filterByModel) {
        $where['modelid'] = array("EQ", (int) $mid);
    }
    // Category filter: multiple categories and parent categories are not supported.
    if ($catid) {
        $where['catid'] = array("EQ", (int) $catid);
    }

    // Pager template
    $TP = '共有{recordcount}条信息 {pageindex}/{pagecount} {first}{prev}{liststart}{list}{listend}{next}{last}';

    // Defaults, so that both search back ends leave these defined for the
    // shared code further down.
    $segment_q = '';
    $words = array();
    $result = array();
    $count = 0;

    if ($this->config['sphinxenable']) {
        // Sphinx search
        import("Sphinxapi", APP_PATH . C("APP_GROUP_PATH") . '/Search/Class/');
        $sphinxhost = $this->config['sphinxhost'];
        $sphinxport = $this->config['sphinxport'];
        $cl = new SphinxClient();
        // searchd host name and TCP port
        $cl->SetServer($sphinxhost, $sphinxport);
        // Connection timeout
        $cl->SetConnectTimeout(1);
        // Return matches as a plain list
        $cl->SetArrayResult(true);
        // Full-text match mode, see http://docs.php.net/manual/zh/sphinxclient.setmatchmode.php
        $cl->SetMatchMode(SPH_MATCH_EXTENDED2);
        // Ranking mode, see http://docs.php.net/manual/zh/sphinxclient.setrankingmode.php
        $cl->SetRankingMode(SPH_RANK_PROXIMITY_BM25);
        // SQL-like sort clause; here: by weight, best first
        $cl->SetSortMode(SPH_SORT_EXTENDED, "@weight desc");

        // Result window
        $page = (int) $this->_get(C("VAR_PAGE"));
        $page = $page < 1 ? 1 : $page;
        $offset = $pagesize * ($page - 1);
        $cl->SetLimits($offset, $pagesize, $pagesize > 1000 ? $pagesize : 1000);

        if ($hasTimeFilter) {
            // Time filter
            $cl->SetFilterRange('adddate', $search_time, time(), false);
        }
        // SetFilter() takes an ARRAY of values; the scalar passed before is
        // not a valid argument, so the filters were not applied as intended.
        if ($filterByModel) {
            // Model filter
            $cl->SetFilter('modelid', array((int) $mid));
        }
        if ($catid) {
            // Category filter
            $cl->SetFilter('catid', array((int) $catid));
        }

        // Run the search, see http://docs.php.net/manual/zh/sphinxclient.query.php
        // Query() returns false on failure; handle that as "no results".
        $res = $cl->Query($q, "*");
        if (!is_array($res)) {
            $res = array();
        }

        // Total number of hits
        $count = isset($res['total']) ? $res['total'] : 0;

        // Reshape the matches into the row format used by the MySQL search.
        $result_sphinx = !empty($res['matches']) ? $res['matches'] : array();
        foreach ($result_sphinx as $k => $v) {
            $result[$k] = array(
                "searchid" => $v['id'],
                "adddate" => $v['attrs']['adddate'],
                "catid" => $v['attrs']['catid'],
                "id" => $v['attrs']['id'],
                "modelid" => $v['attrs']['modelid'],
            );
        }

        // Keywords as Sphinx tokenised them
        if (!empty($res['words']) && is_array($res['words'])) {
            $words = array_keys($res['words']);
        }

        $page = page($count, $pagesize);
        $page->SetPager('default', $TP, array("listlong" => "6", "first" => "首页", "last" => "尾页", "prev" => "上一页", "next" => "下一页", "list" => "*", "disabledclass" => ""));
        $this->assign("Page", $page->show('default'));
    } else {
        // MySQL search
        import("Segment", APP_PATH . C("APP_GROUP_PATH") . '/Search/Class/');
        $Segment = new Segment();
        // Word segmentation result
        $segment_q = $Segment->get_keyword($Segment->split_result($q));
        $words = explode(" ", $segment_q);
        if (!empty($segment_q)) {
            $where['_string'] = " MATCH (`data`) AGAINST ('{$segment_q}' IN BOOLEAN MODE) ";
        } else {
            // Fallback: plain LIKE, the weakest kind of search
            $where['data'] = array('like', "%{$q}%");
        }

        if ($cachetime) {
            // Cached count and result page
            $count = M("Search")->cache(true, $cachetime)->where($where)->count();
            $page = page($count, $pagesize);
            $result = M("Search")->cache(true, $cachetime)->where($where)->limit($page->firstRow . ',' . $page->listRows)->order($order)->select();
        } else {
            $count = M("Search")->where($where)->count();
            // NOTE(review): this path uses $this->page() while the others call
            // the global page() helper - kept as found, confirm it is intended.
            $page = $this->page($count, $pagesize);
            $result = M("Search")->where($where)->limit($page->firstRow . ',' . $page->listRows)->order($order)->select();
        }
        $page->SetPager('default', $TP, array("listlong" => "6", "first" => "首页", "last" => "尾页", "prev" => "上一页", "next" => "下一页", "list" => "*", "disabledclass" => ""));
        $this->assign("Page", $page->show('default'));
    }

    // Replace every hit by the full record from its model table.
    if ($result && is_array($result)) {
        foreach ($result as $k => $r) {
            $modelid = $r['modelid'];
            $id = $r['id'];
            $tablename = ucwords($model[$modelid]['tablename']);
            if ($tablename) {
                $result[$k] = M($tablename)->where(array("id" => $id))->find();
            }
        }
    }

    // Keyword statistics (only for keywords of 2 to 16 bytes that found something)
    if (strlen($q) < 17 && strlen($q) > 1 && $result) {
        $res = M("SearchKeyword")->where(array('keyword' => $q))->find();
        if ($res) {
            // Known keyword: increment its search counter
            M("SearchKeyword")->where(array('keyword' => $q))->setInc("searchnums");
        } else {
            // New keyword: store it together with its pinyin form
            load("@.iconvfunc");
            $pinyin = gbk_to_pinyin(iconv('utf-8', 'gbk//IGNORE', $q));
            if (is_array($pinyin)) {
                $pinyin = implode('', $pinyin);
            }
            M("SearchKeyword")->add(array('keyword' => $q, 'searchnums' => 1, 'data' => $segment_q, 'pinyin' => $pinyin));
        }
    }

    // Related searches
    if ($this->config['relationenble']) {
        $map = array();
        if (!empty($segment_q)) {
            $relation_q = str_replace(' ', '%', $segment_q);
        } else {
            $relation_q = $q;
        }
        $map['_string'] = " MATCH (`data`) AGAINST ('%{$relation_q}%' IN BOOLEAN MODE) ";
        $relation = M("SearchKeyword")->where($map)->select();
        $this->assign("relation", $relation);
    }

    // Data sources offered in the UI; stays an empty list when none are configured.
    $source = array();
    foreach ($this->config['modelid'] as $modelid) {
        $source[$modelid] = array("name" => $model[$modelid]['name'], "modelid" => $modelid);
    }

    // Search results
    $this->assign("result", $result);
    // Elapsed time
    $search_time = G('search', 'end', 6);
    $this->assign("count", $count ? $count : 0);
    $this->assign("search_time", $search_time);
    $this->assign("keyword", $q);
    $this->assign("category", $category);
    $this->assign("source", $source);
    $this->assign("time", $time);
    $this->assign("modelid", $mid);
    $this->assign("shistory", $shistory);
    // Keywords after segmentation
    $this->assign("words", $words);
    $this->display("search");
}
/**
 * Re-matches one subject against the Sphinx index and stores the matching
 * posts in the per-client tables of the "thothconnect" database.
 *
 * Flow:
 *  1. Skip when the subject's matching_status is "matching".
 *  2. Look up the subject's client_id; optionally delete the rows already
 *     stored for this subject in website_c<client>, twitter_c<client> and
 *     facebook_c<client>.
 *  3. Run the subject's stored query through Sphinx.
 *  4. For every match whose post date lies inside [$from, $to], insert a row
 *     into the table that corresponds to the post type.
 *  5. Flag the subject as "update" and record the matched date range.
 *
 * Progress and errors are reported with echo.
 *
 * @param mixed  $subject_id   Id of the row in the `subject` table.
 * @param bool   $clean        When true, existing match rows of the subject are deleted first.
 * @param int    $query_offset Offset added to the limit in the "more results than fetched" check.
 * @param string $from         Start of the date range; parsed with strtotime().
 * @param string $to           End of the date range; parsed with strtotime().
 *
 * @return false|null False when the run is skipped (subject is already matching
 *                    or does not exist); no explicit value otherwise.
 */
public function run($subject_id, $clean = true, $query_offset = 0, $from, $to)
{
    $this->load->helper('sphinxapi');
    $this->load->helper('mood');

    // Skip when the subject is flagged as "matching".
    // NOTE(review): nothing in this method sets that flag; the update that did so was disabled.
    $matching_status = $this->custom_model->get_value('subject', 'matching_status', $subject_id);
    if ($matching_status == 'matching') {
        echo "subject is matching";
        return false;
    }

    // Second database connection that holds the per-client result tables.
    // NOTE(review): host and credentials are hard-coded here; consider moving them to configuration.
    $config = array(
        'hostname' => "192.168.1.102",
        'username' => "******",
        'password' => "******",
        'database' => "thothconnect",
        'dbdriver' => "mysql",
        'dbprefix' => "",
        'pconnect' => FALSE,
        'db_debug' => TRUE,
        'cache_on' => FALSE,
        'cachedir' => "",
        'char_set' => "utf8",
        'dbcollat' => "utf8_general_ci",
    );
    $thothconnect_db = $this->load->database($config, true);

    // Use a bound parameter instead of concatenating $subject_id into the SQL text.
    $subject_result = $this->db->query("SELECT client_id FROM subject WHERE id = ?", array($subject_id));
    $subject_row = $subject_result->row();
    if (empty($subject_row)) {
        // Without a client_id the table names below cannot be built; stop before deleting anything.
        echo "subject not found";
        return false;
    }
    $client_id = $subject_row->client_id;

    // Clear all match records previously stored for this subject.
    if ($clean) {
        $thothconnect_db->delete('website_c' . $client_id, array('subject_id' => $subject_id));
        $thothconnect_db->delete('twitter_c' . $client_id, array('subject_id' => $subject_id));
        $thothconnect_db->delete('facebook_c' . $client_id, array('subject_id' => $subject_id));
    }

    //
    // Begin re-matching this subject.
    //

    // The search string is stored on the subject row.
    $q = $this->custom_model->get_value('subject', 'query', $subject_id);

    // Sphinx settings.
    $cl = new SphinxClient();
    $mode = SPH_MATCH_EXTENDED;
    $host = "192.168.1.102";
    $port = 9312;
    $index = "*";
    $distinct = "";
    $sortby = "@id ASC";
    $offset = $query_offset;
    $limit = 1000000;
    $ranker = SPH_RANK_PROXIMITY_BM25;
    $select = "";

    echo 'limit=' . $limit . ' offset=' . $offset . PHP_EOL;

    // Extract the subject keywords from the search string (passed to get_mood() below).
    $keywords = get_keywords($q);

    ////////////
    // do query
    ////////////
    $cl->SetServer($host, $port);
    $cl->SetConnectTimeout(1);
    $cl->SetArrayResult(true);
    $cl->SetWeights(array(100, 1));
    $cl->SetMatchMode($mode);
    if ($sortby) {
        $cl->SetSortMode(SPH_SORT_EXTENDED, $sortby);
    }
    if ($distinct) {
        $cl->SetGroupDistinct($distinct);
    }
    if ($select) {
        $cl->SetSelect($select);
    }
    if ($limit) {
        // NOTE(review): the result window always starts at 0; $offset only takes part in the
        // "more results than fetched" check further down.
        $cl->SetLimits(0, $limit, $limit > 1000000 ? $limit : 1000000);
    }
    $cl->SetRankingMode($ranker);
    $res = $cl->Query($q, $index);

    // Keep the raw $from/$to untouched so they can be handed to a recursive call;
    // the parsed timestamps are used for filtering and for the final status update.
    $from_ts = strtotime($from);
    $to_ts = strtotime($to);

    ////////////
    // do Insert to DB
    ////////////
    if ($res === false) {
        echo "Query failed: " . $cl->GetLastError() . ".\n";
    } else {
        if ($cl->GetLastWarning()) {
            echo "WARNING: " . $cl->GetLastWarning() . "\n\n";
        }
        echo "Query '{$q}' \nretrieved {$res['total']} of {$res['total_found']} matches in {$res['time']} sec.\n";

        if ($res['total'] == 0) {
            echo "no result<br/>\n";
        } elseif ($res['total'] > $limit + $offset) {
            // Re-run with a larger offset. Arguments are passed in their declared positions:
            // the offset goes to $query_offset (not $clean) and the original date range is
            // forwarded. $clean is false because the rows were already cleared above.
            $this->run($subject_id, false, $limit + $offset, $from, $to);
        } else {
            echo "Updating...";
            foreach ($res["matches"] as $docinfo) {
                // Reset the PHP timeout to one minute for every processed match.
                set_time_limit(60);

                $post = new Post_model();
                $post->init($docinfo["id"]);

                // Skip posts whose date is outside the requested range.
                $post_date = strtotime($post->post_date);
                if ($post_date < $from_ts || $post_date > $to_ts) {
                    continue;
                }

                $mood = get_mood($post->body, $keywords);
                $subject = $post->get_subject($subject_id);

                if ($post->type == "post" || $post->type == "comment") {
                    // Website posts and comments go to website_c<client>.
                    $postData = $post->get_post_website($post->id);
                    if ($postData != null) {
                        $data = array(
                            "post_id" => $postData->post_id,
                            "post_date" => $postData->post_date,
                            "title" => $postData->title,
                            "body" => $postData->body,
                            "type" => $postData->type,
                            "author_id" => $postData->author_id,
                            "author" => $postData->author,
                            "website_id" => $postData->website_id,
                            "website_name" => $postData->website_name,
                            "website_cate_id" => $postData->website_cate_id,
                            "website_cate" => $postData->website_cate,
                            "website_type_id" => $postData->website_type_id,
                            "website_type" => $postData->website_type,
                            "group_id" => $subject->group_id,
                            "group" => $subject->group,
                            // The last character of root_url is dropped before the post url is appended.
                            "url" => substr($postData->root_url, 0, -1) . "" . $postData->url,
                            "page_id" => $postData->page_id,
                            "subject_id" => $subject->subject_id,
                            "subject_name" => $subject->subject_name,
                            "mood" => $mood,
                            "mood_by" => 'system',
                        );
                        $thothconnect_db->insert("website_c" . $subject->client_id, $data);
                        $post->insert_post_comment($postData->page_id, $subject->client_id, $thothconnect_db);
                    }
                } elseif ($post->type == "tweet" || $post->type == "retweet") {
                    // Tweets and retweets go to twitter_c<client>.
                    $postData = $post->get_post_twitter($post->id);
                    if ($postData != null) {
                        $data = array(
                            "post_id" => $postData->post_id,
                            "post_date" => $postData->post_date,
                            "body" => $postData->body,
                            "type" => $postData->type,
                            "author_id" => $postData->author_id,
                            "author" => $postData->author,
                            "group_id" => $subject->group_id,
                            "group" => $subject->group,
                            "tweet_id" => $postData->tweet_id,
                            "subject_id" => $subject->subject_id,
                            "subject_name" => $subject->subject_name,
                            "mood" => $mood,
                            "mood_by" => 'system',
                        );
                        $thothconnect_db->insert("twitter_c" . $subject->client_id, $data);
                    }
                } elseif ($post->type == "fb_post" || $post->type == "fb_comment") {
                    // Facebook posts and comments go to facebook_c<client>.
                    $postData = $post->get_post_facebook($post->id);
                    if ($postData != null) {
                        $data = array(
                            "post_id" => $postData->post_id,
                            "post_date" => $postData->post_date,
                            "body" => $postData->body,
                            "type" => $postData->type,
                            "author_id" => $postData->author_id,
                            "author" => $postData->author,
                            "group_id" => $subject->group_id,
                            "group" => $subject->group,
                            "facebook_page_id" => $postData->facebook_page_id,
                            "facebook_page_name" => $postData->facebook_page_name,
                            "subject_id" => $subject->subject_id,
                            "subject_name" => $subject->subject_name,
                            "facebook_id" => $postData->facebook_id,
                            "parent_post_id" => $postData->parent_post_id,
                            "likes" => $postData->likes,
                            "shares" => $postData->shares,
                            "mood" => $mood,
                            "mood_by" => 'system',
                        );
                        $thothconnect_db->insert("facebook_c" . $subject->client_id, $data);
                    }
                }
            }
        }
    }

    // Flag the subject as updated and record the date range that was matched.
    $data = array(
        'matching_status' => 'update',
        'latest_matching' => mdate('%Y-%m-%d %H:%i:%s', time()),
        'from' => mdate('%Y-%m-%d %H:%i:%s', $from_ts),
        'to' => mdate('%Y-%m-%d %H:%i:%s', $to_ts),
    );
    $this->db->update('subject', $data, array('id' => $subject_id));
}