/**
 * Site search action.
 *
 * Runs the (possibly refined) query against the aPage Lucene index, drops hits
 * that are unpublished, not viewable by the current user, or not routable,
 * merges in any extra results supplied by searchAddResults(), paginates, and
 * finally decorates the current page of results with slug, title, summary,
 * url, class and (when an engine search helper exists) partial.
 *
 * Sets $this->pager, $this->pagerUrl and $this->results for the template.
 *
 * @param sfWebRequest $request Reads the 'q', 'page' and 'x' parameters
 * @return mixed The result of redirect() when an 'x' parameter is present;
 *               otherwise nothing is returned explicitly
 */
public function executeSearch(sfWebRequest $request)
{
  // Timestamp in the same YmdHis form that is compared against the indexed published_at field
  $now = date('YmdHis');
  $q = $request->getParameter('q');

  if ($request->hasParameter('x'))
  {
    // input type="image" submit buttons add x/y click coordinates to the query
    // string; redirect to a clean URL that carries only the query itself
    $cleanUrl = sfContext::getInstance()->getController()->genUrl('a/search', true);
    return $this->redirect($cleanUrl . '?' . http_build_query(array("q" => $q)));
  }

  // Normalize the query (lowercase, trimmed, whitespace runs collapsed) and see
  // whether the app configuration supplies a refined replacement for it
  $normalized = preg_replace('/\\s+/', ' ', strtolower(trim($q)));
  $refinements = sfConfig::get('app_a_search_refinements', array());
  if (isset($refinements[$normalized]))
  {
    $q = $refinements[$normalized];
  }

  try
  {
    $hits = aZendSearch::searchLuceneWithValues(Doctrine::getTable('aPage'), $q, aTools::getUserCulture());
  }
  catch (Exception $e)
  {
    // Lucene search error: for now, show no results rather than crash
    $hits = array();
  }

  // Zend cannot do all of the filtering (permissions in particular), so the
  // remaining cuts are made here. Only $hit->id is touched on the hit itself;
  // every other field is read from the index document so the hit does not hold
  // on to lazy loaded columns (http://zendframework.com/issues/browse/ZF-8267)
  $index = Doctrine::getTable('aPage')->getLuceneIndex();
  $visibleHits = array();
  foreach ($hits as $hit)
  {
    $document = $index->getDocument($hit->id);

    $publishedAt = $document->getFieldValue('published_at');
    if ($publishedAt > $now)
    {
      // Not published yet
      continue;
    }

    // 1.5: stored copies of columns live under *_stored names to avoid
    // conflicting with the indexed versions of the same columns
    $info = unserialize($document->getFieldValue('info_stored'));
    if (!aPageTable::checkPrivilege('view', $info))
    {
      continue;
    }

    // Keep only named routes ("@...") and slugs that contain a slash; any other
    // virtual page slug is not meant to appear in search results
    $slug = $document->getFieldValue('slug_stored');
    $routable = (substr($slug, 0, 1) === '@') || (strpos($slug, '/') !== false);
    if ($routable)
    {
      $visibleHits[] = $hit;
    }
  }
  $hits = $visibleHits;

  if ($this->searchAddResults($hits, $q))
  {
    // Extra results are plain stdClass objects (e.g. with url, title, score,
    // summary and class set). Older searchAddResults implementations do not
    // supply the *_stored names, so fill those in for backwards compatibility
    foreach ($hits as $extra)
    {
      if (get_class($extra) !== 'stdClass')
      {
        continue;
      }
      if (!isset($extra->slug_stored))
      {
        $extra->slug_stored = isset($extra->slug) ? $extra->slug : null;
      }
      if (!isset($extra->title_stored))
      {
        $extra->title_stored = $extra->title;
      }
      if (!isset($extra->summary_stored))
      {
        $extra->summary_stored = $extra->summary;
      }
      if (!isset($extra->engine_stored))
      {
        $extra->engine_stored = isset($extra->engine) ? $extra->engine : null;
      }
    }
    usort($hits, "aActions::compareScores");
  }

  $pager = new aArrayPager(null, sfConfig::get('app_a_search_results_per_page', 10));
  $this->pager = $pager;
  $pager->setResultArray($hits);
  $pager->setPage($request->getParameter('page', 1));
  $pager->init();
  $this->pagerUrl = "a/search?" . http_build_query(array("q" => $q));

  // setTitle takes care of escaping things
  $response = $this->getResponse();
  $response->setTitle(aTools::getOptionI18n('title_prefix') . 'Search for ' . $q . aTools::getOptionI18n('title_suffix'));

  // Only the current page of results remains, so it is now acceptable to use
  // the lazy loaded Lucene fields for the last mile
  $decorated = array();
  foreach ($pager->getResults() as $item)
  {
    $item->slug = $item->slug_stored;
    $item->title = $item->title_stored;
    $item->summary = $item->summary_stored;

    if (strlen($item->engine_stored))
    {
      // An engine may provide "<engine>SearchHelper" to supply its own partial
      $helperClass = $item->engine_stored . 'SearchHelper';
      if (class_exists($helperClass))
      {
        $searchHelper = new $helperClass();
        $item->partial = $searchHelper->getPartial();
      }
    }

    if (!isset($item->url))
    {
      $slug = $item->slug;
      $slashAt = strpos($slug, '/');
      if (substr($slug, 0, 1) !== '@' && $slashAt === false)
      {
        // A virtual page (such as global) that is not interested in being part
        // of search results
        continue;
      }
      if ($slashAt === 0)
      {
        // A normal CMS page
        $item->url = aTools::urlForPage($slug);
      }
      else
      {
        // Either a named Symfony route ("@...") or a virtual page slug that is
        // a valid Symfony route, such as foo/bar?id=55
        $item->url = $this->getController()->genUrl($slug, true);
      }
    }

    $item->class = 'aPage';
    $decorated[] = $item;
  }
  $this->results = $decorated;
}
/**
 * Checks a privilege against this object by delegating to
 * aPageTable::checkPrivilege(), passing $this as the subject of the check.
 *
 * @param mixed $privilege The privilege to check; passed through unchanged
 * @param mixed $user Passed through unchanged; defaults to false
 *                    (presumably meaning "the current user" - confirm against aPageTable::checkPrivilege)
 * @return mixed Whatever aPageTable::checkPrivilege() returns
 */
public function userHasPrivilege($privilege, $user = false)
{
  $verdict = aPageTable::checkPrivilege($privilege, $this, $user);

  return $verdict;
}
/**
 * Site search action.
 *
 * Runs the (possibly refined) query against the aPage Lucene index, drops hits
 * the current user may not view or that have no routable slug, gives each
 * remaining hit a url and class, merges in any extra results supplied by
 * searchAddResults(), and paginates.
 *
 * Sets $this->pager, $this->pagerUrl and $this->results for the template.
 *
 * @param sfWebRequest $request Reads the 'q', 'page' and 'x' parameters
 * @return mixed The result of redirect() when an 'x' parameter is present;
 *               otherwise nothing is returned explicitly
 */
public function executeSearch(sfWebRequest $request)
{
  // create the array of pages matching the query
  $q = $request->getParameter('q');

  if ($request->hasParameter('x'))
  {
    // We like to use input type="image" for presentation reasons, but it generates
    // ugly x and y parameters with click coordinates. Get rid of those and come back.
    return $this->redirect(sfContext::getInstance()->getController()->genUrl('a/search', true) . '?' . http_build_query(array("q" => $q)));
  }

  // Normalize the query (lowercase, trimmed, whitespace runs collapsed) and see
  // whether the app configuration supplies a refined replacement for it
  $key = strtolower(trim($q));
  $key = preg_replace('/\\s+/', ' ', $key);
  $replacements = sfConfig::get('app_a_search_refinements', array());
  if (isset($replacements[$key]))
  {
    $q = $replacements[$key];
  }

  try
  {
    $values = aZendSearch::searchLuceneWithValues(Doctrine::getTable('aPage'), $q, aTools::getUserCulture());
  }
  catch (Exception $e)
  {
    // Lucene search error, typically a query the parser rejects. The query is
    // typed by the visitor, so show no results rather than crash the action.
    $values = array();
  }

  $nvalues = array();
  foreach ($values as $value)
  {
    // The hit object doesn't implement isset, so test the length instead
    if (strlen($value->info))
    {
      $info = unserialize($value->info);
      if (!aPageTable::checkPrivilege('view', $info))
      {
        continue;
      }
    }

    $nvalue = $value;
    if (substr($nvalue->slug, 0, 1) === '@')
    {
      // Virtual page slug is a named Symfony route, it wants search results to go there
      $nvalue->url = $this->getController()->genUrl($nvalue->slug, true);
    }
    else
    {
      $slash = strpos($nvalue->slug, '/');
      if ($slash === false)
      {
        // A virtual page (such as global) that isn't the least bit interested in
        // being part of search results
        continue;
      }
      if ($slash > 0)
      {
        // A virtual page slug which is a valid Symfony route, such as foo/bar?id=55
        $nvalue->url = $this->getController()->genUrl($nvalue->slug, true);
      }
      else
      {
        // A normal CMS page
        $nvalue->url = aTools::urlForPage($nvalue->slug);
      }
    }
    $nvalue->class = 'aPage';
    $nvalues[] = $nvalue;
  }
  $values = $nvalues;

  // Re-sort by score only when searchAddResults() reports that it added something
  if ($this->searchAddResults($values, $q))
  {
    usort($values, "aActions::compareScores");
  }

  $this->pager = new aArrayPager(null, sfConfig::get('app_a_search_results_per_page', 10));
  $this->pager->setResultArray($values);
  $this->pager->setPage($request->getParameter('page', 1));
  $this->pager->init();
  $this->pagerUrl = "a/search?" . http_build_query(array("q" => $q));

  // setTitle takes care of escaping things
  $this->getResponse()->setTitle(aTools::getOptionI18n('title_prefix') . 'Search for ' . $q . aTools::getOptionI18n('title_suffix'));
  $this->results = $this->pager->getResults();
}
/**
 * Filters the virtual pages, tags and categories associated with a particular
 * engine based on criteria such as tag, category, publication date, etc.
 *
 * Strategy: run an optional Lucene query, then direct SQL queries that share a
 * common FROM/JOIN/WHERE prefix, to obtain the relevant categories, tags and
 * page ids. The result is sufficient to populate a filters sidebar with the
 * options that are still relevant given the other criteria in effect, and to
 * fetch the result pages (typically with a LIMIT and an IN query over the
 * first n ids returned here).
 *
 * All options are optional; an unspecified or empty option places no
 * restriction on that basis. 'categoryIds' limits to the categories associated
 * with the engine page, while 'categorySlug' limits to a category chosen by
 * the user as a filter:
 *
 *   array(
 *     'q' => 'gromit',                        # Lucene search
 *     'categoryIds' => array(1, 3, 5),
 *     'categorySlug' => 'cheese',
 *     'tag' => 'wensleydale',
 *     'slugStem' => '@a_event_search_redirect',
 *     'year' => 2010,                         # if present only 2010 is shown
 *     'month' => 12,                          # if present only Dec. 2010 is shown
 *     'day' => 15,                            # if present only Dec. 15th 2010 is shown
 *     'byEventDateRange' => true,             # events only, joins with a_blog_item to get the range
 *     'byPublishedAt' => true,                # for blog posts or pages
 *     'alphaSort' => true,                    # order pages by their title slot value
 *     'culture' => 'en'                       # used with alphaSort; defaults to aTools::getUserCulture()
 *   )
 *
 * @param array $options See above
 * @return array With keys 'categoriesInfo' (distinct c.slug / c.name rows),
 *               'tagsByName' and 'tagsByPopularity' (t.name / t_count rows, the
 *               latter limited to 10) and 'pageIds' (result of queryScalar over
 *               distinct p.id, in display order)
 */
public static function filterForEngine($options)
{
  $alphaSort = isset($options['alphaSort']) && $options['alphaSort'];

  if (isset($options['q']) && strlen($options['q']))
  {
    $q = $options['q'];

    // Normalize the query and apply any configured refinement for it
    $key = strtolower(trim($q));
    $key = preg_replace('/\\s+/', ' ', $key);
    $replacements = sfConfig::get('app_a_search_refinements', array());
    if (isset($replacements[$key]))
    {
      $q = $replacements[$key];
    }

    if (isset($options['slugStem']))
    {
      $q = "({$q}) AND slug:" . $options['slugStem'];
    }

    try
    {
      $values = aZendSearch::searchLuceneWithValues(Doctrine::getTable('aPage'), $q, aTools::getUserCulture());
    }
    catch (Exception $e)
    {
      // Lucene search error. TODO: display it nicely if they are always safe
      // things to display. For now: just don't crash
      $values = array();
    }

    $now = date('YmdHis');

    // Deliberately defined only when a Lucene search ran: the SQL below uses
    // isset($pageIds) to tell "no search" apart from "search matched nothing"
    $pageIds = array();
    foreach ($values as $value)
    {
      // Regardless of the above if it ain't published yet we can't see it.
      // We filter on that in the SQL too but take advantage of this chance to
      // preempt a little work
      if ($value->published_at > $now)
      {
        continue;
      }
      // 1.5: the names under which we store columns in Zend Lucene have changed
      // to avoid conflict with also indexing them
      $info = unserialize($value->info_stored);
      if (!aPageTable::checkPrivilege('view', $info))
      {
        continue;
      }
      $pageIds[] = $info['id'];
    }
  }

  $mysql = new aMysql();

  // The WHERE clause below always references :slug_pattern, so always bind it.
  // Without a slugStem the pattern is just '%', which places no restriction on
  // the slug, as the options contract promises.
  $params = array();
  $params['slug_pattern'] = (isset($options['slugStem']) ? $options['slugStem'] : '') . '%';

  // Select the relevant virtual pages for this engine. From here on $q is the
  // shared SQL fragment (FROM / JOINs / WHERE), no longer the Lucene query
  $q = 'from a_page p ';

  // If alpha sort is present we need title slots
  if ($alphaSort)
  {
    if (!isset($options['culture']))
    {
      $options['culture'] = aTools::getUserCulture();
    }
    $culture = $options['culture'];
    $q .= "\n LEFT JOIN a_area a ON a.page_id = p.id AND a.name = 'title' AND a.culture = :culture\n LEFT JOIN a_area_version v ON v.area_id = a.id AND a.latest_version = v.version \n LEFT JOIN a_area_version_slot avs ON avs.area_version_id = v.id\n LEFT JOIN a_slot s ON s.id = avs.slot_id ";
    $params['culture'] = $culture;
  }

  // Merge in categories. A left join unless we are restricted to certain categories
  $hasCategoryIds = isset($options['categoryIds']) && count($options['categoryIds']);
  $hasCategorySlug = isset($options['categorySlug']) && strlen($options['categorySlug']);
  $restrictedByCategory = $hasCategoryIds || $hasCategorySlug;
  if ($restrictedByCategory)
  {
    $cjoin = 'inner join';
  }
  else
  {
    $cjoin = 'left join';
  }
  $q .= $cjoin . ' a_page_to_category ptc on ptc.page_id = p.id ' . $cjoin . ' a_category c on ptc.category_id = c.id ';

  // The engine page is locked down to these categories. If none are specified
  // it is not locked down by category
  if ($hasCategoryIds)
  {
    $q .= "and c.id in :category_ids ";
    $params['category_ids'] = $options['categoryIds'];
  }

  // Bring in tags...
  $hasTag = isset($options['tag']) && strlen($options['tag']);
  if ($hasTag)
  {
    $q .= 'inner join ';
  }
  else
  {
    $q .= 'left join ';
  }
  $q .= 'tagging ti on ti.taggable_id = p.id and ti.taggable_model = "aPage" left join tag t on ti.tag_id = t.id ';

  // Get ready to filter posts or events chronologically. The date parts are
  // kept as zero-padded strings because they are spliced into date literals
  $year = sprintf("%04d", isset($options['year']) ? $options['year'] : 0);
  $month = sprintf("%02d", isset($options['month']) ? $options['month'] : 0);
  $day = sprintf("%02d", isset($options['day']) ? $options['day'] : 0);
  $startYear = $year;
  $endYear = $year;
  if ($year > 0)
  {
    if ($month == 0)
    {
      // Whole year. Do not mess up the two digit strings please
      $startMonth = '01';
      $startDay = '01';
      $endMonth = '12';
      $endDay = '31';
    }
    else
    {
      $startMonth = $month;
      $endMonth = $month;
      if ($day == 0)
      {
        // Whole month. Do not mess up the two digit strings please.
        // NOTE(review): the end day is '31' even for shorter months - confirm
        // the database tolerates such a date literal in comparisons
        $startDay = '01';
        $endDay = '31';
      }
      else
      {
        $startDay = $day;
        $endDay = $day;
      }
    }
  }
  else
  {
    // For posts "today and forward" is not a relevant concept (and a separate
    // clause already makes sure we don't see unpublished stuff). For events
    // we'll override the start date below
    $startYear = '0000';
    $startMonth = '01';
    $startDay = '01';
    $endYear = '9999';
    $endMonth = '12';
    $endDay = '31';
  }

  $events = isset($options['byEventDateRange']) && $options['byEventDateRange'];
  if ($events && $startYear === '0000')
  {
    // No explicit date filter: events are shown from today forward
    list($startYear, $startMonth, $startDay) = explode('-', date('Y-m-d'));
  }

  if ($events)
  {
    // The event's start and end dates are part of the blog item table
    $q .= ' inner join a_blog_item bi on bi.page_id = p.id ';
    $q .= "and bi.start_date <= :end_date ";
    $params['end_date'] = "{$endYear}-{$endMonth}-{$endDay}";
    $q .= "and bi.end_date >= :start_date ";
    $params['start_date'] = "{$startYear}-{$startMonth}-{$startDay}";
  }

  // Criteria for the pages themselves
  $q .= 'where p.slug like :slug_pattern ';

  // We often filter posts (not events) by a range of publication dates
  if (isset($options['byPublishedAt']) && $options['byPublishedAt'])
  {
    // NOTE(review): if published_at carries a time of day, a date-only end
    // bound may exclude items published later on the final day - confirm
    $q .= "and p.published_at <= :p_end_date ";
    $params['p_end_date'] = "{$endYear}-{$endMonth}-{$endDay}";
    $q .= "and p.published_at >= :p_start_date ";
    $params['p_start_date'] = "{$startYear}-{$startMonth}-{$startDay}";
  }

  // In no case do we show unpublished material
  $q .= 'and p.published_at <= NOW() and (p.archived IS NULL or p.archived IS FALSE) ';

  // ... But only those matching the Lucene search that already gave us specific IDs.
  // NOTE: if pageIds is set and is empty, NOTHING should be returned
  // (someone searched for something that doesn't appear in the system)
  if (isset($pageIds))
  {
    if (count($pageIds))
    {
      $q .= 'and p.id in :pageIds ';
      $params['pageIds'] = $pageIds;
    }
    else
    {
      $q .= 'and 0 <> 0 ';
    }
  }

  if ($alphaSort)
  {
    $pagesOrderBy = 's.value asc';
  }
  elseif ($events)
  {
    $pagesOrderBy = 'bi.start_date asc, bi.start_time asc';
  }
  else
  {
    // Blog presentation is typically descending, not ascending
    $pagesOrderBy = 'p.published_at desc';
  }

  // Separate queries (categories, tags, pages) built from the shared prefix
  $c_q = $q;
  $t_q = $q;
  $p_q = $q;

  // We are filtering by this specific category
  if ($hasCategorySlug)
  {
    // Limit tags and pages by this specific category, but don't limit
    // categories by it, otherwise we can't present a choice of categories
    // meeting the other criteria
    $t_q .= "and c.slug = :category_slug ";
    $p_q .= "and c.slug = :category_slug ";
    $params['category_slug'] = $options['categorySlug'];
  }

  if ($hasTag)
  {
    // Limit pages and categories by this specific tag, but don't limit
    // tags by it, otherwise we can't present a choice of tags
    // meeting the other criteria
    $p_q .= 'and t.name = :tag_name ';
    $c_q .= 'and t.name = :tag_name ';
    $params['tag_name'] = $options['tag'];
  }

  // In the cases where we are looking for categories or tags, be sure to
  // discard the null rows from the LEFT JOINs. This is simpler than
  // determining when to switch them to INNER JOINs. The same $params array is
  // handed to every query, including ones that do not use all of its entries
  $result = array(
    'categoriesInfo' => $mysql->query('select distinct c.slug, c.name ' . $c_q . 'and c.slug is not null order by c.name', $params),
    'tagsByName' => $mysql->query('select t.name, count(distinct p.id) as t_count ' . $t_q . 'and t.name is not null group by t.name order by t.name', $params),
    'tagsByPopularity' => $mysql->query('select t.name, count(distinct p.id) as t_count ' . $t_q . 'and t.name is not null group by t.name order by t_count desc limit 10', $params),
    'pageIds' => $mysql->queryScalar('select distinct p.id ' . $p_q . ' order by ' . $pagesOrderBy, $params)
  );

  return $result;
}