Esempio n. 1
0
 /**
  * Search action: runs the "q" request parameter against the Lucene index of
  * aPage, filters the hits and exposes one page of results to the view.
  *
  * Steps, in order:
  *  - a request carrying an "x" parameter (image-submit click coordinates) is
  *    redirected to a clean a/search URL that keeps only "q";
  *  - the normalized query is looked up in app_a_search_refinements and, when an
  *    entry exists, replaced by it;
  *  - hits whose published_at lies in the future, that fail the 'view' privilege
  *    check, or whose slug neither starts with "@" nor contains "/" are dropped;
  *  - searchAddResults() is given the list and the query (presumably it appends to
  *    the list by reference - confirm); when it returns true the list is normalized
  *    and re-sorted with aActions::compareScores;
  *  - the list is paginated and every result on the current page receives slug,
  *    title, summary, url, class and, when an "<engine>SearchHelper" class exists,
  *    partial.
  *
  * Sets $this->pager, $this->pagerUrl, $this->results and the response title.
  *
  * @param sfWebRequest $request reads the "q", "x" and "page" parameters
  * @return mixed the result of redirect() for image submits, otherwise nothing
  */
 public function executeSearch(sfWebRequest $request)
 {
     $now = date('YmdHis');
     // create the array of pages matching the query
     $q = $request->getParameter('q');
     if (is_array($q)) {
         // A request such as ?q[]=foo yields an array, which the string handling
         // below (trim, concatenation into the title) cannot accept
         $q = '';
     }
     if ($request->hasParameter('x')) {
         // We sometimes like to use input type="image" for presentation reasons, but it generates
         // ugly x and y parameters with click coordinates. Get rid of those and come back.
         return $this->redirect(sfContext::getInstance()->getController()->genUrl('a/search', true) . '?' . http_build_query(array("q" => $q)));
     }
     // Refinements are keyed by the lowercased query with whitespace runs collapsed
     $key = strtolower(trim($q));
     $key = preg_replace('/\\s+/', ' ', $key);
     $replacements = sfConfig::get('app_a_search_refinements', array());
     if (isset($replacements[$key])) {
         $q = $replacements[$key];
     }
     try {
         $values = aZendSearch::searchLuceneWithValues(Doctrine::getTable('aPage'), $q, aTools::getUserCulture());
     } catch (Exception $e) {
         // Lucene search error. TODO: display it nicely if they are always safe things to display. For now: just don't crash
         $values = array();
     }
     // The truth is that Zend cannot do all of our filtering for us, especially
     // permissions-based. So we can do some other filtering as well, although it
     // would be bad not to have Zend take care of the really big cuts (if 99% are
     // not being prefiltered by Zend, and we have a Zend max results of 1000, then
     // we are reduced to working with a maximum of 10 real results).
     $nvalues = array();
     $index = Doctrine::getTable('aPage')->getLuceneIndex();
     foreach ($values as $value) {
         // Don't touch anything but $value->id directly and you won't force a persistent
         // use of memory for the lazy loaded columns http://zendframework.com/issues/browse/ZF-8267
         $document = $index->getDocument($value->id);
         $published_at = $document->getFieldValue('published_at');
         if ($published_at > $now) {
             // Not published yet
             continue;
         }
         // 1.5: the names under which we store columns in Zend Lucene have changed to
         // avoid conflict with also indexing them
         $info = unserialize($document->getFieldValue('info_stored'));
         if (!aPageTable::checkPrivilege('view', $info)) {
             continue;
         }
         $slug = $document->getFieldValue('slug_stored');
         if (substr($slug, 0, 1) !== '@' && strpos($slug, '/') === false) {
             // A virtual page slug which is not a route is not interested in being part of search results
             continue;
         }
         $nvalues[] = $value;
     }
     $values = $nvalues;
     if ($this->searchAddResults($values, $q)) {
         foreach ($values as $value) {
             // Only plain stdClass results are normalized; isset() is not relied upon
             // for the Lucene hit objects
             if (get_class($value) === 'stdClass') {
                 // bc with existing implementations of searchAddResults, which set
                 // slug/title/summary/engine rather than the *_stored names. A field
                 // that is missing altogether becomes null instead of raising an
                 // undefined property notice.
                 foreach (array('slug', 'title', 'summary', 'engine') as $field) {
                     $storedField = $field . '_stored';
                     if (!isset($value->{$storedField})) {
                         $value->{$storedField} = isset($value->{$field}) ? $value->{$field} : null;
                     }
                 }
             }
         }
         // Shape of a result added by searchAddResults:
         // $value = new stdClass();
         // $value->url = $url;
         // $value->title = $title;
         // $value->score = $scores[$id];
         // $value->summary = $summary;
         // $value->class = 'Article';
         // $values[] = $value;
         usort($values, "aActions::compareScores");
     }
     $this->pager = new aArrayPager(null, sfConfig::get('app_a_search_results_per_page', 10));
     $this->pager->setResultArray($values);
     $this->pager->setPage($request->getParameter('page', 1));
     $this->pager->init();
     $this->pagerUrl = "a/search?" . http_build_query(array("q" => $q));
     // setTitle takes care of escaping things
     $this->getResponse()->setTitle(aTools::getOptionI18n('title_prefix') . 'Search for ' . $q . aTools::getOptionI18n('title_suffix'));
     $results = $this->pager->getResults();
     // Now that we have paginated and obtained the short list of results we really
     // care about it's OK to use the lazy load features of Lucene for the last mile
     $nresults = array();
     foreach ($results as $value) {
         $nvalue = $value;
         $nvalue->slug = $nvalue->slug_stored;
         $nvalue->title = $nvalue->title_stored;
         $nvalue->summary = $nvalue->summary_stored;
         if (strlen($nvalue->engine_stored)) {
             // An engine may supply its own partial through a "<engine>SearchHelper" class
             $helperClass = $nvalue->engine_stored . 'SearchHelper';
             if (class_exists($helperClass)) {
                 $searchHelper = new $helperClass();
                 $nvalue->partial = $searchHelper->getPartial();
             }
         }
         if (!isset($nvalue->url)) {
             if (substr($nvalue->slug, 0, 1) === '@') {
                 // Virtual page slug is a named Symfony route, it wants search results to go there
                 $nvalue->url = $this->getController()->genUrl($nvalue->slug, true);
             } else {
                 $slash = strpos($nvalue->slug, '/');
                 if ($slash === false) {
                     // A virtual page (such as global) that isn't the least bit interested in
                     // being part of search results
                     continue;
                 }
                 if ($slash > 0) {
                     // A virtual page slug which is a valid Symfony route, such as foo/bar?id=55
                     $nvalue->url = $this->getController()->genUrl($nvalue->slug, true);
                 } else {
                     // A normal CMS page
                     $nvalue->url = aTools::urlForPage($nvalue->slug);
                 }
             }
         }
         // Note: this overwrites any class set by searchAddResults
         $nvalue->class = 'aPage';
         $nresults[] = $nvalue;
     }
     $this->results = $nresults;
 }
Esempio n. 2
0
 /**
  * Checks a privilege for this object by delegating to
  * aPageTable::checkPrivilege(), passing $this as the subject of the check.
  *
  * @param mixed $privilege privilege identifier, handed through unchanged
  * @param mixed $user      handed through unchanged; the default false presumably
  *                         means "the current user" - confirm in checkPrivilege()
  * @return mixed whatever aPageTable::checkPrivilege() returns
  */
 public function userHasPrivilege($privilege, $user = false)
 {
     $granted = aPageTable::checkPrivilege($privilege, $this, $user);

     return $granted;
 }
 /**
  * Search action: runs the "q" request parameter against the Lucene index of
  * aPage, filters the hits, resolves a URL for each and exposes one page of
  * results to the view.
  *
  * A request carrying an "x" parameter (image-submit click coordinates) is
  * redirected to a clean a/search URL that keeps only "q". Hits that fail the
  * 'view' privilege check, or whose slug neither starts with "@" nor contains
  * "/", are dropped. searchAddResults() is then given the list and the query;
  * when it returns true the list is re-sorted with aActions::compareScores.
  *
  * Sets $this->pager, $this->pagerUrl, $this->results and the response title.
  *
  * @param sfWebRequest $request reads the "q", "x" and "page" parameters
  * @return mixed the result of redirect() for image submits, otherwise nothing
  */
 public function executeSearch(sfWebRequest $request)
 {
     // create the array of pages matching the query
     $q = $request->getParameter('q');
     if (is_array($q)) {
         // A request such as ?q[]=foo yields an array, which the string handling
         // below (trim, concatenation into the title) cannot accept
         $q = '';
     }
     if ($request->hasParameter('x')) {
         // We like to use input type="image" for presentation reasons, but it generates
         // ugly x and y parameters with click coordinates. Get rid of those and come back.
         return $this->redirect(sfContext::getInstance()->getController()->genUrl('a/search', true) . '?' . http_build_query(array("q" => $q)));
     }
     // Refinements are keyed by the lowercased query with whitespace runs collapsed
     $key = strtolower(trim($q));
     $key = preg_replace('/\\s+/', ' ', $key);
     $replacements = sfConfig::get('app_a_search_refinements', array());
     if (isset($replacements[$key])) {
         $q = $replacements[$key];
     }
     try {
         $values = aZendSearch::searchLuceneWithValues(Doctrine::getTable('aPage'), $q, aTools::getUserCulture());
     } catch (Exception $e) {
         // Lucene search error: fall back to an empty result list instead of letting
         // the exception escape the action
         $values = array();
     }
     $nvalues = array();
     foreach ($values as $value) {
         // The hit object doesn't implement isset, so test the length instead
         if (strlen($value->info)) {
             $info = unserialize($value->info);
             if (!aPageTable::checkPrivilege('view', $info)) {
                 continue;
             }
         }
         $nvalue = $value;
         if (substr($nvalue->slug, 0, 1) === '@') {
             // Virtual page slug is a named Symfony route, it wants search results to go there
             $nvalue->url = $this->getController()->genUrl($nvalue->slug, true);
         } else {
             $slash = strpos($nvalue->slug, '/');
             if ($slash === false) {
                 // A virtual page (such as global) that isn't the least bit interested in
                 // being part of search results
                 continue;
             }
             if ($slash > 0) {
                 // A virtual page slug which is a valid Symfony route, such as foo/bar?id=55
                 $nvalue->url = $this->getController()->genUrl($nvalue->slug, true);
             } else {
                 // A normal CMS page
                 $nvalue->url = aTools::urlForPage($nvalue->slug);
             }
         }
         $nvalue->class = 'aPage';
         $nvalues[] = $nvalue;
     }
     $values = $nvalues;
     if ($this->searchAddResults($values, $q)) {
         usort($values, "aActions::compareScores");
     }
     $this->pager = new aArrayPager(null, sfConfig::get('app_a_search_results_per_page', 10));
     $this->pager->setResultArray($values);
     $this->pager->setPage($request->getParameter('page', 1));
     $this->pager->init();
     $this->pagerUrl = "a/search?" . http_build_query(array("q" => $q));
     // setTitle takes care of escaping things
     $this->getResponse()->setTitle(aTools::getOptionI18n('title_prefix') . 'Search for ' . $q . aTools::getOptionI18n('title_suffix'));
     $this->results = $this->pager->getResults();
 }
 /**
  * Filters the virtual pages, tags and categories associated with a particular
  * engine based on criteria such as tag, category, publication date, etc.
  *
  * Strategy: do a Lucene query (when 'q' is given) and direct SQL queries that
  * collect the relevant categories, tags and page ids. The result is sufficient to
  * populate a filters sidebar with the options that are still relevant given the
  * other criteria in effect, and to fetch the result pages (you'll want to do that
  * with a LIMIT and an IN query looking at the first n ids returned here).
  *
  * All options are optional; an unspecified or empty option places no restriction
  * on that basis. 'categoryIds' limits to the categories associated with the engine
  * page, while 'categorySlug' limits to a category chosen by the user as a filter.
  *
  *   array(
  *     'q' => 'gromit',                  # Lucene search
  *     'categoryIds' => array(1, 3, 5),
  *     'categorySlug' => 'cheese',
  *     'tag' => 'wensleydale',
  *     'slugStem' => '@a_event_search_redirect',
  *     'year' => 2010,                   # if present only 2010 is shown
  *     'month' => 12,                    # if present only Dec. 2010 is shown
  *     'day' => 15,                      # if present only Dec. 15th 2010 is shown
  *     'byEventDateRange' => true,       # events only, joins a_blog_item for the range
  *     'byPublishedAt' => true,          # blog posts or pages
  *     'alphaSort' => true,              # order pages by their title slot value
  *     'culture' => 'en',                # culture for alphaSort, defaults to the user culture
  *   )
  *
  * @param array $options see above
  * @return array with the keys
  *   'categoriesInfo'   => result of aMysql::query(): distinct c.slug / c.name rows ordered by name,
  *   'tagsByName'       => result of aMysql::query(): t.name / t_count rows ordered by name,
  *   'tagsByPopularity' => same columns, the 10 highest t_count first,
  *   'pageIds'          => result of aMysql::queryScalar(): distinct page ids in display order
  *                         (presumably a flat list - confirm against aMysql)
  */
 public static function filterForEngine($options)
 {
     $alphaSort = isset($options['alphaSort']) && $options['alphaSort'];
     $hasSlugStem = isset($options['slugStem']) && strlen($options['slugStem']);
     // Bound parameters shared by all four queries. Must exist even when no option adds one.
     $params = array();
     if (isset($options['q']) && strlen($options['q'])) {
         $q = $options['q'];
         // Refinements are keyed by the lowercased query with whitespace runs collapsed
         $key = strtolower(trim($q));
         $key = preg_replace('/\\s+/', ' ', $key);
         $replacements = sfConfig::get('app_a_search_refinements', array());
         if (isset($replacements[$key])) {
             $q = $replacements[$key];
         }
         if ($hasSlugStem) {
             $q = "({$q}) AND slug:" . $options['slugStem'];
         }
         try {
             $values = aZendSearch::searchLuceneWithValues(Doctrine::getTable('aPage'), $q, aTools::getUserCulture());
         } catch (Exception $e) {
             // Lucene search error. TODO: display it nicely if they are always safe things to display. For now: just don't crash
             $values = array();
         }
         $now = date('YmdHis');
         $pageIds = array();
         foreach ($values as $value) {
             // Regardless of the above if it ain't published yet we can't see it.
             // We filter on that in the SQL queries too but take advantage of
             // this chance to preempt a little work
             if ($value->published_at > $now) {
                 continue;
             }
             // 1.5: the names under which we store columns in Zend Lucene have changed to
             // avoid conflict with also indexing them
             $info = unserialize($value->info_stored);
             if (!aPageTable::checkPrivilege('view', $info)) {
                 continue;
             }
             $pageIds[] = $info['id'];
         }
     }
     $mysql = new aMysql();
     if ($hasSlugStem) {
         $params['slug_pattern'] = $options['slugStem'] . '%';
     }
     // Select the relevant virtual pages for this engine
     $q = 'from a_page p ';
     // If alpha sort is present we need title slots
     if ($alphaSort) {
         if (!isset($options['culture'])) {
             $options['culture'] = aTools::getUserCulture();
         }
         $culture = $options['culture'];
         $q .= "\n        LEFT JOIN a_area a ON a.page_id = p.id AND a.name = 'title' AND a.culture = :culture\n        LEFT JOIN a_area_version v ON v.area_id = a.id AND a.latest_version = v.version \n        LEFT JOIN a_area_version_slot avs ON avs.area_version_id = v.id\n        LEFT JOIN a_slot s ON s.id = avs.slot_id ";
         $params['culture'] = $culture;
     }
     // Merge in categories. A left join unless we are restricted to certain categories
     $hasCategoryIds = isset($options['categoryIds']) && count($options['categoryIds']);
     $hasCategorySlug = isset($options['categorySlug']) && strlen($options['categorySlug']);
     $restrictedByCategory = $hasCategoryIds || $hasCategorySlug;
     if ($restrictedByCategory) {
         $cjoin = 'inner join';
     } else {
         $cjoin = 'left join';
     }
     $q .= $cjoin . ' a_page_to_category ptc on ptc.page_id = p.id ' . $cjoin . ' a_category c on ptc.category_id = c.id ';
     // The engine page is locked down to these categories. If none are specified it is not
     // locked down by category
     if ($hasCategoryIds) {
         $q .= "and c.id in :category_ids ";
         $params['category_ids'] = $options['categoryIds'];
     }
     // Bring in tags...
     $hasTag = isset($options['tag']) && strlen($options['tag']);
     if ($hasTag) {
         $q .= 'inner join ';
     } else {
         $q .= 'left join ';
     }
     $q .= 'tagging ti on ti.taggable_id = p.id and ti.taggable_model = "aPage" left join tag t on ti.tag_id = t.id ';
     // Get ready to filter posts or events chronologically. The date parts are kept
     // as zero-padded strings so they can be glued into Y-m-d bounds below.
     $year = sprintf("%04d", isset($options['year']) ? $options['year'] : 0);
     $month = sprintf("%02d", isset($options['month']) ? $options['month'] : 0);
     $day = sprintf("%02d", isset($options['day']) ? $options['day'] : 0);
     $startYear = $year;
     $endYear = $year;
     if ($year > 0) {
         if ($month == 0) {
             // Whole year. Do not mess up the two digit strings please
             $startMonth = '01';
             $startDay = '01';
             $endMonth = '12';
             $endDay = '31';
         } else {
             $startMonth = $month;
             $endMonth = $month;
             if ($day == 0) {
                 // Whole month. Use the real last day of that month: an impossible
                 // date such as 2010-02-31 is not a valid bound for a date comparison
                 $startDay = '01';
                 $lastDay = 31;
                 while ($lastDay > 28 && !checkdate((int) $month, $lastDay, (int) $year)) {
                     $lastDay--;
                 }
                 $endDay = sprintf('%02d', $lastDay);
             } else {
                 $startDay = $day;
                 $endDay = $day;
             }
         }
     } else {
         // For posts "today and forward" is not a relevant concept (and a separate clause
         // already makes sure we don't see unpublished stuff). For events we'll override
         // the start date below
         $startYear = '0000';
         $startMonth = '01';
         $startDay = '01';
         $endYear = '9999';
         $endMonth = '12';
         $endDay = '31';
     }
     $events = isset($options['byEventDateRange']) && $options['byEventDateRange'];
     if ($events && $startYear === '0000') {
         // No year requested: events are listed from today forward
         list($startYear, $startMonth, $startDay) = explode('-', date('Y-m-d'));
     }
     if ($events) {
         // The event's start and end dates are part of the blog item table.
         // An event matches when its own range overlaps the requested range.
         $q .= ' inner join a_blog_item bi on bi.page_id = p.id ';
         $q .= "and bi.start_date <= :end_date ";
         $params['end_date'] = "{$endYear}-{$endMonth}-{$endDay}";
         $q .= "and bi.end_date >= :start_date ";
         $params['start_date'] = "{$startYear}-{$startMonth}-{$startDay}";
     }
     // Criteria for the pages themselves. Every later clause starts with "and", so a
     // where clause is always opened, restricted by slug only when a stem was given
     if ($hasSlugStem) {
         $q .= 'where p.slug like :slug_pattern ';
     } else {
         $q .= 'where 1 = 1 ';
     }
     // We often filter posts (not events) by a range of publication dates
     if (isset($options['byPublishedAt']) && $options['byPublishedAt']) {
         // published_at is compared against NOW() and a YmdHis stamp elsewhere in this
         // method, so it carries a time of day: the bounds must span the whole end day,
         // otherwise everything published after midnight on that day is cut off
         $q .= "and p.published_at <= :p_end_date ";
         $params['p_end_date'] = "{$endYear}-{$endMonth}-{$endDay} 23:59:59";
         $q .= "and p.published_at >= :p_start_date ";
         $params['p_start_date'] = "{$startYear}-{$startMonth}-{$startDay} 00:00:00";
     }
     // In no case do we show unpublished material
     $q .= 'and p.published_at <= NOW() and (p.archived IS NULL or p.archived IS FALSE) ';
     // ... But only those matching the Lucene search that already gave us specific IDs.
     // NOTE: if pageIds is set and is empty, NOTHING should be returned
     // (someone searched for something that doesn't appear in the system)
     if (isset($pageIds)) {
         if (count($pageIds)) {
             $q .= 'and p.id in :pageIds ';
             $params['pageIds'] = $pageIds;
         } else {
             $q .= 'and 0 <> 0 ';
         }
     }
     if ($alphaSort) {
         $pagesOrderBy = 's.value asc';
     } elseif ($events) {
         $pagesOrderBy = 'bi.start_date asc, bi.start_time asc';
     } else {
         // Blog presentation is typically descending, not ascending
         $pagesOrderBy = 'p.published_at desc';
     }
     // Separate queries, but quite fast because we're not bogged down in Doctrineland
     $c_q = $q;
     $t_q = $q;
     $p_q = $q;
     // We are filtering by this specific category
     if ($hasCategorySlug) {
         // Limit tags and pages by this specific category, but don't limit
         // categories by it, otherwise we can't present a choice of categories
         // meeting the other criteria
         $t_q .= "and c.slug = :category_slug ";
         $p_q .= "and c.slug = :category_slug ";
         $params['category_slug'] = $options['categorySlug'];
     }
     if ($hasTag) {
         // Limit pages and categories by this specific tag, but don't limit
         // tags by it, otherwise we can't present a choice of tags
         // meeting the other criteria
         $p_q .= 'and t.name = :tag_name ';
         $c_q .= 'and t.name = :tag_name ';
         $params['tag_name'] = $options['tag'];
     }
     // In the cases where we are looking for categories or tags, be sure to
     // discard the null rows from the LEFT JOINs. This is simpler than
     // determining when to switch them to INNER JOINs
     $categoriesSql = 'select distinct c.slug, c.name ' . $c_q . 'and c.slug is not null order by c.name';
     $tagsSql = 'select t.name, count(distinct p.id) as t_count ' . $t_q . 'and t.name is not null group by t.name ';
     $pagesSql = 'select distinct p.id ' . $p_q . ' order by ' . $pagesOrderBy;
     $result = array(
         'categoriesInfo' => $mysql->query($categoriesSql, $params),
         'tagsByName' => $mysql->query($tagsSql . 'order by t.name', $params),
         'tagsByPopularity' => $mysql->query($tagsSql . 'order by t_count desc limit 10', $params),
         'pageIds' => $mysql->queryScalar($pagesSql, $params),
     );
     return $result;
 }