예제 #1
0
파일: Parser.php 프로젝트: aduroo/feed-api
 /**
  * Constructor.
  *
  * @param string $content       Feed content
  * @param string $http_encoding HTTP encoding (headers)
  * @param string $fallback_url  Fallback url when the feed provide relative or broken url
  */
 public function __construct($content, $http_encoding = '', $fallback_url = '')
 {
     $this->date = new DateParser();
     $this->fallback_url = $fallback_url;
     $xml_encoding = XmlParser::getEncodingFromXmlTag($content);
     // Strip XML tag to avoid multiple encoding/decoding in the next XML processing
     $this->content = Filter::stripXmlTag($content);
     // Encode everything in UTF-8
     Logger::setMessage(get_called_class() . ': HTTP Encoding "' . $http_encoding . '" ; XML Encoding "' . $xml_encoding . '"');
     $this->content = Encoding::convert($this->content, $xml_encoding ?: $http_encoding);
 }
예제 #2
0
파일: Scraper.php 프로젝트: aduroo/feed-api
 /**
  * Normalize encoding and strip head tag.
  */
 public function prepareHtml()
 {
     $html_encoding = XmlParser::getEncodingFromMetaTag($this->html);
     $this->html = Encoding::convert($this->html, $html_encoding ?: $this->encoding);
     $this->html = Filter::stripHeadTags($this->html);
     Logger::setMessage(get_called_class() . ': HTTP Encoding "' . $this->encoding . '" ; HTML Encoding "' . $html_encoding . '"');
 }