本文整理汇总了PHP中SimpleHtmlSaxParser类的典型用法代码示例。如果您正苦于以下问题:PHP SimpleHtmlSaxParser类的具体用法?PHP SimpleHtmlSaxParser怎么用?PHP SimpleHtmlSaxParser使用的例子?那么, 这里精选的类代码示例或许可以为您提供帮助。
在下文中一共展示了SimpleHtmlSaxParser类的8个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的PHP代码示例。
示例1: parse
/**
 * Builds a page object from a fetched response by running the
 * response content through a SimpleHtmlSaxParser that is handed
 * this object (presumably as its event listener).
 * @param SimpleHttpResponse $response    Fetched response.
 * @return SimplePage                     Newly parsed page.
 * @access public
 */
function parse($response)
{
    // Start from a clean slate: no tags recorded, fresh page.
    $this->tags = array();
    $this->page = $this->createPage($response);

    $saxParser = new SimpleHtmlSaxParser($this);
    $rawContent = $response->getContent();
    $saxParser->parse($rawContent);
    $this->acceptPageEnd();

    // Take hold of the page before free() is called, because the
    // page is what gets returned once free() has run.
    $builtPage = $this->page;
    $this->free();
    return $builtPage;
}
示例2: testHtmlEntityTranslation
/**
 * Checks that normalise() translates the basic HTML entities
 * (less-than, greater-than, double quote, ampersand, single quote)
 * into their literal characters.
 */
function testHtmlEntityTranslation()
{
    // The input has to be the entity-encoded form. Feeding the literal
    // characters would both break the string quoting and test nothing.
    $this->assertEqual(
        SimpleHtmlSaxParser::normalise('&lt;&gt;&quot;&amp;&#039;'),
        '<>"&\''
    );
}
示例3: getText
/**
 * Returns the page as plain text, the way a text browser
 * would show it. The normalised text is kept in $this->_text
 * and reused on later calls; a falsy cached value (for example
 * an empty string) is recomputed every time.
 * @return string        Plain text of page.
 * @access public
 */
function getText()
{
    if ($this->_text) {
        return $this->_text;
    }
    $this->_text = SimpleHtmlSaxParser::normalise($this->_raw);
    return $this->_text;
}
示例4: getDefault
/**
 * Returns the starting value: the content of this object with
 * HTML entities decoded, passed through _wrap().
 * @return string        Parsed value.
 * @access public
 */
function getDefault()
{
    $decoded = SimpleHtmlSaxParser::decodeHtml($this->getContent());
    return $this->_wrap($decoded);
}
示例5: testNestedFrameInFrameset
/**
 * Parses a frameset holding one frame and a noframes section and
 * checks the listener sees two startElement calls (frameset, then
 * frame), the noframes markup as a single addContent call, and one
 * endElement call for the frameset.
 */
function testNestedFrameInFrameset()
{
    $html = '<frameset><frame src="frame.html"><noframes>Hello</noframes></frameset>';
    $frameAttributes = array('src' => 'frame.html');

    $listener = $this->createListener();
    $listener->expectAt(0, 'startElement', array('frameset', array()));
    $listener->expectAt(1, 'startElement', array('frame', $frameAttributes));
    $listener->expectCallCount('startElement', 2);
    $listener->expectOnce('addContent', array('<noframes>Hello</noframes>'));
    $listener->expectOnce('endElement', array('frameset'));

    $parser = new SimpleHtmlSaxParser($listener);
    $outcome = $parser->parse($html);
    $this->assertTrue($outcome);
}
示例6: normalise
/**
 * Turns HTML into the text a text browser would show. Comments
 * and script elements are dropped, images are replaced by their
 * alt text, all remaining tags are suppressed, entities are
 * decoded and runs of whitespace collapse to a single space.
 * @param string $html        HTML to convert.
 * @return string             Plain text.
 * @access public
 */
static function normalise($html)
{
    // The 's' modifier lets '.' cross line breaks so that multi-line
    // comments and script bodies are removed whole; 'i' also accepts
    // upper-case <SCRIPT> tags.
    $text = preg_replace('|<!--.*?-->|s', '', $html);
    $text = preg_replace('|<script[^>]*>.*?</script>|si', '', $text);
    // Alt text may be double quoted, single quoted or a bare word.
    $text = preg_replace('|<img[^>]*alt\\s*=\\s*"([^"]*)"[^>]*>|', ' \\1 ', $text);
    $text = preg_replace('|<img[^>]*alt\\s*=\\s*\'([^\']*)\'[^>]*>|', ' \\1 ', $text);
    $text = preg_replace('|<img[^>]*alt\\s*=\\s*([a-zA-Z_]+)[^>]*>|', ' \\1 ', $text);
    $text = preg_replace('|<[^>]*>|', '', $text);
    $text = SimpleHtmlSaxParser::decodeHtml($text);
    $text = preg_replace('|\\s+|', ' ', $text);
    // TODO: The "\xA0" byte is a single-byte (ISO-8859-1) &nbsp;.
    // Add a test for this.
    // NOTE(review): in UTF-8 text the same byte also ends some
    // multi-byte characters - confirm the charset decodeHtml() emits.
    return trim(trim($text), "\xA0");
}
示例7: normalise
/**
 * Turns HTML into the text a text browser would show. Comments
 * are dropped, images are replaced by their alt text, all
 * remaining tags are suppressed, entities are decoded and runs
 * of whitespace collapse to a single space.
 * @param string $html        HTML to convert.
 * @return string             Plain text.
 * @access public
 * @static
 */
function normalise($html)
{
    // 's' lets '.' cross line breaks so multi-line comments go too.
    $text = preg_replace('|<!--.*?-->|s', '', $html);
    // Negated character classes keep every match inside one tag and,
    // unlike '.', also match newlines. A lazy '.*?' could run past
    // the '>' of an <img> into a later tag and swallow the text
    // between them, and could not match a tag split over two lines.
    $text = preg_replace('|<img[^>]*alt\\s*=\\s*"([^"]*)"[^>]*>|', ' \\1 ', $text);
    $text = preg_replace('|<img[^>]*alt\\s*=\\s*\'([^\']*)\'[^>]*>|', ' \\1 ', $text);
    $text = preg_replace('|<img[^>]*alt\\s*=\\s*([a-zA-Z_]+)[^>]*>|', ' \\1 ', $text);
    $text = preg_replace('|<[^>]*>|', '', $text);
    $text = SimpleHtmlSaxParser::decodeHtml($text);
    $text = preg_replace('|\\s+|', ' ', $text);
    return trim($text);
}
示例8: normalise
/**
 * Turns HTML into the text a text browser would show. Comments
 * and script elements are dropped, images are replaced by their
 * alt text, all remaining tags are suppressed, entities are
 * decoded and runs of whitespace collapse to a single space.
 * @param string $html        HTML to convert.
 * @return string             Plain text.
 * @access public
 * @static
 */
function normalise($html)
{
    // The 's' modifier lets '.' cross line breaks so that multi-line
    // comments and script bodies are removed whole; 'i' also accepts
    // upper-case <SCRIPT> tags.
    $text = preg_replace('|<!--.*?-->|s', '', $html);
    $text = preg_replace('|<script[^>]*>.*?</script>|si', '', $text);
    // The quoted alt value stops at its own closing quote. A greedy
    // '[^>]*' capture would run on to the last quote in the tag and
    // pull the following attributes into the text.
    $text = preg_replace('|<img[^>]*alt\\s*=\\s*"([^"]*)"[^>]*>|', ' \\1 ', $text);
    $text = preg_replace('|<img[^>]*alt\\s*=\\s*\'([^\']*)\'[^>]*>|', ' \\1 ', $text);
    $text = preg_replace('|<img[^>]*alt\\s*=\\s*([a-zA-Z_]+)[^>]*>|', ' \\1 ', $text);
    $text = preg_replace('|<[^>]*>|', '', $text);
    $text = SimpleHtmlSaxParser::decodeHtml($text);
    $text = preg_replace('|\\s+|', ' ', $text);
    return trim($text);
}