功能:
1.擷取內容中的url,email,image。
2.替換內容中的url,email,image。
url:<a href="url">xxx</a>email:admin@admin.comimage:<img src="image">
Grep.class.php
<?php/** grep class* Date: 2013-06-15* Author: fdipzone* Ver: 1.0** Func:** set: 設定內容* get: 返回指定的內容* replace: 返回替換後的內容* get_pattern 根據type返回pattern*/class Grep{ // class start private $_pattern = array( 'url' => '/<a.*?href="((http(s)?:\/\/).*?)".*?/si', 'email' => '/([\w\-\.]+@[\w\-\.]+(\.\w+))/', 'image' => '/<img.*?src=\"(http:\/\/.+\.(jpg|jpeg|gif|bmp|png))\">/i' ); private $_content = ''; // 源內容 /* 設置搜尋的內容 * @param String $content */ public function set($content=''){ $this->_content = $content; } /* 擷取指定內容 * @param String $type * @param int $unique 0:all 1:unique * @return Array */ public function get($type='', $unique=0){ $type = strtolower($type); if($this->_content=='' || !in_array($type, array_keys($this->_pattern))){ return array(); } $pattern = $this->get_pattern($type); // 擷取pattern preg_match_all($pattern, $this->_content, $matches); return isset($matches[1])? ( $unique==0? $matches[1] : array_unique($matches[1]) ) : array(); } /* 擷取替換後的內容 * @param String $type * @param String $callback * @return String */ public function replace($type='', $callback=''){ $type = strtolower($type); if($this->_content=='' || !in_array($type, array_keys($this->_pattern)) || $callback==''){ return $this->_content; } $pattern = $this->get_pattern($type); return preg_replace_callback($pattern, $callback, $this->_content); } /* 根據type擷取pattern * @param String $type * @return String */ private function get_pattern($type){ return $this->_pattern[$type]; }} // class end?>
Demo
<?phpheader('content-type:text/htm;charset=utf8');require('Grep.class.php');$content = file_get_contents('http://www.test.com/');$obj = new Grep();$obj->set($content);$url = $obj->get('url', 0);$email = $obj->get('email', 1);$image = $obj->get('image', 1);print_r($url);print_r($email);print_r($image);$url_new = $obj->replace('url', 'replace_url');echo $url_new;function replace_url($matches){ return isset($matches[1])? '[url]'.$matches[1].'[/url]' : '';}?>
以上就是php 擷取頁面中的指定內容類別的內容,更多相關內容請關注topic.alibabacloud.com(www.php.cn)!