在给网站页面做SEO的时候,常会用到的一些函数。
比如:良好URL生成,用户名过滤,email检测,截取字符串,全角替换成半角,删除html等
1. [PHP]代码
<?php

/**
 * Collection of string helpers for SEO work: URL slugs, user-name and title
 * normalisation, e-mail / URL / zip-code extraction, HTML stripping and
 * width-aware truncation.
 *
 * All text is assumed to be UTF-8. The slug helpers deliberately run their
 * regular expressions in byte mode (no `u` modifier) so that multi-byte
 * characters (bytes 0x80-0xFF) pass through untouched and invalid UTF-8 input
 * does not make PCRE fail.
 */
class SeoTools
{
    /**
     * Punctuation turned into a blank by friendlyURL(), CheckUser() and mktitle().
     * Kept as a plain character list and quoted at runtime, so regex
     * metacharacters such as "?", "(", ")" and "|" cannot break the pattern.
     */
    private static $slugPunctuation = '~·!@#¥%…&×()-+=『【』】、:;“”\'《,》。?/—_√<°丶>★|│‖ˇ';

    /** Punctuation turned into a blank (and then removed) by DelNoStr(). */
    private static $stripPunctuation = '~·!@#¥%…&×()-+=『【』】、:;“”’《,》。?/—_‘√<°丶ˇ';

    /** Accented Latin letters and their ASCII transliteration. */
    private static $accentMap = array(
        'à' => 'a', 'á' => 'a', 'å' => 'a', 'â' => 'a', 'ä' => 'a',
        'è' => 'e', 'é' => 'e', 'ê' => 'e', 'ẽ' => 'e', 'ë' => 'e',
        'ì' => 'i', 'í' => 'i', 'î' => 'i',
        'ò' => 'o', 'ó' => 'o', 'ô' => 'o', 'ø' => 'o',
        'ù' => 'u', 'ú' => 'u', 'ů' => 'u', 'û' => 'u',
        'ç' => 'c', 'č' => 'c',
        'ñ' => 'n', 'ň' => 'n',
        'ľ' => 'l', 'ý' => 'y', 'ť' => 't', 'ž' => 'z', 'š' => 's',
        'æ' => 'ae', 'ö' => 'oe', 'ü' => 'ue',
        'Ä' => 'Ae', 'Ü' => 'Ue', 'Ö' => 'Oe',
        'ß' => 'ss',
    );

    /**
     * Builds a URL-friendly slug: accents folded to ASCII, punctuation dropped,
     * whitespace runs collapsed into $replacement, ASCII letters lower-cased.
     *
     * @param string $string      Text to convert.
     * @param string $replacement Separator placed between words.
     * @return string
     */
    public function friendlyURL($string, $replacement = '-')
    {
        return $this->slugify($string, $replacement, self::$slugPunctuation, '/[^\w\s\x80-\xff]/');
    }

    /**
     * Checks whether $mailAddr looks like an e-mail address.
     *
     * @param string $mailAddr
     * @return bool True when the address is longer than 6 bytes and matches the pattern.
     */
    public function isEmail($mailAddr)
    {
        return strlen($mailAddr) > 6
            && preg_match("/^[\w\-\.]+@[\w\-]+(\.\w+)+$/", $mailAddr) === 1;
    }

    /**
     * Normalises a user name; same rules as friendlyURL() with "_" as the
     * default separator.
     *
     * @param string $string
     * @param string $replacement
     * @return string
     */
    public function CheckUser($string, $replacement = '_')
    {
        return $this->slugify($string, $replacement, self::$slugPunctuation, '/[^\w\s\x80-\xff]/');
    }

    /**
     * Normalises a title; like CheckUser() but "." and "^" survive the final
     * clean-up pass.
     *
     * @param string $string
     * @param string $replacement
     * @return string
     */
    public function mktitle($string, $replacement = '_')
    {
        return $this->slugify($string, $replacement, self::$slugPunctuation, '/[^\w\s^.\x80-\xff]/');
    }

    /**
     * Converts full-width digits, Latin letters and the ideographic space to
     * their half-width (ASCII) counterparts.
     *
     * NOTE(review): the published listing shows every pair as an identity
     * mapping ('1' => '1', ...), which would make this method a no-op. The keys
     * are rebuilt here from the Unicode full-width forms (U+FF10-U+FF19,
     * U+FF21-U+FF3A, U+FF41-U+FF5A, U+3000) - confirm against the original file.
     *
     * @param string $string
     * @return string
     */
    public function Qj2bj($string)
    {
        return strtr((string) $string, $this->fullWidthTable());
    }

    /**
     * Removes non-breaking spaces, "?" characters, ideographic spaces and all
     * other whitespace.
     *
     * NOTE(review): the two blank patterns of the listing are read as the
     * "&nbsp;" entity / U+00A0 and U+3000 - confirm against the original file.
     *
     * @param string $string
     * @return string
     */
    public function DelNbsp($string)
    {
        $string = str_replace(array('&nbsp;', "\xC2\xA0", '?', "\xE3\x80\x80"), '', (string) $string);

        return preg_replace('/\s+/', '', $string);
    }

    /**
     * Returns the first run of five or more ASCII digits found in $str.
     *
     * @param string $str
     * @return string The digits, or '' when there is no such run.
     */
    public function getZipcode($str)
    {
        // Same matches as the former /[0-9]{1}(\d+){4,5}/ without the nested quantifier.
        return preg_match('/\d{5,}/', $str, $found) === 1 ? $found[0] : '';
    }

    /**
     * Left-pads a 4- or 5-character zip code with zeros to 6 characters.
     *
     * @param string $str
     * @return string The 6-character code, or '' when the length is not 4, 5 or 6.
     */
    public function checkZipcode($str)
    {
        $length = strlen($str);
        if ($length < 4 || $length > 6) {
            return '';
        }

        return str_pad($str, 6, '0', STR_PAD_LEFT);
    }

    /**
     * Extracts every e-mail address from $str.
     *
     * @param string $str
     * @return string Comma-separated addresses, or '' when none is found.
     */
    public function getEmail($str)
    {
        $pattern = "/\w+([-+.]\w+)*@\w+([-.]\w+)*\.\w+([-.]\w+)*/i";
        preg_match_all($pattern, $str, $emailArr);

        return empty($emailArr[0]) ? '' : implode(',', $emailArr[0]);
    }

    /**
     * Extracts URL-like tokens from $str and strips their http/https/ftp scheme.
     * The scheme is optional in the pattern, so bare words are returned as well.
     *
     * @param string $str
     * @return string Comma-separated tokens, or '' when none is found.
     */
    public function getUrl($str)
    {
        // The hyphen sits last in the class so it is a literal; the former
        // "&-_" was an accidental range that also matched < > ' ( ) [ ] etc.
        $pattern = "/(http:\/\/|https:\/\/|ftp:\/\/)?([\w:\/\.\?=&_-]+)/is";
        preg_match_all($pattern, $str, $urlArr);
        if (empty($urlArr[0])) {
            return '';
        }

        return preg_replace('/(http:\/\/|https:\/\/|ftp:\/\/)/', '', implode(',', $urlArr[0]));
    }

    /**
     * Collects the anchors of an HTML document.
     *
     * @param string $document HTML source.
     * @return array Optional keys: 'link' (quoted hrefs first, then unquoted
     *               ones), 'content' (anchor bodies), 'all' (complete matches).
     *               A key is absent when nothing non-empty was captured for it.
     */
    public function match_links($document)
    {
        $match = array();
        preg_match_all(
            '~<\s*a\s.*?href\s*=\s*(["\'])?(?(1)(.*?)\1|([^\s>]+))[^>]*>?(.*?)</a>~is',
            $document,
            $links
        );

        // Capture group => result key; foreach replaces each(), removed in PHP 8.
        $targets = array(2 => 'link', 3 => 'link', 4 => 'content', 0 => 'all');
        foreach ($targets as $group => $key) {
            foreach ($links[$group] as $value) {
                if (!empty($value)) {
                    $match[$key][] = $value;
                }
            }
        }

        return $match;
    }

    /**
     * Folds accents to ASCII and removes punctuation and every whitespace
     * character. Letter case is left untouched.
     *
     * @param string $string
     * @return string
     */
    public function DelNoStr($string)
    {
        $clean = $this->foldToAscii($string, self::$stripPunctuation, '/[^\w\s\x80-\xff]/');

        return preg_replace('/\s+/', '', $clean);
    }

    /**
     * Turns a slug back into words: lower-cases $string and replaces every
     * match of $find with a blank.
     *
     * @param string $string
     * @param string $find Regular expression (with delimiters) for the separator.
     * @return string
     */
    public function UrlToStr($string, $find = '/-/')
    {
        return trim(preg_replace($find, ' ', strtolower($string)));
    }

    /**
     * Returns the first character of the pinyin transcription of $str.
     *
     * @param string $str
     * @return string
     */
    public function GetPyLetter($str)
    {
        // mb_substr keeps a multi-byte first character intact when no
        // transcription is available for it.
        return mb_substr(pinyin($str, true), 0, 1, 'UTF-8');
    }

    /**
     * Returns the lower-cased pinyin transcription of $str.
     *
     * @param string $str
     * @return string
     */
    public function GetPinYin($str)
    {
        return strtolower(pinyin($str, true));
    }

    /**
     * Strips <script> blocks and HTML tags, collapses whitespace that follows a
     * line break, and decodes a fixed set of HTML entities to UTF-8.
     *
     * NOTE(review): the listing replaces the German umlaut entities and a
     * literal "ß" with "?", which looks like an encoding casualty; they are
     * decoded to the real characters here, and the last rule is read as
     * "&szlig;" - confirm against the original file.
     *
     * @param string $str
     * @return string
     */
    public function DelCode($str)
    {
        // Order matters: "&amp;" is decoded before "&lt;" / "&gt;", as in the original.
        $rules = array(
            '~<script[^>]*?>.*?</script>~si' => '',             // javascript
            '~<[/!]*?[^<>]*?>~si'            => '',             // html tags
            '~([\r\n])\s+~'                  => '$1',           // whitespace after a line break
            '~&(quot|#34|#034|#x22);~i'      => '"',
            '~&(amp|#38|#038|#x26);~i'       => '&',
            '~&(lt|#60|#060|#x3c);~i'        => '<',
            '~&(gt|#62|#062|#x3e);~i'        => '>',
            '~&(nbsp|#160|#xa0);~i'          => ' ',
            // UTF-8 byte sequences instead of chr(161)...: a lone Latin-1 byte is
            // invalid UTF-8 and makes htmlspecialchars() in CutStr() return ''.
            '~&(iexcl|#161);~i'              => "\xC2\xA1",
            '~&(cent|#162);~i'               => "\xC2\xA2",
            '~&(pound|#163);~i'              => "\xC2\xA3",
            '~&(copy|#169);~i'               => "\xC2\xA9",
            '~&(reg|#174);~i'                => "\xC2\xAE",
            '~&(deg|#176);~i'                => "\xC2\xB0",
            '~&(#39|#039|#x27);~'            => "'",
            '~&(euro|#8364);~i'              => "\xE2\x82\xAC",
            '~&a(uml|UML);~'                 => 'ä',            // german
            '~&o(uml|UML);~'                 => 'ö',
            '~&u(uml|UML);~'                 => 'ü',
            '~&A(uml|UML);~'                 => 'Ä',
            '~&O(uml|UML);~'                 => 'Ö',
            '~&U(uml|UML);~'                 => 'Ü',
            '~&szlig;~i'                     => 'ß',
        );

        return trim(preg_replace(array_keys($rules), array_values($rules), (string) $str));
    }

    /**
     * Cuts $sourcestr (after DelCode()) to a display width of $cutlength.
     *
     * Multi-byte characters and ASCII capitals count as 1, every other byte
     * counts as 0.5. A "." is appended when text was cut off, and the result is
     * passed through htmlspecialchars().
     *
     * @param string    $sourcestr
     * @param int|float $cutlength Maximum display width.
     * @return string
     */
    public function CutStr($sourcestr, $cutlength)
    {
        $text = rtrim($this->DelCode($sourcestr));
        $byteLength = strlen($text);
        $result = '';
        $offset = 0;
        $width = 0;

        while ($width < $cutlength && $offset < $byteLength) {
            $lead = ord($text[$offset]);
            if ($lead >= 240) {
                // 4-byte sequence; previously cut after 3 bytes, leaving invalid UTF-8.
                $size = 4;
                $width += 1;
            } elseif ($lead >= 224) {
                $size = 3;
                $width += 1;
            } elseif ($lead >= 192) {
                $size = 2;
                $width += 1;
            } elseif ($lead >= 65 && $lead <= 90) {
                // Capitals are wide enough to count as a full-width character.
                $size = 1;
                $width += 1;
            } else {
                // Lower-case letters, digits and half-width punctuation.
                $size = 1;
                $width += 0.5;
            }
            $result .= substr($text, $offset, $size);
            $offset += $size;
        }

        if ($byteLength > $offset) {
            $result .= '.'; // marks the truncation
        }

        return htmlspecialchars($result);
    }

    /**
     * Turns a comma-separated tag list into the trimmed tags, each followed by
     * one blank.
     *
     * @param string $tags_str
     * @return string
     */
    public function CreateTagLink($tags_str)
    {
        $output = '';
        foreach (explode(',', $tags_str) as $tag) {
            $output .= trim($tag) . ' ';
        }

        return $output;
    }

    /**
     * Shared tail of friendlyURL(), CheckUser() and mktitle(): clean the text,
     * collapse whitespace into $replacement, lower-case, trim the separator.
     */
    private function slugify($string, $replacement, $punctuation, $strayPattern)
    {
        $clean = $this->foldToAscii($string, $punctuation, $strayPattern);
        $clean = preg_replace('/\s+/', $replacement, $clean);
        $clean = preg_replace('/\s+/', $replacement, strtolower($clean));

        return trim($clean, $replacement);
    }

    /**
     * Trims the text, transliterates accents, and blanks out the listed
     * punctuation plus every byte matched by $strayPattern.
     */
    private function foldToAscii($string, $punctuation, $strayPattern)
    {
        $text = strtr(trim((string) $string), self::$accentMap);

        // NOTE(review): the listing shows two visually identical blank patterns
        // ('/ /' => ' ' and '/ /' => ''); taken literally the second overwrites
        // the first and deletes every space. They are read here as
        // "&nbsp;" / U+00A0 and U+3000 - confirm against the original file.
        $text = str_replace(array('&nbsp;', "\xC2\xA0"), ' ', $text);
        $text = str_replace("\xE3\x80\x80", '', $text);

        $text = preg_replace($this->punctuationPattern($punctuation), ' ', $text);

        return preg_replace($strayPattern, ' ', $text);
    }

    /** Builds a byte-mode alternation matching any single character of $characters. */
    private function punctuationPattern($characters)
    {
        $alternatives = array();
        foreach (preg_split('//u', $characters, -1, PREG_SPLIT_NO_EMPTY) as $character) {
            $alternatives[] = preg_quote($character, '/');
        }

        return '/' . implode('|', $alternatives) . '/';
    }

    /** Builds the full-width => half-width table used by Qj2bj(). */
    private function fullWidthTable()
    {
        static $table = null;
        if ($table === null) {
            $table = array("\xE3\x80\x80" => ' ');
            $ascii = '0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ';
            foreach (str_split($ascii) as $half) {
                // Full-width forms sit at a fixed distance of 0xFEE0 from ASCII.
                $codePoint = ord($half) + 0xFEE0;
                $full = chr(0xE0 | ($codePoint >> 12))
                    . chr(0x80 | (($codePoint >> 6) & 0x3F))
                    . chr(0x80 | ($codePoint & 0x3F));
                $table[$full] = $half;
            }
        }

        return $table;
    }
}

/**
 * Chinese to pinyin converter.
 *
 * Reads fixed 16-byte records from "pinyin.dat" located next to this file;
 * the record of a character is addressed by (code point - 19968) * 16.
 * When the data file is missing every character is returned unchanged.
 *
 * @author Lukin <my@lukin.cn>
 * @date 2011-01-25 10:44
 */
class PinYin
{
    /** Code point of the first table record (U+4E00). */
    const TABLE_START = 19968;

    // Handle of the lookup table, null when the data file is unavailable.
    private $fp = null;
    private $dat = 'pinyin.dat';

    public function __construct()
    {
        $this->dat = dirname(__FILE__) . '/' . $this->dat;
        if (is_file($this->dat)) {
            $handle = fopen($this->dat, 'rb');
            $this->fp = $handle ? $handle : null;
        }
    }

    /**
     * Converts a string to pinyin, character by character.
     *
     * NOTE(review): as in the original, $polyphony is only honoured when
     * $ucfirst is true; with $ucfirst = false a record containing commas is
     * appended unchanged - confirm whether that is intended.
     *
     * @param string $str       Text to convert (UTF-8).
     * @param bool   $ucfirst   Upper-case the first letter of every reading.
     * @param bool   $polyphony Keep only the first of several comma-separated readings.
     * @return string
     */
    public function encode($str, $ucfirst = true, $polyphony = true)
    {
        $ret = '';
        $len = mb_strlen($str, 'UTF-8');
        for ($i = 0; $i < $len; $i++) {
            $py = $this->pinyin(mb_substr($str, $i, 1, 'UTF-8'));
            if ($ucfirst && strpos($py, ',') !== false) {
                $readings = explode(',', $py);
                if ($polyphony) {
                    $readings = array_slice($readings, 0, 1);
                }
                $ret .= implode(',', array_map('ucfirst', $readings));
            } else {
                $ret .= $ucfirst ? ucfirst($py) : $py;
            }
        }

        return $ret;
    }

    /**
     * Decodes one 3-byte UTF-8 sequence to its code point.
     *
     * @param string $word
     * @return int The code point, or -1 when $word is not a 3-byte UTF-8 sequence.
     */
    private function char2dec($word)
    {
        if (strlen($word) !== 3) {
            return -1;
        }
        $lead = ord($word[0]);
        $mid = ord($word[1]);
        $tail = ord($word[2]);
        if (($lead & 0xF0) !== 0xE0 || ($mid & 0xC0) !== 0x80 || ($tail & 0xC0) !== 0x80) {
            return -1;
        }

        // 1110xxxx 10yyyyyy 10zzzzzz => xxxxyyyyyyzzzzzz
        return (($lead & 0x0F) << 12) | (($mid & 0x3F) << 6) | ($tail & 0x3F);
    }

    /**
     * Looks up the pinyin record of a single character.
     *
     * @param string $char One character (UTF-8).
     * @return string The trimmed record, or $char itself when no lookup is possible.
     */
    public function pinyin($char)
    {
        if (strlen($char) !== 3 || !$this->fp) {
            return $char;
        }

        $codePoint = $this->char2dec($char);
        if ($codePoint < self::TABLE_START) {
            // Would be a negative file offset: the failed seek used to be
            // ignored and an unrelated record was read.
            return $char;
        }
        if (fseek($this->fp, ($codePoint - self::TABLE_START) << 4, SEEK_SET) !== 0) {
            return $char;
        }

        return trim((string) fread($this->fp, 16));
    }

    public function __destruct()
    {
        if ($this->fp) {
            fclose($this->fp);
        }
    }
}

/**
 * Returns the PinYin instance, creating it on first use.
 *
 * @return PinYin
 */
function &_pinyin_get_object()
{
    static $pinyin;
    if (is_null($pinyin)) {
        $pinyin = new PinYin();
    }

    return $pinyin;
}

if (!function_exists('pinyin')) {
    /**
     * Converts a string to pinyin.
     *
     * @param string $str
     * @param bool   $ucfirst Upper-case the first letter of every reading.
     * @return string
     */
    function pinyin($str, $ucfirst = true)
    {
        $py = _pinyin_get_object();

        return $py->encode($str, $ucfirst);
    }
}
以上就是分享一个PHP 网站SEO及过滤类,方便使用的内容,更多相关内容请关注PHP中文网(www.php.cn)!

熱AI工具

Undresser.AI Undress
人工智慧驅動的應用程序,用於創建逼真的裸體照片

AI Clothes Remover
用於從照片中去除衣服的線上人工智慧工具。

Undress AI Tool
免費脫衣圖片

Clothoff.io
AI脫衣器

AI Hentai Generator
免費產生 AI 無盡。

熱門文章

熱工具

DVWA
Damn Vulnerable Web App (DVWA) 是一個PHP/MySQL的Web應用程序,非常容易受到攻擊。它的主要目標是成為安全專業人員在合法環境中測試自己的技能和工具的輔助工具,幫助Web開發人員更好地理解保護網路應用程式的過程,並幫助教師/學生在課堂環境中教授/學習Web應用程式安全性。 DVWA的目標是透過簡單直接的介面練習一些最常見的Web漏洞,難度各不相同。請注意,該軟體中

MinGW - Minimalist GNU for Windows
這個專案正在遷移到osdn.net/projects/mingw的過程中,你可以繼續在那裡關注我們。 MinGW:GNU編譯器集合(GCC)的本機Windows移植版本,可自由分發的導入函式庫和用於建置本機Windows應用程式的頭檔;包括對MSVC執行時間的擴展,以支援C99功能。 MinGW的所有軟體都可以在64位元Windows平台上運作。

Safe Exam Browser
Safe Exam Browser是一個安全的瀏覽器環境,安全地進行線上考試。該軟體將任何電腦變成一個安全的工作站。它控制對任何實用工具的訪問,並防止學生使用未經授權的資源。

Atom編輯器mac版下載
最受歡迎的的開源編輯器

mPDF
mPDF是一個PHP庫,可以從UTF-8編碼的HTML產生PDF檔案。原作者Ian Back編寫mPDF以從他的網站上「即時」輸出PDF文件,並處理不同的語言。與原始腳本如HTML2FPDF相比,它的速度較慢,並且在使用Unicode字體時產生的檔案較大,但支援CSS樣式等,並進行了大量增強。支援幾乎所有語言,包括RTL(阿拉伯語和希伯來語)和CJK(中日韓)。支援嵌套的區塊級元素(如P、DIV),