| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265 | 
							- <?php
 
// Directory (with trailing separator) that holds the code-table files read by the converters in this file.
define('CODETABLEDIR', __DIR__.DIRECTORY_SEPARATOR.'encoding'.DIRECTORY_SEPARATOR);
 
/**
 * Convert a UTF-8 string to GBK.
 *
 * Every multi-byte UTF-8 sequence is decoded with utf8_to_unicode() and
 * looked up in the table read from CODETABLEDIR.'gb-unicode.table', which is
 * cached in the global $UC2GBTABLE. Code points missing from the table are
 * written as numeric entities ("&#N;"). A byte that cannot start a UTF-8
 * sequence, or a sequence cut short by the end of the input, is written
 * as "?". The result is trimmed before it is returned.
 *
 * @param string $utfstr UTF-8 encoded input
 * @return string converted text
 */
function utf8_to_gbk($utfstr) {
	global $UC2GBTABLE;
	if(empty($UC2GBTABLE)) {
		$fp = fopen(CODETABLEDIR.'gb-unicode.table', 'rb');
		// If the table cannot be opened, every non-ASCII character falls back to "&#N;".
		if($fp !== false) {
			while($l = fgets($fp, 15)) {
				// Characters 7-12 of a row are the lookup key (code point), characters 0-5 the GB value.
				$UC2GBTABLE[hexdec(substr($l, 7, 6))] = hexdec(substr($l, 0, 6));
			}
			fclose($fp);
		}
	}
	$okstr = '';
	$ulen = strlen($utfstr);
	for($i = 0; $i < $ulen; $i++) {
		$byte = ord($utfstr[$i]);
		if($byte < 0x80) {
			// Plain ASCII is copied through unchanged.
			$okstr .= $utfstr[$i];
			continue;
		}
		// The lead byte's high bits give the total length of the sequence.
		if(($byte & 0xE0) == 0xC0) {
			$csize = 2;
		} elseif(($byte & 0xF0) == 0xE0) {
			$csize = 3;
		} elseif(($byte & 0xF8) == 0xF0) {
			$csize = 4;
		} else {
			// Stray continuation byte or invalid lead byte.
			$okstr .= '?';
			continue;
		}
		if($i + $csize > $ulen) {
			// Sequence is truncated by the end of the input.
			$okstr .= '?';
			break;
		}
		$c = utf8_to_unicode(substr($utfstr, $i, $csize));
		$i += $csize - 1;
		if(isset($UC2GBTABLE[$c])) {
			// Table values get 0x8080 added to form the two output bytes.
			$gb = $UC2GBTABLE[$c] + 0x8080;
			$okstr .= chr(($gb >> 8) & 0xFF).chr($gb & 0xFF);
		} else {
			$okstr .= '&#'.$c.';';
		}
	}
	return trim($okstr);
}
 
/**
 * Convert a GBK string to UTF-8.
 *
 * Bytes up to 0x80 are copied through. Any larger byte is taken together
 * with the following byte as one double-byte character, which is looked up
 * (minus 0x8080) in the table read from CODETABLEDIR.'gb-unicode.table' and
 * cached in the global $CODETABLE. Characters that are not in the table,
 * including a dangling lead byte at the end of the input, are dropped.
 *
 * @param string $gbstr GBK encoded input
 * @return string UTF-8 encoded text
 */
function gbk_to_utf8($gbstr) {
	global $CODETABLE;
	if(empty($CODETABLE)) {
		$fp = fopen(CODETABLEDIR.'gb-unicode.table', 'rb');
		if($fp !== false) {
			while($l = fgets($fp, 15)) {
				// Characters 0-5 of a row are the GB key, characters 7-12 the hex code point.
				$CODETABLE[hexdec(substr($l, 0, 6))] = substr($l, 7, 6);
			}
			fclose($fp);
		}
	}
	$ret = '';
	$gbstr = (string)$gbstr;
	$len = strlen($gbstr);
	// Walk by index: testing the remaining string for truthiness would stop at a tail of "0".
	for($i = 0; $i < $len; $i++) {
		$byte = ord($gbstr[$i]);
		if($byte <= 0x80) {
			$ret .= $gbstr[$i];
			continue;
		}
		$thisW = substr($gbstr, $i, 2);
		$i++;
		$key = hexdec(bin2hex($thisW)) - 0x8080;
		if(!isset($CODETABLE[$key])) {
			continue;
		}
		// unicode_to_utf8() returns the byte values as concatenated decimal numbers,
		// three digits per byte for anything outside ASCII.
		$utf8 = unicode_to_utf8(hexdec($CODETABLE[$key]));
		for($k = 0, $n = strlen($utf8); $k < $n; $k += 3) {
			$ret .= chr((int)substr($utf8, $k, 3));
		}
	}
	return $ret;
}
 
/**
 * Convert Big5 (Traditional Chinese) text to GBK (Simplified Chinese).
 *
 * The mapping is read once from CODETABLEDIR.'big5-gb.table' into the global
 * $BIG5_DATA. Every byte >= 0x80 is treated as the lead byte of a two-byte
 * character and replaced in place by the two bytes found in the table.
 * Pairs whose table offset falls outside the loaded data are left unchanged.
 *
 * @param string $Text Big5 encoded input
 * @return string text with each mapped pair replaced
 */
function big5_to_gbk($Text) {
	global $BIG5_DATA;
	if(empty($BIG5_DATA)) {
		$data = file_get_contents(CODETABLEDIR.'big5-gb.table');
		if($data !== false) {
			$BIG5_DATA = $data;
		}
	}
	// Stop one byte early: a pair needs a following byte.
	$max = strlen($Text) - 1;
	for($i = 0; $i < $max; $i++) {
		$h = ord($Text[$i]);
		if($h < 0x80) {
			continue;
		}
		$l = ord($Text[$i+1]);
		if($h == 161 && $l == 64) {
			// Big5 0xA140 is the full-width space; 0xA1A1 is its GBK counterpart.
			// The replacement must be two bytes to fill the two-byte slot.
			$gbstr = "\xA1\xA1";
		} else {
			// 510 bytes per lead byte (counted from 160), two bytes per trail byte.
			$p = ($h-160)*510 + ($l-1)*2;
			if($p >= 0 && isset($BIG5_DATA[$p+1])) {
				$gbstr = $BIG5_DATA[$p].$BIG5_DATA[$p+1];
			} else {
				// Offset is outside the table: keep the original pair.
				$gbstr = $Text[$i].$Text[$i+1];
			}
		}
		$Text[$i] = $gbstr[0];
		$Text[$i+1] = $gbstr[1];
		$i++;
	}
	return $Text;
}
 
/**
 * Convert GBK (Simplified Chinese) text to Big5 (Traditional Chinese).
 *
 * The mapping is read once from CODETABLEDIR.'gb-big5.table' into the global
 * $GB_DATA. Every byte >= 0x80 is treated as the lead byte of a two-byte
 * character and replaced in place by the two bytes found in the table.
 * Pairs whose table offset falls outside the loaded data are left unchanged.
 *
 * @param string $Text GBK encoded input
 * @return string text with each mapped pair replaced
 */
function gbk_to_big5($Text) {
	global $GB_DATA;
	if(empty($GB_DATA)) {
		// Store the table in the global that the lookup below actually reads.
		$data = file_get_contents(CODETABLEDIR.'gb-big5.table');
		if($data !== false) {
			$GB_DATA = $data;
		}
	}
	// Stop one byte early: a pair needs a following byte.
	$max = strlen($Text) - 1;
	for($i = 0; $i < $max; $i++) {
		$h = ord($Text[$i]);
		if($h < 0x80) {
			continue;
		}
		$l = ord($Text[$i+1]);
		if($h == 161 && $l == 64) {
			// Two-byte replacement (the Big5 full-width space) so both offsets can be filled.
			// NOTE(review): the previous code assigned a one-character string here; confirm the intended mapping.
			$big = "\xA1\x40";
		} else {
			// 510 bytes per lead byte (counted from 160), two bytes per trail byte.
			$p = ($h-160)*510 + ($l-1)*2;
			if($p >= 0 && isset($GB_DATA[$p+1])) {
				$big = $GB_DATA[$p].$GB_DATA[$p+1];
			} else {
				// Offset is outside the table: keep the original pair.
				$big = $Text[$i].$Text[$i+1];
			}
		}
		$Text[$i] = $big[0];
		$Text[$i+1] = $big[1];
		$i++;
	}
	return $Text;
}
 
/**
 * Encode a Unicode code point as UTF-8 byte values.
 *
 * The result is NOT a raw byte string: each byte value is appended as a
 * decimal number ("228184173" for U+4E2D). For code points below 0x80 the
 * number itself is returned as a string. Values of 0x200000 and above give
 * an empty string.
 *
 * @param int $c code point
 * @return string concatenated decimal byte values
 */
function unicode_to_utf8($c) {
	if($c < 0x80) {
		return '' . $c;
	}
	if($c < 0x800) {
		$lead = 0xC0 | ($c >> 6);
		$tail = 0x80 | ($c & 0x3F);
		return $lead . $tail;
	}
	if($c < 0x10000) {
		$lead = 0xE0 | ($c >> 12);
		$mid  = 0x80 | (($c >> 6) & 0x3F);
		$tail = 0x80 | ($c & 0x3F);
		return $lead . $mid . $tail;
	}
	if($c < 0x200000) {
		$lead  = 0xF0 | ($c >> 18);
		$upper = 0x80 | (($c >> 12) & 0x3F);
		$lower = 0x80 | (($c >> 6) & 0x3F);
		$tail  = 0x80 | ($c & 0x3F);
		return $lead . $upper . $lower . $tail;
	}
	return '';
}
 
/**
 * Decode one UTF-8 encoded character into its Unicode code point.
 *
 * The byte length of $c selects how the lead byte is masked; each following
 * byte contributes its low six bits.
 *
 * @param string $c a single character of 1 to 4 bytes
 * @return int|null the code point, or null when $c is not 1 to 4 bytes long
 */
function utf8_to_unicode($c) {
	$size = strlen($c);
	if($size < 1 || $size > 4) {
		return null;
	}
	if($size == 1) {
		return ord($c);
	}
	// Payload mask applied to the lead byte, indexed by sequence length.
	$leadMask = array(2 => 0x3f, 3 => 0x1f, 4 => 0x0f);
	$n = ord($c[0]) & $leadMask[$size];
	for($k = 1; $k < $size; $k++) {
		$n = ($n << 6) + (ord($c[$k]) & 0x3f);
	}
	return $n;
}
 
/**
 * Map one character code to its pinyin (or to the ASCII character itself).
 *
 * Codes below 128 are returned as the corresponding character. Otherwise an
 * exact key in $pyarr wins; failing that, the value of the first key that is
 * greater than or equal to $asc (in the array's iteration order) is used.
 *
 * @param int   $asc   character code
 * @param array $pyarr code => pinyin table, passed by reference
 * @return string|null the match, or null when no key qualifies
 */
function asc_to_pinyin($asc,&$pyarr) {
	if($asc < 128) {
		return chr($asc);
	}
	if(isset($pyarr[$asc])) {
		return $pyarr[$asc];
	}
	foreach($pyarr as $code => $pinyin) {
		if($code >= $asc) {
			return $pinyin;
		}
	}
	return null;
}
 
/**
 * Convert text to a list of pinyin syllables / ASCII characters.
 *
 * When the CHARSET constant is not 'gbk' the input is first converted to GBK
 * with iconv(). The table is read from CODETABLEDIR.'gb-pinyin.table', whose
 * rows are split on "-" into a pinyin string and a numeric code, then sorted
 * by code and kept for later calls. Each input character is resolved through
 * asc_to_pinyin().
 *
 * @param string $txt input text in the CHARSET encoding
 * @return array one entry per input character
 */
function gbk_to_pinyin($txt) {
	// Parsed table, kept between calls so the file is read and sorted only once.
	static $table = null;
	if(CHARSET != 'gbk') {
		$txt = iconv(CHARSET,'GBK',$txt);
	}
	if($table === null) {
		$fp = fopen(CODETABLEDIR.'gb-pinyin.table','r');
		// Only loop on a valid handle: feof() on a failed fopen() never becomes true.
		if($fp !== false) {
			$loaded = array();
			while(($line = fgets($fp,32)) !== false) {
				$p = explode("-",$line);
				if(!isset($p[1])) {
					// Blank or malformed row without a code.
					continue;
				}
				$loaded[intval($p[1])] = trim($p[0]);
			}
			fclose($fp);
			ksort($loaded);
			$table = $loaded;
		}
	}
	$pyarr = ($table === null) ? array() : $table;
	$py = array();
	// iconv() returns false on failure; treat that as empty input.
	$txt = (string)$txt;
	$l = strlen($txt);
	for($i = 0; $i < $l; $i++) {
		$tmp = ord($txt[$i]);
		if($tmp >= 128) {
			// A lead byte at the very end has no trail byte; count it as 0.
			$next = ($i + 1 < $l) ? ord($txt[$i+1]) : 0;
			$asc = abs($tmp*256 + $next - 65536);
			$i++;
		} else {
			$asc = $tmp;
		}
		$py[] = asc_to_pinyin($asc,$pyarr);
	}
	return $py;
}
 
/**
 * Apply utf8_to_gbk() to a value or, recursively, to every element of an array.
 *
 * Array keys are kept as they are; only values are converted.
 *
 * @param mixed $data a single value or a (nested) array of values
 * @return mixed the converted value, or the array with converted values
 */
function array_utf8_to_gbk($data) {
	if(is_array($data)) {
		foreach($data as $k => $item) {
			// Recursion handles both nested arrays and plain values.
			$data[$k] = array_utf8_to_gbk($item);
		}
		return $data;
	}
	return utf8_to_gbk($data);
}
 
/**
 * Apply gbk_to_utf8() to a value or, recursively, to every element of an array.
 *
 * Array keys are kept as they are; only values are converted.
 *
 * @param mixed $data a single value or a (nested) array of values
 * @return mixed the converted value, or the array with converted values
 */
function array_gbk_to_utf8($data) {
	if(is_array($data)) {
		foreach($data as $k => $item) {
			// Recursion handles both nested arrays and plain values.
			$data[$k] = array_gbk_to_utf8($item);
		}
		return $data;
	}
	return gbk_to_utf8($data);
}
 
- ?>
 
 
  |