查到一个好用的汉字转拼音封装类
- <?php
/**
 * Converts UTF-8 Chinese text to Hanyu Pinyin (full syllables or initials).
 *
 * The input is transcoded to GBK and each double-byte character is looked up
 * in a table keyed by pinyin syllable. Only GB2312 level-1 characters (which
 * are ordered by pinyin) can be resolved; every other double-byte character
 * yields an empty string. Single-byte characters are passed through as-is.
 *
 * @author Jerryli(hzjerry@gmail.com)
 * @version V0.20140715
 * @package SPFW.core.lib.final
 * @global SEA_PHP_FW_VAR_ENV
 * @example
 * echo CUtf8_PY::encode('阿里巴巴科技有限公司'); // pinyin initials
 * echo CUtf8_PY::encode('阿里巴巴科技有限公司', 'all'); // full pinyin, space separated
 */
class CUtf8_PY {
    /**
     * Pinyin lookup table: syllable => lowest character code for that syllable.
     *
     * Codes are the 16-bit GBK code minus 65536 (hence negative). Entries are
     * listed in ascending code order; zh2py() depends on that ordering.
     *
     * @var array
     */
    private static $_aMaps = array(
        'a'=>-20319,'ai'=>-20317,'an'=>-20304,'ang'=>-20295,'ao'=>-20292,
        'ba'=>-20283,'bai'=>-20265,'ban'=>-20257,'bang'=>-20242,'bao'=>-20230,'bei'=>-20051,'ben'=>-20036,'beng'=>-20032,'bi'=>-20026,'bian'=>-20002,'biao'=>-19990,'bie'=>-19986,'bin'=>-19982,'bing'=>-19976,'bo'=>-19805,'bu'=>-19784,
        'ca'=>-19775,'cai'=>-19774,'can'=>-19763,'cang'=>-19756,'cao'=>-19751,'ce'=>-19746,'ceng'=>-19741,'cha'=>-19739,'chai'=>-19728,'chan'=>-19725,'chang'=>-19715,'chao'=>-19540,'che'=>-19531,'chen'=>-19525,'cheng'=>-19515,'chi'=>-19500,'chong'=>-19484,'chou'=>-19479,'chu'=>-19467,'chuai'=>-19289,'chuan'=>-19288,'chuang'=>-19281,'chui'=>-19275,'chun'=>-19270,'chuo'=>-19263,'ci'=>-19261,'cong'=>-19249,'cou'=>-19243,'cu'=>-19242,'cuan'=>-19238,'cui'=>-19235,'cun'=>-19227,'cuo'=>-19224,
        'da'=>-19218,'dai'=>-19212,'dan'=>-19038,'dang'=>-19023,'dao'=>-19018,'de'=>-19006,'deng'=>-19003,'di'=>-18996,'dian'=>-18977,'diao'=>-18961,'die'=>-18952,'ding'=>-18783,'diu'=>-18774,'dong'=>-18773,'dou'=>-18763,'du'=>-18756,'duan'=>-18741,'dui'=>-18735,'dun'=>-18731,'duo'=>-18722,
        'e'=>-18710,'en'=>-18697,'er'=>-18696,
        'fa'=>-18526,'fan'=>-18518,'fang'=>-18501,'fei'=>-18490,'fen'=>-18478,'feng'=>-18463,'fo'=>-18448,'fou'=>-18447,'fu'=>-18446,
        'ga'=>-18239,'gai'=>-18237,'gan'=>-18231,'gang'=>-18220,'gao'=>-18211,'ge'=>-18201,'gei'=>-18184,'gen'=>-18183,'geng'=>-18181,'gong'=>-18012,'gou'=>-17997,'gu'=>-17988,'gua'=>-17970,'guai'=>-17964,'guan'=>-17961,'guang'=>-17950,'gui'=>-17947,'gun'=>-17931,'guo'=>-17928,
        'ha'=>-17922,'hai'=>-17759,'han'=>-17752,'hang'=>-17733,'hao'=>-17730,'he'=>-17721,'hei'=>-17703,'hen'=>-17701,'heng'=>-17697,'hong'=>-17692,'hou'=>-17683,'hu'=>-17676,'hua'=>-17496,'huai'=>-17487,'huan'=>-17482,'huang'=>-17468,'hui'=>-17454,'hun'=>-17433,'huo'=>-17427,
        'ji'=>-17417,'jia'=>-17202,'jian'=>-17185,'jiang'=>-16983,'jiao'=>-16970,'jie'=>-16942,'jin'=>-16915,'jing'=>-16733,'jiong'=>-16708,'jiu'=>-16706,'ju'=>-16689,'juan'=>-16664,'jue'=>-16657,'jun'=>-16647,
        'ka'=>-16474,'kai'=>-16470,'kan'=>-16465,'kang'=>-16459,'kao'=>-16452,'ke'=>-16448,'ken'=>-16433,'keng'=>-16429,'kong'=>-16427,'kou'=>-16423,'ku'=>-16419,'kua'=>-16412,'kuai'=>-16407,'kuan'=>-16403,'kuang'=>-16401,'kui'=>-16393,'kun'=>-16220,'kuo'=>-16216,
        'la'=>-16212,'lai'=>-16205,'lan'=>-16202,'lang'=>-16187,'lao'=>-16180,'le'=>-16171,'lei'=>-16169,'leng'=>-16158,'li'=>-16155,'lia'=>-15959,'lian'=>-15958,'liang'=>-15944,'liao'=>-15933,'lie'=>-15920,'lin'=>-15915,'ling'=>-15903,'liu'=>-15889,'long'=>-15878,'lou'=>-15707,'lu'=>-15701,'lv'=>-15681,'luan'=>-15667,'lue'=>-15661,'lun'=>-15659,'luo'=>-15652,
        'ma'=>-15640,'mai'=>-15631,'man'=>-15625,'mang'=>-15454,'mao'=>-15448,'me'=>-15436,'mei'=>-15435,'men'=>-15419,'meng'=>-15416,'mi'=>-15408,'mian'=>-15394,'miao'=>-15385,'mie'=>-15377,'min'=>-15375,'ming'=>-15369,'miu'=>-15363,'mo'=>-15362,'mou'=>-15183,'mu'=>-15180,
        'na'=>-15165,'nai'=>-15158,'nan'=>-15153,'nang'=>-15150,'nao'=>-15149,'ne'=>-15144,'nei'=>-15143,'nen'=>-15141,'neng'=>-15140,'ni'=>-15139,'nian'=>-15128,'niang'=>-15121,'niao'=>-15119,'nie'=>-15117,'nin'=>-15110,'ning'=>-15109,'niu'=>-14941,'nong'=>-14937,'nu'=>-14933,'nv'=>-14930,'nuan'=>-14929,'nue'=>-14928,'nuo'=>-14926,
        'o'=>-14922,'ou'=>-14921,
        'pa'=>-14914,'pai'=>-14908,'pan'=>-14902,'pang'=>-14894,'pao'=>-14889,'pei'=>-14882,'pen'=>-14873,'peng'=>-14871,'pi'=>-14857,'pian'=>-14678,'piao'=>-14674,'pie'=>-14670,'pin'=>-14668,'ping'=>-14663,'po'=>-14654,'pu'=>-14645,
        'qi'=>-14630,'qia'=>-14594,'qian'=>-14429,'qiang'=>-14407,'qiao'=>-14399,'qie'=>-14384,'qin'=>-14379,'qing'=>-14368,'qiong'=>-14355,'qiu'=>-14353,'qu'=>-14345,'quan'=>-14170,'que'=>-14159,'qun'=>-14151,
        'ran'=>-14149,'rang'=>-14145,'rao'=>-14140,'re'=>-14137,'ren'=>-14135,'reng'=>-14125,'ri'=>-14123,'rong'=>-14122,'rou'=>-14112,'ru'=>-14109,'ruan'=>-14099,'rui'=>-14097,'run'=>-14094,'ruo'=>-14092,
        'sa'=>-14090,'sai'=>-14087,'san'=>-14083,'sang'=>-13917,'sao'=>-13914,'se'=>-13910,'sen'=>-13907,'seng'=>-13906,'sha'=>-13905,'shai'=>-13896,'shan'=>-13894,'shang'=>-13878,'shao'=>-13870,'she'=>-13859,'shen'=>-13847,'sheng'=>-13831,'shi'=>-13658,'shou'=>-13611,'shu'=>-13601,'shua'=>-13406,'shuai'=>-13404,'shuan'=>-13400,'shuang'=>-13398,'shui'=>-13395,'shun'=>-13391,'shuo'=>-13387,'si'=>-13383,'song'=>-13367,'sou'=>-13359,'su'=>-13356,'suan'=>-13343,'sui'=>-13340,'sun'=>-13329,'suo'=>-13326,
        'ta'=>-13318,'tai'=>-13147,'tan'=>-13138,'tang'=>-13120,'tao'=>-13107,'te'=>-13096,'teng'=>-13095,'ti'=>-13091,'tian'=>-13076,'tiao'=>-13068,'tie'=>-13063,'ting'=>-13060,'tong'=>-12888,'tou'=>-12875,'tu'=>-12871,'tuan'=>-12860,'tui'=>-12858,'tun'=>-12852,'tuo'=>-12849,
        'wa'=>-12838,'wai'=>-12831,'wan'=>-12829,'wang'=>-12812,'wei'=>-12802,'wen'=>-12607,'weng'=>-12597,'wo'=>-12594,'wu'=>-12585,
        'xi'=>-12556,'xia'=>-12359,'xian'=>-12346,'xiang'=>-12320,'xiao'=>-12300,'xie'=>-12120,'xin'=>-12099,'xing'=>-12089,'xiong'=>-12074,'xiu'=>-12067,'xu'=>-12058,'xuan'=>-12039,'xue'=>-11867,'xun'=>-11861,
        'ya'=>-11847,'yan'=>-11831,'yang'=>-11798,'yao'=>-11781,'ye'=>-11604,'yi'=>-11589,'yin'=>-11536,'ying'=>-11358,'yo'=>-11340,'yong'=>-11339,'you'=>-11324,'yu'=>-11303,'yuan'=>-11097,'yue'=>-11077,'yun'=>-11067,
        'za'=>-11055,'zai'=>-11052,'zan'=>-11045,'zang'=>-11041,'zao'=>-11038,'ze'=>-11024,'zei'=>-11020,'zen'=>-11019,'zeng'=>-11018,'zha'=>-11014,'zhai'=>-10838,'zhan'=>-10832,'zhang'=>-10815,'zhao'=>-10800,'zhe'=>-10790,'zhen'=>-10780,'zheng'=>-10764,'zhi'=>-10587,'zhong'=>-10544,'zhou'=>-10533,'zhu'=>-10519,'zhua'=>-10331,'zhuai'=>-10329,'zhuan'=>-10328,'zhuang'=>-10322,'zhui'=>-10315,'zhun'=>-10309,'zhuo'=>-10307,'zi'=>-10296,'zong'=>-10281,'zou'=>-10274,'zu'=>-10270,'zuan'=>-10262,'zui'=>-10260,'zun'=>-10256,'zuo'=>-10254
    );

    /**
     * Encodes a UTF-8 string as pinyin.
     *
     * @param string $utf8Data   UTF-8 encoded input text
     * @param string $sRetFormat Output format: 'head' returns the first letter
     *                           of every character concatenated without
     *                           separators; any other value (documented: 'all')
     *                           returns full syllables joined by single spaces
     * @return string Pinyin text; an empty string when the input cannot be
     *                converted to GBK
     */
    public static function encode($utf8Data, $sRetFormat='head'){
        $sGBK = iconv('UTF-8', 'GBK', $utf8Data);
        if (false === $sGBK) {
            // iconv() failed (input not representable in GBK): nothing to encode.
            return '';
        }

        $bHead = ('head' === $sRetFormat);
        $aBuf = array();
        for ($i = 0, $iLoop = strlen($sGBK); $i < $iLoop; $i++) {
            // Square-bracket offsets: the {$i} form was removed in PHP 8.0.
            $iChr = ord($sGBK[$i]);
            if ($iChr >= 0x81) {
                // GBK lead bytes span 0x81-0xFE, so every such byte starts a
                // double-byte character. Consume the trail byte as well; a
                // missing trail byte (truncated input) is treated as 0.
                $iLow = ($i + 1 < $iLoop) ? ord($sGBK[++$i]) : 0;
                // Shift into the negative code space used by $_aMaps.
                $iChr = ($iChr << 8) + $iLow - 65536;
            }
            $sPy = self::zh2py($iChr);
            $aBuf[] = $bHead ? (string) substr($sPy, 0, 1) : $sPy;
        }

        return implode($bHead ? '' : ' ', $aBuf);
    }

    /**
     * Converts one character code to pinyin.
     *
     * @param number $iWORD Single-byte code (positive), or double-byte GBK
     *                      code minus 65536 (negative)
     * @return string The character itself for single-byte codes 1-159, the
     *                pinyin syllable for GB2312 level-1 characters, otherwise ''
     */
    private static function zh2py($iWORD) {
        if ($iWORD > 0 && $iWORD < 160) {
            return chr($iWORD);
        }
        if ($iWORD < -20319 || $iWORD > -10247) {
            // Outside the code range covered by the lookup table.
            return '';
        }

        // Table entries only describe GB2312 cells, whose trail byte is
        // 0xA1-0xFE. GBK extension characters share the same lead bytes with
        // lower trail bytes and must not be matched against the table.
        $iTrail = $iWORD & 0xFF;
        if ($iTrail < 0xA1 || $iTrail > 0xFE) {
            return '';
        }

        // The table is sorted ascending: the match is the last syllable whose
        // starting code does not exceed the character code.
        $result = '';
        foreach (self::$_aMaps as $py => $code) {
            if ($code > $iWORD) {
                break;
            }
            $result = $py;
        }
        return $result;
    }
}
- ?>
查到一个好用的汉字转拼音封装类 —— 相关推荐
- 汉字转拼音---PHP
思路: 在文件中放入一个UTF-8的中文汉字与拼音对照的文件.在汉字转拼音时,只要用正则匹配到对照文件的相应的汉字,就能得到拼音. 汉字与拼音对照文件下载地址:链接:https://pan.baidu ...
- 大创项目学习日志(二)——汉字转拼音软件的选择与尝试
我希望,至少我们的孙儿孙女这一代能够两条腿走路,既能用汉字写,也能用拼音字母写,听报告作笔记,用拼音字母写,会比汉字写得快.如果可能,还能用上拼音字母的打字机.这样该是多么幸福呢!我并不幻想,在不远的 ...
- 汉字转拼音android实现(HanziToPinyin类)
对Contacts了解就会知道(不了解可以了解下),每个联系人都有一个sort_key字段,如果查询中没有设置sortOrder,默认就会以 sort_key字段为排序依据.名字的检索其实也是根据so ...
- oracle把中文转换为拼音,怎样将“Oracle”的外部表汉字转换为拼音
怎样将"Oracle"的外部表汉字转换为拼音 2008-03-07 eNet&Ciweek 我在原来的应用中使用代码表加一个函数来处理汉字转拼音的转换问题,现在由于工作需要 ...
- 汉字转拼音 python_python把汉字转换成拼音实现程序
python把汉字转换成拼音实现程序 本文提供一个简洁的汉字转拼音程序,复制下载就可以直接使用,有需要的同学可以参考一下. #coding:utf-8 #基于python2.6 table = 'a ...
- python中如何判断输入的是英文字母_python如何判断一个字符是否为汉字,英文字母,数字,空还是其他...
一直在忙工作的事情,对不起大家,今后一定抽出时间来写python,和大家一起学python. 今天给大家一段代码,大家可以看一下哈. # 判断一个字符是否为汉字,英文字母,数字,空还是其他 # 使用U ...
- 【Python入门】一个有意思还有用的Python包-汉字转换拼音
一.应用概述 最近做一个项目,发现很多场景,把汉字转换成拼音,然后进行深度学习分类,能够取得非常不错的效果,在做内容识别,特别是涉及到同音字的时候,转换成拼音就显得特别重要.比如垃圾广告识别:公众号. ...
- 得到一个汉字的拼音第一个字母
/// <summary> /// 在指定的字符串列表CnStr中检索符合拼音索引字符串 /// </summary> /// <param name="CnS ...
- 从gb2py.idx中获取一个汉字的拼音首字母
function GetPinyinFromFile(aHanzi:string):AnsiChar; //从gb2py.idx中获取一个汉字的拼音首字母 var sfile:TMemoryStrea ...
最新文章
- 新公司研发能力低下,何去何从?
- 用C#的Raw Socket实现网络封包监视
- MyBatis包含这9种设计模式,你知道几个?
- mac 终端快捷命令
- 2019年东莞特长生 散步
- 棍子节快乐~ 顺便转一篇weka源码分析解析~【转自weka中文网】
- html li 做瀑布流,js实现瀑布流效果(自动生成新的内容)
- charts引入icon图片_v-charts 踩坑之路
- Elipse 、Idea配置 Java-Code-Formatter
- Squid 2.6 Configuration Manual - Log File Path Names and Cache Directories
- 50 岁的他笑谈码农真相,看完清醒了!| 人物志
- Eclipse 使用
- [转载]Qt之自定义界面(二)添加最小化、关闭按钮、添加背景
- 真实网络环境下使用易邮搭建网络邮件服务器并测试通过
- 计算机学报发表论文格式,计算机学报论文格式(24页)-原创力文档
- Origin8画图:将多个worksheet表画在同一张图
- C# AutoCAD图纸插入块(另一个dwg文件)
- 排列组合解析与例题总结
- FQQ兵法,适用于各种版本以及种族
- matlab 发布商,MathWork发布MATLAB和Simulink版本2021a
热门文章
- 数据库概述-了解数据库-MySQL数据库服务配置-下载安装(强力推荐)
- 达人评测 i9 13900H 和i7 12700h差多少 酷睿i913900H 和i712700h对比
- 手撕图机器学习,图神经网络
- php silk文件转换pcm,微信小程序录音silk文件格式转换为MP3及PCM格式的方法
- PHP替代JavaScript的 js charCodeAt() 方法
- 看听读写想练口语 免费
- 什么是SQL数据类型?SQL数据类型总结
- Deeplabcut教程(二)使用
- 逻辑运算符和逻辑表达式
- HayeSep T 80-100多孔聚合物吸附剂,HayeSep A 80-100气相色谱担体填料,HayeSep Q 60-80气相色谱填充柱(国产推荐)