java如何获取汉字的拼音字母

java如何获取汉字的拼音字母,第1张

获取首字母需要对汉字表和字母表进行映射,如下示例代码是以gb2312编码为入手点,进行匹配的,也可以使用gbk、utf-8等编码进行匹配,但代码就完全不同了。

示例代码如下:

public class FirstLetterUtils {

// 简体中文的编码范围从B0A1(45217)一直到F7FE(63486)

private static int BEGIN = 45217;

private static int END = 63486;

// 按照声 母表示,这个表是在GB2312中的出现的第一个汉字,也就是说“啊”是代表首字母a的第一个汉字。

// i, u, v都不做声母, 自定规则跟随前面的字母

private static char[] chartable = { '啊', '芭', '擦', '搭', '蛾', '发', '噶', '哈', '哈', '击', '喀', '垃', '妈', '拿', '哦', '啪', '期', '然', '撒', '塌', '塌', '塌', '挖', '昔', '压', '匝', };

// 二十六个字母区间对应二十七个端点

// GB2312码汉字区间十进制表示

private static int[] table = new int[27];

// 对应首字母区间表

private static char[] initialtable = { 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'h', 'j', 'k', 'l', 'm', 'n', 'o', 'p', 'q', 'r', 's', 't', 't', 't', 'w', 'x', 'y', 'z', };

// 初始化

static {

for (int i = 0; i < 26; i++) {

table[i] = gbValue(chartable[i]);// 得到GB2312码的首字母区间端点表,十进制。

}

table[26] = END;// 区间表结尾

}

// ------------------------public方法区------------------------

// 根据一个包含汉字的字符串返回一个汉字拼音首字母的字符串 最重要的一个方法,思路如下:一个个字符读入、判断、输出

public static String cn2py(String SourceStr) {

String Result = "";

int StrLength = SourceStrlength();

int i;

try {

for (i = 0; i < StrLength; i++) {

Result += Char2Initial(SourceStrcharAt(i));

}

} catch (Exception e) {

Result = "";

eprintStackTrace();

}

return Result;

}

// ------------------------private方法区------------------------

/

输入字符,得到他的声母,英文字母返回对应的大写字母,其他非简体汉字返回 '0'

/

private static char Char2Initial(char ch) {

// 对英文字母的处理:小写字母转换为大写,大写的直接返回

if (ch >= 'a' && ch <= 'z') {

return (char) (ch - 'a' + 'A');

}

if (ch >= 'A' && ch <= 'Z') {

return ch;

}

// 对非英文字母的处理:转化为首字母,然后判断是否在码表范围内,

// 若不是,则直接返回。

// 若是,则在码表内的进行判断。

int gb = gbValue(ch);// 汉字转换首字母

if ((gb < BEGIN) || (gb > END))// 在码表区间之前,直接返回

{

return ch;

}

int i;

for (i = 0; i < 26; i++) {// 判断匹配码表区间,匹配到就break,判断区间形如“[,)”

if ((gb >= table[i]) && (gb < table[i + 1])) {

break;

}

}

if (gb == END) {// 补上GB2312区间最右端

i = 25;

}

return initialtable[i]; // 在码表区间中,返回首字母

}

/

取出汉字的编码 cn 汉字

/

private static int gbValue(char ch) {// 将一个汉字(GB2312)转换为十进制表示。

String str = new String();

str += ch;

try {

byte[] bytes = strgetBytes("GB2312");

if (byteslength < 2) {

return 0;

}

return (bytes[0] << 8 & 0xff00) + (bytes[1] & 0xff);

} catch (Exception e) {

return 0;

}

}

public static void main(String[] args) throws Exception {

Systemoutprintln(cn2py("这是一个获取首字母的class"));

}

}

function GetPYIndexChar( hzchar:string):char;

begin //的到一个汉字的拼音头个字母

case WORD(hzchar[1]) shl 8 + WORD(hzchar[2]) of

$B0A1$B0C4 : result := 'A';

$B0C5$B2C0 : result := 'B';

$B2C1$B4ED : result := 'C';

$B4EE$B6E9 : result := 'D';

$B6EA$B7A1 : result := 'E';

$B7A2$B8C0 : result := 'F';

$B8C1$B9FD : result := 'G';

$B9FE$BBF6 : result := 'H';

$BBF7$BFA5 : result := 'J';

$BFA6$C0AB : result := 'K';

$C0AC$C2E7 : result := 'L';

$C2E8$C4C2 : result := 'M';

$C4C3$C5B5 : result := 'N';

$C5B6$C5BD : result := 'O';

$C5BE$C6D9 : result := 'P';

$C6DA$C8BA : result := 'Q';

$C8BB$C8F5 : result := 'R';

$C8F6$CBF9 : result := 'S';

$CBFA$CDD9 : result := 'T';

$CDDA$CEF3 : result := 'W';

$CEF4$D188 : result := 'X';

$D1B9$D4D0 : result := 'Y';

$D4D1$D7F9 : result := 'Z';

else

result := char(0);

end;

end;

以下是我的原码100%可以

unit Unit1;

interface

uses

Windows, Messages, SysUtils, Variants, Classes, Graphics, Controls, Forms,

Dialogs, StdCtrls;

type

TForm1 = class(TForm)

Edit1: TEdit;

Edit2: TEdit;

Button1: TButton;

procedure Button1Click(Sender: TObject);

private

{ Private declarations }

public

{ Public declarations }

end;

function GetPYIndexChar( hzchar:string):char;

var

Form1: TForm1;

implementation

{$R dfm}

function GetPYIndexChar( hzchar:string):char;

begin //的到一个汉字的拼音头个字母

case WORD(hzchar[1]) shl 8 + WORD(hzchar[2]) of

$B0A1$B0C4 : result := 'A';

$B0C5$B2C0 : result := 'B';

$B2C1$B4ED : result := 'C';

$B4EE$B6E9 : result := 'D';

$B6EA$B7A1 : result := 'E';

$B7A2$B8C0 : result := 'F';

$B8C1$B9FD : result := 'G';

$B9FE$BBF6 : result := 'H';

$BBF7$BFA5 : result := 'J';

$BFA6$C0AB : result := 'K';

$C0AC$C2E7 : result := 'L';

$C2E8$C4C2 : result := 'M';

$C4C3$C5B5 : result := 'N';

$C5B6$C5BD : result := 'O';

$C5BE$C6D9 : result := 'P';

$C6DA$C8BA : result := 'Q';

$C8BB$C8F5 : result := 'R';

$C8F6$CBF9 : result := 'S';

$CBFA$CDD9 : result := 'T';

$CDDA$CEF3 : result := 'W';

$CEF4$D188 : result := 'X';

$D1B9$D4D0 : result := 'Y';

$D4D1$D7F9 : result := 'Z';

else

result := char(0);

end;

end;

procedure TForm1Button1Click(Sender: TObject);

begin

edit2Text:=GetPYIndexChar(edit1Text);

end;

end

步骤:

第一步、启动Excel 2003(其它版本请仿照 *** 作),打开相应的工作表;

第二步、执行“工具→宏→Visual Basic编辑器”命令(或者直接按“Alt+F11”组合键),进入Visual Basic编辑状态;

第三步、执行“插入→模块”命令,插入一个新模块。再双击插入的模块,进入模块代码编辑状态;

第四步、将代码输入其中;

Function pinyin(p As String) As String

i = Asc(p)

Select Case i

Case -20319 To -20284: pinyin = "A"

Case -20283 To -19776: pinyin = "B"

Case -19775 To -19219: pinyin = "C"

Case -19218 To -18711: pinyin = "D"

Case -18710 To -18527: pinyin = "E"

Case -18526 To -18240: pinyin = "F"

Case -18239 To -17923: pinyin = "G"

Case -17922 To -17418: pinyin = "H"

Case -17417 To -16475: pinyin = "J"

Case -16474 To -16213: pinyin = "K"

Case -16212 To -15641: pinyin = "L"

Case -15640 To -15166: pinyin = "M"

Case -15165 To -14923: pinyin = "N"

Case -14922 To -14915: pinyin = "O"

Case -14914 To -14631: pinyin = "P"

Case -14630 To -14150: pinyin = "Q"

Case -14149 To -14091: pinyin = "R"

Case -14090 To -13319: pinyin = "S"

Case -13318 To -12839: pinyin = "T"

Case -12838 To -12557: pinyin = "W"

Case -12556 To -11848: pinyin = "X"

Case -11847 To -11056: pinyin = "Y"

Case -11055 To -2050: pinyin = "Z"

Case Else: pinyin = p

End Select

End Function

Function getpy(str)

For i = 1 To Len(str)

getpy = getpy & pinyin(Mid(str, i, 1))

Next i

End Function

第五步、代码输入完成后,关闭Visual Basic编辑窗口,返回Excel编辑状态;

第六步、自定义函数就可以用了,如:选中A2单元格,输入公式:=getpy(A2)。

声母为C的有:擦、蔡、察、侧、测、差、搓、磋、蹉、词、祠、伺、兹、慈、磁、鹚、糍、此、疵、雌、柴、紫、次、瓷、才、材、财、豺、彩、睬、踩、菜、崔、催、摧、璀、粹、翠、淬、悴、萃、瘁、错、措、醋、挫、痤、矬、锉、参、惨、渗、曹、嘈、槽、漕、遭、糟等。

复制代码 代码如下: <php class GetPingYing { private $pylist = array( a => ai => an => ang => ao => ba => bai => ban => bang => bao => bei => ben => beng => bi => bian => biao => bie => bin => bing => bo => bu => ca => cai => can => cang => cao => ce => ceng => cha => chai => chan => chang => chao => che => chen => cheng => chi => chong => chou => chu => chuai => chuan => chuang => chui => chun => chuo => ci => cong => cou => cu => cuan => cui => cun => cuo => da => dai => dan => dang => dao => de => deng => di => dian => diao => die => ding => diu => dong => dou => du => duan => dui => dun => duo => e => en => er => fa => fan => fang => fei => fen => feng => fo => fou => fu => ga => gai => gan => gang => gao => ge => gei => gen => geng => gong => gou => gu => gua => guai => guan => guang => gui => gun => guo => ha => hai => han => hang => hao => he => hei => hen => heng => hong => hou => hu => hua => huai => huan => huang => hui => hun => huo => ji => jia => jian => jiang => jiao => jie => jin => jing => jiong => jiu => ju => juan => jue => jun => ka => kai => kan => kang => kao => ke => ken => keng => kong => kou => ku => kua => kuai => kuan => kuang => kui => kun => kuo => la => lai => lan => lang => lao => le => lei => leng => li => lia => lian => liang => liao => lie => lin => ling => liu => long => lou => lu => lv => luan => lue => lun => luo => ma => mai => man => mang => mao => me => mei => men => meng => mi => mian => miao => mie => min => ming => miu => mo => mou => mu => na => nai => nan => nang => nao => ne => nei => nen => neng => ni => nian => niang => niao => nie => nin => ning => niu => nong => nu => nv => nuan => nue => nuo => o => ou => pa => pai => pan => pang => pao => pei => pen => peng => pi => pian => piao => pie => pin => ping => po => pu => qi => qia => qian => qiang => qiao => qie => qin => qing => qiong => qiu => qu => quan => que => qun => ran => rang => rao => re => ren => reng => ri => rong => rou => ru => ruan => rui => run => ruo => sa => sai => san => sang => sao => se => sen => seng => sha => shai => shan => shang => shao => she => shen => sheng => shi => shou => shu => shua => shuai => shuan => shuang => shui => shun => shuo => si => song => sou => su => suan => sui => sun => suo => ta => tai => tan => tang => tao => te => teng => ti => tian => tiao => tie => ting => tong => tou => tu => tuan => tui => tun => tuo => wa => wai => wan => wang => wei => wen => weng => wo => wu => xi => xia => xian => xiang => xiao => xie => xin => xing => xiong => xiu => xu => xuan => xue => xun => ya => yan => yang => yao => ye => yi => yin => ying => yo => yong => you => yu => yuan => yue => yun => za => zai => zan => zang => zao => ze => zei => zen => zeng => zha => zhai => zhan => zhang => zhao => zhe => zhen => zheng => zhi => zhong => zhou => zhu => zhua => zhuai => zhuan => zhuang => zhui => zhun => zhuo => zi => zong => zou => zu => zuan => zui => zun => zuo => ); //全部拼音 public function getAllPY($chinese $delimiter = $length = ) { $py = $this >zh_to_pys($chinese $delimiter); if($length) { $py = substr($py $length); } return $py; } //拼音首个字母 public function getFirstPY($chinese){ $result = ; for ($i= ; $i<strlen($chinese); $i++) { $p = ord(substr($chinese $i )); if ($p> ) { $q = ord(substr($chinese ++$i )); $p = $p + $q ; } $result = substr($this >zh_to_py($p) ); } return $result ; } // 中文转拼音 // private function zh_to_py($num $blank = ) { if($num> && $num< ) { return chr($num); } elseif ($num< ||$num> ) { return $blank; } else { foreach ($this >pylist as $py => $code) { if($code > $num) break; $result = $py; } return $result; } } private function zh_to_pys($chinese $delimiter = $first= ){ $result = array(); for($i= ; $i<strlen($chinese); $i++) { $p = ord(substr($chinese $i )); if($p> ) { $q = ord(substr($chinese ++$i )); $p = $p + $q ; } $result[] = $this >zh_to_py($p); if ($first) { return $result[ ]; } } return implode($delimiter $result); } } // 中文转拼音结束 // //中文是双字节 所以需要两个字节连接起来(ASCII码的范围是在 ) $c = 齐秦 ; for($i= ; $i<strlen($c); $i++) { echo ord($c[$i]) ;// } echo <br> chr( ) chr( ) chr( ) chr( ) <br> ; //测试 $PingYing = new GetPingYing(); echo <br> $PingYing >getFirstPY( 羽泉乐队 歌不错 推荐 ) <br> ;//yqldgbc tj echo $PingYing >getAllPY( 羽泉乐队 歌不错 推荐 ) <br> ; //yuquanleduigebucuo tuijian > lishixinzhi/Article/program/PHP/201311/21313

以上就是关于java如何获取汉字的拼音字母全部的内容,包括:java如何获取汉字的拼音字母、delphi中如何获取汉字的拼音首字母~!、excel中如何实现提取汉字的拼音首字母等相关内容解答,如果想了解更多相关内容,可以关注我们,你们的支持是我们更新的动力!

欢迎分享,转载请注明来源:内存溢出

原文地址:https://54852.com/web/9485713.html

(0)
打赏 微信扫一扫微信扫一扫 支付宝扫一扫支付宝扫一扫
上一篇 2023-04-28
下一篇2023-04-28

发表评论

登录后才能评论

评论列表(0条)

    保存