您的位置:首页 > 编程语言 > Java开发

java实现中文转化为拼音与简称 .

2013-09-09 17:22 513 查看
package test;

import java.io.UnsupportedEncodingException;

import net.sourceforge.pinyin4j.PinyinHelper;

/** */

/**

* 取得给定汉字串的首字母串,即声母串

* <p>Title: ChineseCharToEn</p>

* <p>@author javer QQ:84831612</p>

*

* @version 1.0

* @date 2004-02-19

* 注:只支持GB2312字符集中的汉字

*/

public final class ChineseCharToEn {

private final static int[] li_SecPosValue =

{

1601, 1637, 1833, 2078, 2274, 2302, 2433, 2594, 2787, 3106, 3212, 3472,

3635, 3722, 3730, 3858, 4027, 4086, 4390, 4558, 4684, 4925, 5249, 5590

};

private final static String[] lc_FirstLetter =

{

"a", "b", "c", "d", "e", "f", "g", "h", "j", "k", "l", "m", "n", "o", "p",

"q", "r", "s", "t", "w", "x", "y", "z"

};

/** */

/**

* 取得给定汉字串的首字母串,即声母串

*

* @param str 给定汉字串

* @return 声母串

*/

public String getAllFirstLetter(String str) {

if (str == null || str.trim().length() == 0) {

return "";

}

String _str = "";

for (int i = 0; i < str.length(); i++) {

_str = _str + this.getFirstLetter(str.substring(i, i + 1));

}

System.out.println(str.length());

return _str;

}

/** */

/**

* 取得给定汉字的首字母,即声母

*

* @param chinese 给定的汉字

* @return 给定汉字的声母

*/

public String getFirstLetter(String chinese) {

if (chinese == null || chinese.trim().length() == 0) {

return "";

}

chinese = this.conversionStr(chinese, "GBK", "ISO8859-1");

if (chinese.length() > 1) //判断是不是汉字

{

int li_SectorCode = (int) chinese.charAt(0); //汉字区码

int li_PositionCode = (int) chinese.charAt(1); //汉字位码

li_SectorCode = li_SectorCode - 160;

li_PositionCode = li_PositionCode - 160;

int li_SecPosCode = li_SectorCode * 100 + li_PositionCode; //汉字区位码

if (li_SecPosCode > 1600 && li_SecPosCode < 5590) {

for (int i = 0; i < 23; i++) {

if (li_SecPosCode >= li_SecPosValue[i] &&

li_SecPosCode < li_SecPosValue[i + 1]) {

chinese = lc_FirstLetter[i];

break;

}

}

} else //非汉字字符,如图形符号或ASCII码

{

chinese = this.conversionStr(chinese, "ISO8859-1", "GBK");

chinese = chinese.substring(0, 1);

}

}

return chinese;

}

public String getAllFirstLetters(String str) {

String convert = "";

for (int j = 0; j < str.length(); j++) {

char word = str.charAt(j);

String[] pinyinArray = PinyinHelper.toHanyuPinyinStringArray(word);

if (pinyinArray != null) {

convert += pinyinArray[0].charAt(0);

}else {

convert += word;

}

}

return convert;

}

/** */

/**

* 字符串编码转换

*

* @param str 要转换编码的字符串

* @param charsetName 原来的编码

* @param toCharsetName 转换后的编码

* @return 经过编码转换后的字符串

*/

private String conversionStr(String str, String charsetName, String toCharsetName) {

try {

str = new String(str.getBytes(charsetName), toCharsetName);

}

catch (UnsupportedEncodingException ex) {

System.out.println("字符串编码转换异常:" + ex.getMessage());

}

return str;

}

public static void main(String[] args) {

ChineseCharToEn cte = new ChineseCharToEn();

System.out.println("'夜未眠'的首个拼音字母是:" + cte.getFirstLetter("夜未眠"));

System.out.println("'Javer夜未眠'的首个拼音字母是:" + cte.getFirstLetter("Javer夜未眠"));

System.out.println("大傻瓜于云龙" + cte.getAllFirstLetters("戬浜供销社"));

}

}

方式二:

package test;

import java.io.UnsupportedEncodingException;

import net.sourceforge.pinyin4j.PinyinHelper;

import net.sourceforge.pinyin4j.format.HanyuPinyinCaseType;

import net.sourceforge.pinyin4j.format.HanyuPinyinOutputFormat;

import net.sourceforge.pinyin4j.format.HanyuPinyinToneType;

import net.sourceforge.pinyin4j.format.HanyuPinyinVCharType;

import net.sourceforge.pinyin4j.format.exception.BadHanyuPinyinOutputFormatCombination;

public class CnToPy {

//将汉字转换为全拼

public static String getPingYin(String src){

char[] t1 = null;

t1=src.toCharArray();

String[] t2 = new String[t1.length];

HanyuPinyinOutputFormat t3 = new HanyuPinyinOutputFormat();

t3.setCaseType(HanyuPinyinCaseType.LOWERCASE);

t3.setToneType(HanyuPinyinToneType.WITHOUT_TONE);

t3.setVCharType(HanyuPinyinVCharType.WITH_V);

String t4="";

int t0=t1.length;

try {

for (int i=0;i<t0;i++)

{

//判断是否为汉字字符

if(java.lang.Character.toString(t1[i]).matches("[//u4E00-//u9FA5]+"))

{

t2 = PinyinHelper.toHanyuPinyinStringArray(t1[i], t3);

t4+=t2[0];

}

else

t4+=java.lang.Character.toString(t1[i]);

}

// System.out.println(t4);

return t4;

}

catch (BadHanyuPinyinOutputFormatCombination e1) {

e1.printStackTrace();

}

return t4;

}

//返回中文的首字母

public static String getPinYinHeadChar(String str) {

String convert = "";

for (int j = 0; j < str.length(); j++) {

char word = str.charAt(j);

String[] pinyinArray = PinyinHelper.toHanyuPinyinStringArray(word);

if (pinyinArray != null) {

convert += pinyinArray[0].charAt(0);

}else {

convert += word;

}

}

return convert;

}

//将字符串转移为ASCII码

public static String getCnASCII(String cnStr)

{

StringBuffer strBuf = new StringBuffer();

byte[] bGBK = cnStr.getBytes();

for(int i=0;i <bGBK.length;i++){

// System.out.println(Integer.toHexString(bGBK[i]&0xff));

strBuf.append(Integer.toHexString(bGBK[i]&0xff));

}

return strBuf.toString();

}

public static void main(String[] args) {

String cnStr = "中华人民共和国";

System.out.println(getPingYin(cnStr));

System.out.println(getPinYinHeadChar(cnStr));

}

}
内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签: