Java Chinese to spell tool class sharing

  • 2020-04-01 02:47:21
  • OfStack


import net.sourceforge.pinyin4j.PinyinHelper;
import net.sourceforge.pinyin4j.format.HanyuPinyinCaseType;
import net.sourceforge.pinyin4j.format.HanyuPinyinOutputFormat;
import net.sourceforge.pinyin4j.format.HanyuPinyinToneType;
import net.sourceforge.pinyin4j.format.HanyuPinyinVCharType;
import net.sourceforge.pinyin4j.format.exception.BadHanyuPinyinOutputFormatCombination;
public class Pinyin4jUtil {
 
 public static String getPinYin(String src) {
  char[] t1 = null;
  t1 = src.toCharArray();
  // System.out.println(t1.length);
  String[] t2 = new String[t1.length];
  // System.out.println(t2.length);
  //Set the output format of Chinese pinyin
  HanyuPinyinOutputFormat t3 = new HanyuPinyinOutputFormat();
  t3.setCaseType(HanyuPinyinCaseType.LOWERCASE);
  t3.setToneType(HanyuPinyinToneType.WITHOUT_TONE);
  t3.setVCharType(HanyuPinyinVCharType.WITH_V);
  String t4 = "";
  int t0 = t1.length;
  try {
   for (int i = 0; i < t0; i++) {
    //Determine whether it can be a Chinese character
    // System.out.println(t1[i]);
    if (Character.toString(t1[i]).matches("[\u4E00-\u9FA5]+")) {
     t2 = PinyinHelper.toHanyuPinyinStringArray(t1[i], t3);//Store the complete spelling of Chinese characters in a t2 array
     t4 += t2[0];//Take the first pronunciation of the Chinese character and connect it to the string t4
    } else {
     //If it is not a hanzi character, indirectly extract the character and connect it to the string t4
     t4 += Character.toString(t1[i]);
    }
   }
  } catch (BadHanyuPinyinOutputFormatCombination e) {
   e.printStackTrace();
  }
  return t4;
 }
 
 public static String getPinYinHeadChar(String str) {
  String convert = "";
  for (int j = 0; j < str.length(); j++) {
   char word = str.charAt(j);
   //Extract the first letter of a Chinese character
   String[] pinyinArray = PinyinHelper.toHanyuPinyinStringArray(word);
   if (pinyinArray != null) {
    convert += pinyinArray[0].charAt(0);
   } else {
    convert += word;
   }
  }
  return convert;
 }
 
 public static String getCnASCII(String cnStr) {
  StringBuffer strBuf = new StringBuffer();
  //Converts a string to a sequence of bytes
  byte[] bGBK = cnStr.getBytes();
  for (int i = 0; i < bGBK.length; i++) {
   // System.out.println(Integer.toHexString(bGBK[i] & 0xff));
   //Converts each character to ASCII code
   strBuf.append(Integer.toHexString(bGBK[i] & 0xff));
  }
  return strBuf.toString();
 }
 public static void main(String[] args) {
  String cnStr = " China ";
  System.out.println(getPinYin(cnStr));
  System.out.println(getPinYinHeadChar(cnStr));
  System.out.println(getCnASCII(cnStr));
 }
}


Related articles: