search
HomeJavajavaTutorialJava example of converting Chinese characters into Pinyin

Java implements the conversion of Chinese characters into Pinyin

Conversion class

public class PINYINChinese {
  private static int[] pyvalue = new int[] { -20319, -20317, -20304, -20295,
      -20292, -20283, -20265, -20257, -20242, -20230, -20051, -20036,
      -20032, -20026, -20002, -19990, -19986, -19982, -19976, -19805,
      -19784, -19775, -19774, -19763, -19756, -19751, -19746, -19741,
      -19739, -19728, -19725, -19715, -19540, -19531, -19525, -19515,
      -19500, -19484, -19479, -19467, -19289, -19288, -19281, -19275,
      -19270, -19263, -19261, -19249, -19243, -19242, -19238, -19235,
      -19227, -19224, -19218, -19212, -19038, -19023, -19018, -19006,
      -19003, -18996, -18977, -18961, -18952, -18783, -18774, -18773,
      -18763, -18756, -18741, -18735, -18731, -18722, -18710, -18697,
      -18696, -18526, -18518, -18501, -18490, -18478, -18463, -18448,
      -18447, -18446, -18239, -18237, -18231, -18220, -18211, -18201,
      -18184, -18183, -18181, -18012, -17997, -17988, -17970, -17964,
      -17961, -17950, -17947, -17931, -17928, -17922, -17759, -17752,
      -17733, -17730, -17721, -17703, -17701, -17697, -17692, -17683,
      -17676, -17496, -17487, -17482, -17468, -17454, -17433, -17427,
      -17417, -17202, -17185, -16983, -16970, -16942, -16915, -16733,
      -16708, -16706, -16689, -16664, -16657, -16647, -16474, -16470,
      -16465, -16459, -16452, -16448, -16433, -16429, -16427, -16423,
      -16419, -16412, -16407, -16403, -16401, -16393, -16220, -16216,
      -16212, -16205, -16202, -16187, -16180, -16171, -16169, -16158,
      -16155, -15959, -15958, -15944, -15933, -15920, -15915, -15903,
      -15889, -15878, -15707, -15701, -15681, -15667, -15661, -15659,
      -15652, -15640, -15631, -15625, -15454, -15448, -15436, -15435,
      -15419, -15416, -15408, -15394, -15385, -15377, -15375, -15369,
      -15363, -15362, -15183, -15180, -15165, -15158, -15153, -15150,
      -15149, -15144, -15143, -15141, -15140, -15139, -15128, -15121,
      -15119, -15117, -15110, -15109, -14941, -14937, -14933, -14930,
      -14929, -14928, -14926, -14922, -14921, -14914, -14908, -14902,
      -14894, -14889, -14882, -14873, -14871, -14857, -14678, -14674,
      -14670, -14668, -14663, -14654, -14645, -14630, -14594, -14429,
      -14407, -14399, -14384, -14379, -14368, -14355, -14353, -14345,
      -14170, -14159, -14151, -14149, -14145, -14140, -14137, -14135,
      -14125, -14123, -14122, -14112, -14109, -14099, -14097, -14094,
      -14092, -14090, -14087, -14083, -13917, -13914, -13910, -13907,
      -13906, -13905, -13896, -13894, -13878, -13870, -13859, -13847,
      -13831, -13658, -13611, -13601, -13406, -13404, -13400, -13398,
      -13395, -13391, -13387, -13383, -13367, -13359, -13356, -13343,
      -13340, -13329, -13326, -13318, -13147, -13138, -13120, -13107,
      -13096, -13095, -13091, -13076, -13068, -13063, -13060, -12888,
      -12875, -12871, -12860, -12858, -12852, -12849, -12838, -12831,
      -12829, -12812, -12802, -12607, -12597, -12594, -12585, -12556,
      -12359, -12346, -12320, -12300, -12120, -12099, -12089, -12074,
      -12067, -12058, -12039, -11867, -11861, -11847, -11831, -11798,
      -11781, -11604, -11589, -11536, -11358, -11340, -11339, -11324,
      -11303, -11097, -11077, -11067, -11055, -11052, -11045, -11041,
      -11038, -11024, -11020, -11019, -11018, -11014, -10838, -10832,
      -10815, -10800, -10790, -10780, -10764, -10587, -10544, -10533,
      -10519, -10331, -10329, -10328, -10322, -10315, -10309, -10307,
      -10296, -10281, -10274, -10270, -10262, -10260, -10256, -10254 };
  public static String[] pystr = new String[] { "a", "ai", "an", "ang", "ao",
      "ba", "bai", "ban", "bang", "bao", "bei", "ben", "beng", "bi",
      "bian", "biao", "bie", "bin", "bing", "bo", "bu", "ca", "cai",
      "can", "cang", "cao", "ce", "ceng", "cha", "chai", "chan", "chang",
      "chao", "che", "chen", "cheng", "chi", "chong", "chou", "chu",
      "chuai", "chuan", "chuang", "chui", "chun", "chuo", "ci", "cong",
      "cou", "cu", "cuan", "cui", "cun", "cuo", "da", "dai", "dan",
      "dang", "dao", "de", "deng", "di", "dian", "diao", "die", "ding",
      "diu", "dong", "dou", "du", "duan", "dui", "dun", "duo", "e", "en",
      "er", "fa", "fan", "fang", "fei", "fen", "feng", "fo", "fou", "fu",
      "ga", "gai", "gan", "gang", "gao", "ge", "gei", "gen", "geng",
      "gong", "gou", "gu", "gua", "guai", "guan", "guang", "gui", "gun",
      "guo", "ha", "hai", "han", "hang", "hao", "he", "hei", "hen",
      "heng", "hong", "hou", "hu", "hua", "huai", "huan", "huang", "hui",
      "hun", "huo", "ji", "jia", "jian", "jiang", "jiao", "jie", "jin",
      "jing", "jiong", "jiu", "ju", "juan", "jue", "jun", "ka", "kai",
      "kan", "kang", "kao", "ke", "ken", "keng", "kong", "kou", "ku",
      "kua", "kuai", "kuan", "kuang", "kui", "kun", "kuo", "la", "lai",
      "lan", "lang", "lao", "le", "lei", "leng", "li", "lia", "lian",
      "liang", "liao", "lie", "lin", "ling", "liu", "long", "lou", "lu",
      "lv", "luan", "lue", "lun", "luo", "ma", "mai", "man", "mang",
      "mao", "me", "mei", "men", "meng", "mi", "mian", "miao", "mie",
      "min", "ming", "miu", "mo", "mou", "mu", "na", "nai", "nan",
      "nang", "nao", "ne", "nei", "nen", "neng", "ni", "nian", "niang",
      "niao", "nie", "nin", "ning", "niu", "nong", "nu", "nv", "nuan",
      "nue", "nuo", "o", "ou", "pa", "pai", "pan", "pang", "pao", "pei",
      "pen", "peng", "pi", "pian", "piao", "pie", "pin", "ping", "po",
      "pu", "qi", "qia", "qian", "qiang", "qiao", "qie", "qin", "qing",
      "qiong", "qiu", "qu", "quan", "que", "qun", "ran", "rang", "rao",
      "re", "ren", "reng", "ri", "rong", "rou", "ru", "ruan", "rui",
      "run", "ruo", "sa", "sai", "san", "sang", "sao", "se", "sen",
      "seng", "sha", "shai", "shan", "shang", "shao", "she", "shen",
      "sheng", "shi", "shou", "shu", "shua", "shuai", "shuan", "shuang",
      "shui", "shun", "shuo", "si", "song", "sou", "su", "suan", "sui",
      "sun", "suo", "ta", "tai", "tan", "tang", "tao", "te", "teng",
      "ti", "tian", "tiao", "tie", "ting", "tong", "tou", "tu", "tuan",
      "tui", "tun", "tuo", "wa", "wai", "wan", "wang", "wei", "wen",
      "weng", "wo", "wu", "xi", "xia", "xian", "xiang", "xiao", "xie",
      "xin", "xing", "xiong", "xiu", "xu", "xuan", "xue", "xun", "ya",
      "yan", "yang", "yao", "ye", "yi", "yin", "ying", "yo", "yong",
      "you", "yu", "yuan", "yue", "yun", "za", "zai", "zan", "zang",
      "zao", "ze", "zei", "zen", "zeng", "zha", "zhai", "zhan", "zhang",
      "zhao", "zhe", "zhen", "zheng", "zhi", "zhong", "zhou", "zhu",
      "zhua", "zhuai", "zhuan", "zhuang", "zhui", "zhun", "zhuo", "zi",
      "zong", "zou", "zu", "zuan", "zui", "zun", "zuo" };
  private StringBuilder buffer;
  private String resource;
  private static CharacterParser characterParser = new CharacterParser();
 
  public static CharacterParser getInstance() {
    return characterParser;
  }
 
  public String getResource() {
    return resource;
  }
 
  public void setResource(String resource) {
    this.resource = resource;
  }
 
  /** * 汉字转成ASCII* * */
  private int getChsAscii(String chs) {
    int asc = 0;
    try {
      byte[] bytes = chs.getBytes("gb2312");
      if (bytes == null || bytes.length > 2 || bytes.length <= 0) {
        throw new RuntimeException("illegal resource string");
      }
      if (bytes.length == 1) {
        asc = bytes[0];
      }
      if (bytes.length == 2) {
        int hightByte = 256 + bytes[0];
        int lowByte = 256 + bytes[1];
        asc = (256 * hightByte + lowByte) - 256 * 256;
      }
    } catch (Exception e) {
      System.out
          .println("ERROR:ChineseSpelling.class-getChsAscii(String chs)"
              + e);
    }
    return asc;
  }
 
  /** * 单字解析 * * */
  public String convert(String str) {
    String result = null;
    int ascii = getChsAscii(str);
    if (ascii > 0 && ascii < 160) {
      result = String.valueOf((char) ascii);
    } else {
      for (int i = (pyvalue.length - 1); i >= 0; i--) {
        if (pyvalue[i] <= ascii) {
          result = pystr[i];
          break;
        }
      }
    }
    return result;
  }
 
  /** * 词组解析 * * */
  public String getSelling(String chs) {
    String key, value;
    buffer = new StringBuilder();
    for (int i = 0; i < chs.length(); i++) {
      key = chs.substring(i, i + 1);
      if (key.getBytes().length >= 2) {
        value = (String) convert(key);
        if (value == null) {
          value = "unknown";
        }
      } else {
        value = key;
      }
      buffer.append(value);
    }
    return buffer.toString();
  }
 
  public String getSpelling() {
    return this.getSelling(this.getResource());
  }
 
}

implementation

String country="汉字";
 public String getString() {
    //返回拼音
    return PINYINChinese.getInstance().getSelling(country);
  }

Thank you for reading, I hope it can help everyone, thank you for your support of this site!

For more Java-related examples of converting Chinese characters into pinyin, please pay attention to the PHP Chinese website!

Statement
The content of this article is voluntarily contributed by netizens, and the copyright belongs to the original author. This site does not assume corresponding legal responsibility. If you find any content suspected of plagiarism or infringement, please contact admin@php.cn
What are some strategies for mitigating platform-specific issues in Java applications?What are some strategies for mitigating platform-specific issues in Java applications?May 01, 2025 am 12:20 AM

How does Java alleviate platform-specific problems? Java implements platform-independent through JVM and standard libraries. 1) Use bytecode and JVM to abstract the operating system differences; 2) The standard library provides cross-platform APIs, such as Paths class processing file paths, and Charset class processing character encoding; 3) Use configuration files and multi-platform testing in actual projects for optimization and debugging.

What is the relationship between Java's platform independence and microservices architecture?What is the relationship between Java's platform independence and microservices architecture?May 01, 2025 am 12:16 AM

Java'splatformindependenceenhancesmicroservicesarchitecturebyofferingdeploymentflexibility,consistency,scalability,andportability.1)DeploymentflexibilityallowsmicroservicestorunonanyplatformwithaJVM.2)Consistencyacrossservicessimplifiesdevelopmentand

How does GraalVM relate to Java's platform independence goals?How does GraalVM relate to Java's platform independence goals?May 01, 2025 am 12:14 AM

GraalVM enhances Java's platform independence in three ways: 1. Cross-language interoperability, allowing Java to seamlessly interoperate with other languages; 2. Independent runtime environment, compile Java programs into local executable files through GraalVMNativeImage; 3. Performance optimization, Graal compiler generates efficient machine code to improve the performance and consistency of Java programs.

How do you test Java applications for platform compatibility?How do you test Java applications for platform compatibility?May 01, 2025 am 12:09 AM

ToeffectivelytestJavaapplicationsforplatformcompatibility,followthesesteps:1)SetupautomatedtestingacrossmultipleplatformsusingCItoolslikeJenkinsorGitHubActions.2)ConductmanualtestingonrealhardwaretocatchissuesnotfoundinCIenvironments.3)Checkcross-pla

What is the role of the Java compiler (javac) in achieving platform independence?What is the role of the Java compiler (javac) in achieving platform independence?May 01, 2025 am 12:06 AM

The Java compiler realizes Java's platform independence by converting source code into platform-independent bytecode, allowing Java programs to run on any operating system with JVM installed.

What are the advantages of using bytecode over native code for platform independence?What are the advantages of using bytecode over native code for platform independence?Apr 30, 2025 am 12:24 AM

Bytecodeachievesplatformindependencebybeingexecutedbyavirtualmachine(VM),allowingcodetorunonanyplatformwiththeappropriateVM.Forexample,JavabytecodecanrunonanydevicewithaJVM,enabling"writeonce,runanywhere"functionality.Whilebytecodeoffersenh

Is Java truly 100% platform-independent? Why or why not?Is Java truly 100% platform-independent? Why or why not?Apr 30, 2025 am 12:18 AM

Java cannot achieve 100% platform independence, but its platform independence is implemented through JVM and bytecode to ensure that the code runs on different platforms. Specific implementations include: 1. Compilation into bytecode; 2. Interpretation and execution of JVM; 3. Consistency of the standard library. However, JVM implementation differences, operating system and hardware differences, and compatibility of third-party libraries may affect its platform independence.

How does Java's platform independence support code maintainability?How does Java's platform independence support code maintainability?Apr 30, 2025 am 12:15 AM

Java realizes platform independence through "write once, run everywhere" and improves code maintainability: 1. High code reuse and reduces duplicate development; 2. Low maintenance cost, only one modification is required; 3. High team collaboration efficiency is high, convenient for knowledge sharing.

See all articles

Hot AI Tools

Undresser.AI Undress

Undresser.AI Undress

AI-powered app for creating realistic nude photos

AI Clothes Remover

AI Clothes Remover

Online AI tool for removing clothes from photos.

Undress AI Tool

Undress AI Tool

Undress images for free

Clothoff.io

Clothoff.io

AI clothes remover

Video Face Swap

Video Face Swap

Swap faces in any video effortlessly with our completely free AI face swap tool!

Hot Tools

Dreamweaver CS6

Dreamweaver CS6

Visual web development tools

mPDF

mPDF

mPDF is a PHP library that can generate PDF files from UTF-8 encoded HTML. The original author, Ian Back, wrote mPDF to output PDF files "on the fly" from his website and handle different languages. It is slower than original scripts like HTML2FPDF and produces larger files when using Unicode fonts, but supports CSS styles etc. and has a lot of enhancements. Supports almost all languages, including RTL (Arabic and Hebrew) and CJK (Chinese, Japanese and Korean). Supports nested block-level elements (such as P, DIV),

SAP NetWeaver Server Adapter for Eclipse

SAP NetWeaver Server Adapter for Eclipse

Integrate Eclipse with SAP NetWeaver application server.

SublimeText3 Mac version

SublimeText3 Mac version

God-level code editing software (SublimeText3)

MinGW - Minimalist GNU for Windows

MinGW - Minimalist GNU for Windows

This project is in the process of being migrated to osdn.net/projects/mingw, you can continue to follow us there. MinGW: A native Windows port of the GNU Compiler Collection (GCC), freely distributable import libraries and header files for building native Windows applications; includes extensions to the MSVC runtime to support C99 functionality. All MinGW software can run on 64-bit Windows platforms.