C#實現漢字轉漢語拼音的示例代碼
一、使用PinYinConverterCore獲取漢語拼音
最新在做一個搜索組件,需要使用漢語拼音的首字母查詢出符合條件的物品名稱,由於漢字存在多音字,所以自己寫查詢組件不太現實,因此,我們使用微軟提供的CHSPinYinConv
,CHSPinYinConv
在.net core下載安裝沒有問題,但在.net framework會由於兼容性會安裝失敗,因此使用瞭PinYinConverterCore
來實現漢字轉拼音,PinYinConverterCore
應該也是基於CHSPinYinConv
開發的兼容包,後續的代碼兩個安裝包環境下都可以使用。使用Nuget
搜索PinYinConverterCore
下載並安裝,具體如下:
二、編寫工具擴展類實現獲取漢字的拼音
由於漢字存在多音字,因此,通過漢字獲取到的拼音是一個數組,具體如下:
/// <summary> /// 漢字轉換拼音 /// </summary> public static class PingYinUtil { private static Dictionary<int, List<string>> GetTotalPingYinDictionary(string text) { var chs = text.ToCharArray(); //記錄每個漢字的全拼 Dictionary<int, List<string>> totalPingYinList = new Dictionary<int, List<string>>(); for (int i = 0; i < chs.Length; i++) { var pinyinList = new List<string>(); //是否是有效的漢字 if (ChineseChar.IsValidChar(chs[i])) { ChineseChar cc = new ChineseChar(chs[i]); pinyinList = cc.Pinyins.Where(p => !string.IsNullOrWhiteSpace(p)).ToList(); } else { pinyinList.Add(chs[i].ToString()); } //去除聲調,轉小寫 pinyinList = pinyinList.ConvertAll(p => Regex.Replace(p, @"\d", "").ToLower()); //去重 pinyinList = pinyinList.Where(p => !string.IsNullOrWhiteSpace(p)).Distinct().ToList(); if (pinyinList.Any()) { totalPingYinList[i] = pinyinList; } } return totalPingYinList; } /// <summary> /// 獲取漢語拼音全拼 /// </summary> /// <param name="text">The string.</param> /// <returns></returns> public static List<string> GetTotalPingYin(this string text) { var result = new List<string>(); foreach (var pys in GetTotalPingYinDictionary(text)) { var items = pys.Value; if (result.Count <= 0) { result = items; } else { //全拼循環匹配 var newTotalPingYinList = new List<string>(); foreach (var totalPingYin in result) { newTotalPingYinList.AddRange(items.Select(item => totalPingYin + item)); } newTotalPingYinList = newTotalPingYinList.Distinct().ToList(); result = newTotalPingYinList; } } return result; } /// <summary> /// 獲取漢語拼音首字母 /// </summary> /// <param name="text"></param> /// <returns></returns> public static List<string> GetFirstPingYin(this string text) { var result = new List<string>(); foreach (var pys in GetTotalPingYinDictionary(text)) { var items = pys.Value; if (result.Count <= 0) { result = items.ConvertAll(p => p.Substring(0, 1)).Distinct().ToList(); } else { //首字母循環匹配 var newFirstPingYinList = new List<string>(); foreach (var firstPingYin in result) { newFirstPingYinList.AddRange(items.Select(item => firstPingYin + item.Substring(0, 1))); } newFirstPingYinList = newFirstPingYinList.Distinct().ToList(); result = newFirstPingYinList; } } return result; } }
三、編寫測試用例
我們編寫一個測試用例,通過輸入的漢字獲取到漢語拼音的全拼和首字母縮寫,具體如下:
// 漢字輸入 string text = TextBoxInput.Text; // 獲取到漢語拼音的全拼 TextBoxTotal.Text = string.Join(",", text.GetTotalPingYin()); // 獲取到漢語拼音的首字母 TextBoxFirst.Text = string.Join(",", text.GetFirstPingYin());
我們編寫錄入一組用戶名,然後根據輸入輸入的用戶名的縮寫,篩選出符合條件的人,我們可以使用Linq
模糊查詢,具體如下:
public class Student { public string Name { get; set; } public List<string> Pinyin { get; set; } }
StudentList = new List<Student> { new Student() {Name = "張三"}, new Student() {Name = "章黎"}, new Student() {Name = "張三豐"}, new Student() {Name = "李四"}, new Student() {Name = "王五"}, new Student() {Name = "John"}, new Student() {Name = "W.吳"}, new Student() {Name = "阿姨"}, new Student() {Name = "阿膠"}, new Student() {Name = "麥合蘇提.麥合蘇提"} };
var text = TextBoxSearch.Text; foreach (var student in StudentList) { student.Pinyin = student.Name.GetFirstPingYin(); } StudentList = StudentList.Where(s => s.Pinyin.Exists(p=>p.Contains(text))).ToList();
到此這篇關於C#實現漢字轉漢語拼音的示例代碼的文章就介紹到這瞭,更多相關C#漢字轉拼音內容請搜索WalkonNet以前的文章或繼續瀏覽下面的相關文章希望大傢以後多多支持WalkonNet!