C# 获取汉字拼音首字母/全拼

最近悟出来一个道理，在这儿分享给大家：学历代表你的过去，能力代表你的现在，学习代表你的将来。

十年河东十年河西，莫欺少年穷

学无止境，精益求精

本节探讨C#获取汉字拼音首字母的方法：

代码类东西，直接上代码：

        /// <summary>

        /// 在指定的字符串列表CnStr中检索符合拼音索引字符串

        /// </summary>

        /// <param name="CnStr">汉字字符串</param>

        /// <returns>相对应的汉语拼音首字母串</returns>

        public static string GetSpellCode(string CnStr)

        {

            string strTemp = "";

            int iLen = CnStr.Length;

            int i = ;

            for (i = ; i <= iLen - ; i++)

            {

                strTemp += GetCharSpellCode(CnStr.Substring(i, ));

                break;

            }

            return strTemp;

        }

        /// <summary>

        /// 得到一个汉字的拼音第一个字母，如果是一个英文字母则直接返回大写字母

        /// </summary>

        /// <param name="CnChar">单个汉字</param>

        /// <returns>单个大写字母</returns>

        private static string GetCharSpellCode(string CnChar)

        {

            long iCnChar;

            byte[] ZW = System.Text.Encoding.Default.GetBytes(CnChar);

            //如果是字母，则直接返回首字母

            if (ZW.Length == )

            {

                return CommonMethod.CutString(CnChar.ToUpper(),);

            }

            else

            {

                // get the array of byte from the single char

                int i1 = (short)(ZW[]);

                int i2 = (short)(ZW[]);

                iCnChar = i1 *  + i2;

            }

            // iCnChar match the constant

            if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "A";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "B";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "C";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "D";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "E";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "F";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "G";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "H";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "J";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "K";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "L";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "M";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "N";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "O";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "P";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "Q";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "R";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "S";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "T";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "W";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "X";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "Y";

            }

            else if ((iCnChar >= ) && (iCnChar <= ))

            {

                return "Z";

            }

            else

                return ("?");

        }

截取字符串的方法：

#region 截取字符长度 static string CutString(string str, int len)

        /// <summary>

        /// 截取字符长度

        /// </summary>

        /// <param name="str">被截取的字符串</param>

        /// <param name="len">所截取的长度</param>

        /// <returns>子字符串</returns>

        public static string CutString(string str, int len)

        {

            if (str == null || str.Length ==  || len <= )

            {

                return string.Empty;

            }

            int l = str.Length;

            #region 计算长度

            int clen = ;

            while (clen < len && clen < l)

            {

                //每遇到一个中文，则将目标长度减一。

                if ((int)str[clen] > ) { len--; }

                clen++;

            }

            #endregion

            if (clen < l)

            {

                return str.Substring(, clen) + "...";

            }

            else

            {

                return str;

            }

        }

        /// <summary>

        /// //截取字符串中文 字母

        /// </summary>

        /// <param name="content">源字符串</param>

        /// <param name="length">截取长度！</param>

        /// <returns></returns>

        public static string SubTrueString(object content, int length)

        {

            string strContent = NoHTML(content.ToString());

            bool isConvert = false;

            int splitLength = ;

            int currLength = ;

            int code = ;

            int chfrom = Convert.ToInt32("4e00", );    //范围（0x4e00～0x9fff）转换成int（chfrom～chend）

            int chend = Convert.ToInt32("9fff", );

            for (int i = ; i < strContent.Length; i++)

            {

                code = Char.ConvertToUtf32(strContent, i);

                if (code >= chfrom && code <= chend)

                {

                    currLength += ; //中文

                }

                else

                {

                    currLength += ;//非中文

                }

                splitLength = i + ;

                if (currLength >= length)

                {

                    isConvert = true;

                    break;

                }

            }

            if (isConvert)

            {

                return strContent.Substring(, splitLength);

            }

            else

            {

                return strContent;

            }

        }

        public static int GetStringLenth(object content)

        {

            string strContent = NoHTML(content.ToString());

            int currLength = ;

            int code = ;

            int chfrom = Convert.ToInt32("4e00", );    //范围（0x4e00～0x9fff）转换成int（chfrom～chend）

            int chend = Convert.ToInt32("9fff", );

            for (int i = ; i < strContent.Length; i++)

            {

                code = Char.ConvertToUtf32(strContent, i);

                if (code >= chfrom && code <= chend)

                {

                    currLength += ; //中文

                }

                else

                {

                    currLength += ;//非中文

                }

            }

            return currLength;

        }

        #endregion

以上便是完整代码，谢谢！

在此，顺便说下数据库按照汉字首字母进行排序的方法：

oracle ：

在oracle9i中新增了按照拼音、部首、笔画排序功能。设置NLS_SORT值
SCHINESE_RADICAL_M 按照部首（第一顺序）、笔划（第二顺序）排序
SCHINESE_STROKE_M 按照笔划（第一顺序）、部首（第二顺序）排序
SCHINESE_PINYIN_M 按照拼音排序，系统的默认排序方式为拼音排序

举例如下：
表名为 dept ，其中name字段是中文，下面分别实现按照单位名称的笔划、部首和拼音排序。
//按照笔划排序
select * from dept order by nlssort(name,'NLS_SORT=SCHINESE_STROKE_M');
//按照部首排序
select * from dept order by nlssort(name,'NLS_SORT=SCHINESE_RADICAL_M');
//按照拼音排序，此为系统的默认排序方式
select * from dept order by nlssort(name,'NLS_SORT=SCHINESE_PINYIN_M');

sqlserver

select * from table order by name collate Chinese_PRC_CS_AS_KS_WS 

执行结果：select * from Table where cateFid=0 order by cateName collate Chinese_PRC_CS_AS_KS_WS

C# 获取汉字拼音首字母/全拼

如果您觉得不错，顶下吧！

2019年3月7日完善如下：

如何获取全拼呢？引用第三方DLL。可以在NuGet库中引用：NPinyin

！

获取全拼的代码！

  public static string GetSpellAllCode(string CnStr)

        {

           return NPinyin.Pinyin.GetPinyin(CnStr);

        }

上述代码获取的全拼有空格分隔，如果你不需要空格，可采用：.Replace(" ", "") 把空格替换掉！

但是有个问题需要完善下：

如果上述获取首字母的方法得到的结果中包含‘？’号，这就说明上述方法存在不能翻译的汉字，这时候我们可以将二者相结合，如下：

  string szm = PingYinHelper.GetSpellCode(smSupplierModel.SupplierName);

                if (szm.Contains("?"))

                {

                    szm = string.Empty;

                    var ary = PingYinHelper.GetSpellAllCode(smSupplierModel.SupplierName).Split(' ');

                    foreach (var py in ary)

                    {

                        szm += py.Substring(, );

                    }

                }

                string supplierSZM = szm.ToUpper() + "_" + PingYinHelper.GetSpellAllCode(smSupplierModel.SupplierName).Replace(" ", "");

                smSupplierEntity.Relatcpyno = supplierSZM;

@陈卧龙的博客

秒客网

C# 获取汉字拼音首字母/全拼

相关文章