近期在学习subtext,在Subtext.Framework中很类的写法,都很经典,值的我们深入去学习。
在Subtext.Framework中Entries.cs提供了"获取汉字第一个拼音",在后期会不断和大家一起分享学习心得。
在使用下列代码时,请引用
using System.Text;
using System.Text.RegularExpressions;
static string RemoveNonWordCharacters(string text)
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedBlockStart.gif)
{
string txt = getSpells(text);//中文转换成拼音
Regex regex = new Regex(@"[\w\d\.\- ]+", RegexOptions.Compiled);
MatchCollection matches = regex.Matches(txt);
string cleansedText = string.Empty;
![](https://www.cnblogs.com/Images/OutliningIndicators/InBlock.gif)
foreach (Match match in matches)
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
{
if (match.Value.Length > 0)
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
{
cleansedText += match.Value;
}
}
return cleansedText;
}
![](https://www.cnblogs.com/Images/OutliningIndicators/None.gif)
![](https://www.cnblogs.com/Images/OutliningIndicators/ContractedBlock.gif)
获取汉字第一个拼音#region 获取汉字第一个拼音
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
/**//// <summary>
/// 获取汉字第一个拼音
/// </summary>
/// <param name="input"></param>
/// <returns></returns>
static public string getSpells(string input)
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
{
int len = input.Length;
string reVal = "";
for (int i = 0; i < len; i++)
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
{
reVal += getSpell(input.Substring(i, 1));
}
return reVal;
}
![](https://www.cnblogs.com/Images/OutliningIndicators/InBlock.gif)
static public string getSpell(string cn)
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
{
byte[] arrCN = System.Text.Encoding.Default.GetBytes(cn);
if (arrCN.Length > 1)
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
{
int area = (short)arrCN[0];
int pos = (short)arrCN[1];
int code = (area << 8) + pos;
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
int[] areacode =
{ 45217, 45253, 45761, 46318, 46826, 47010, 47297, 47614, 48119, 48119, 49062, 49324, 49896, 50371, 50614, 50622, 50906, 51387, 51446, 52218, 52698, 52698, 52698, 52980, 53689, 54481 };
for (int i = 0; i < 26; i++)
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
{
int max = 55290;
if (i != 25) max = areacode[i + 1];
if (areacode[i] <= code && code < max)
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
{
![](https://www.cnblogs.com/Images/OutliningIndicators/ExpandedSubBlockStart.gif)
return System.Text.Encoding.Default.GetString(new byte[]
{ (byte)(65 + i) });
}
}
return "?";
}
else return cn;
}
#endregion
}