/// <summary>
        /// Strips HTML markup from a string and returns the remaining text.
        /// </summary>
        /// <remarks>
        /// The patterns in <c>HtmlToTxtPatterns</c> are applied in order and every
        /// match is replaced with an empty string: script elements, tags, line
        /// breaks followed by whitespace, character entities, and comment
        /// delimiters. Entities are removed, not decoded. Any remaining
        /// angle brackets and CR/LF pairs are removed at the end.
        /// </remarks>
        /// <param name="strHtml">The HTML text to strip. May be null or empty.</param>
        /// <returns>
        /// The stripped text, or an empty string when <paramref name="strHtml"/>
        /// is null or empty.
        /// </returns>
        public static string HtmlToTxt(string strHtml)
        {
            // Regex.Replace throws on null input; treat "nothing in" as "nothing out".
            if (string.IsNullOrEmpty(strHtml))
            {
                return string.Empty;
            }

            string strOutput = strHtml;
            foreach (Regex pattern in HtmlToTxtPatterns)
            {
                strOutput = pattern.Replace(strOutput, string.Empty);
            }

            // string.Replace returns a new string, so the result must be kept;
            // calling it as a bare statement leaves the text unchanged.
            return strOutput
                .Replace("<", string.Empty)
                .Replace(">", string.Empty)
                .Replace("\r\n", string.Empty);
        }

        // Patterns applied, in order, by HtmlToTxt. Built once instead of on every call.
        private static readonly Regex[] HtmlToTxtPatterns =
        {
            // Singleline lets '.' match line breaks so that script bodies
            // spanning several lines are removed together with their tags.
            new Regex(@"<script[^>]*?>.*?</script>", RegexOptions.IgnoreCase | RegexOptions.Singleline),
            // Any opening, closing or self-closing tag, including quoted attribute values.
            new Regex(@"<(\/\s*)?!?((\w+:)?\w+)(\w+(\s*=?\s*(([""'])(\\[""'tbnr]|[^\7])*?\7|\w+)|.{0})|\s)*?(\/\s*)?>", RegexOptions.IgnoreCase),
            // A line break together with the whitespace that follows it.
            new Regex(@"([\r\n])[\s]+", RegexOptions.IgnoreCase),
            // Named and numeric character entities.
            new Regex(@"&(quot|#34);", RegexOptions.IgnoreCase),
            new Regex(@"&(amp|#38);", RegexOptions.IgnoreCase),
            new Regex(@"&(lt|#60);", RegexOptions.IgnoreCase),
            new Regex(@"&(gt|#62);", RegexOptions.IgnoreCase),
            new Regex(@"&(nbsp|#160);", RegexOptions.IgnoreCase),
            new Regex(@"&(iexcl|#161);", RegexOptions.IgnoreCase),
            new Regex(@"&(cent|#162);", RegexOptions.IgnoreCase),
            new Regex(@"&(pound|#163);", RegexOptions.IgnoreCase),
            new Regex(@"&(copy|#169);", RegexOptions.IgnoreCase),
            new Regex(@"&#(\d+);", RegexOptions.IgnoreCase),
            // Comment terminator, then a comment opener through the end of its line.
            new Regex(@"-->", RegexOptions.IgnoreCase),
            new Regex(@"<!--.*\n", RegexOptions.IgnoreCase)
        };

 

// Posted on 2017-02-16 15:00 by 遥望末班车 (blog page footer: 1005 views, 0 comments; edit / bookmark / report links)