Van Pan

导航

Edit Distance (编辑距离) .NET 实现

    /// <summary>
    /// Utility class for computing the edit (Levenshtein) distance between two strings.
    /// </summary>
    public static class TextEditDistanceUtility
    {
        /// <summary>
        /// Computes the minimum number of single-character insertions, deletions and
        /// substitutions required to transform one string into the other.
        /// </summary>
        /// <param name="str1">The first string; <c>null</c> is treated the same as an empty string.</param>
        /// <param name="str2">The second string; <c>null</c> is treated the same as an empty string.</param>
        /// <returns>
        /// The edit distance between the two strings. Returns 0 when both are equal or both are
        /// null/empty, and the length of the other string when exactly one is null/empty.
        /// </returns>
        /// <remarks>
        /// Characters are compared as individual <see cref="char"/> values (UTF-16 code units),
        /// case-sensitively. Only two rows of the dynamic-programming table are kept, so the
        /// extra memory used is proportional to the length of the shorter string.
        /// </remarks>
        public static int GetEditDistance(string str1, string str2)
        {
            if (String.IsNullOrEmpty(str1))
            {
                return String.IsNullOrEmpty(str2) ? 0 : str2.Length;
            }

            if (String.IsNullOrEmpty(str2))
            {
                return str1.Length;
            }

            if (str1 == str2)
            {
                return 0;
            }

            // Edit distance is symmetric, so iterate rows over the longer string and
            // keep the row buffers as small as the shorter one.
            string longer = str1;
            string shorter = str2;
            if (shorter.Length > longer.Length)
            {
                longer = str2;
                shorter = str1;
            }

            int[] previousRow = new int[shorter.Length + 1];
            int[] currentRow = new int[shorter.Length + 1];

            // Row 0: turning an empty prefix into the first j characters takes j insertions.
            for (int j = 0; j <= shorter.Length; j++)
            {
                previousRow[j] = j;
            }

            for (int i = 0; i < longer.Length; i++)
            {
                // Column 0: turning the first i + 1 characters into an empty prefix takes i + 1 deletions.
                currentRow[0] = i + 1;

                for (int j = 0; j < shorter.Length; j++)
                {
                    int cost = longer[i] == shorter[j] ? 0 : 1;

                    int deletion = previousRow[j + 1] + 1;
                    int insertion = currentRow[j] + 1;
                    int substitution = previousRow[j] + cost;

                    currentRow[j + 1] = Math.Min(Math.Min(deletion, insertion), substitution);
                }

                // The row just filled becomes the "previous" row for the next iteration;
                // the old buffer is reused and fully overwritten.
                int[] swap = previousRow;
                previousRow = currentRow;
                currentRow = swap;
            }

            return previousRow[shorter.Length];
        }
    }


Edit Distance(编辑距离)是指将一个字符串变换为另一个字符串所需的最少基础操作次数。基础操作包括:增加一个字符、删除一个字符、修改一个字符,每种操作均算作一次。

比如abb和bbb,编辑距离就是1,abc变成aa,编辑距离就是2

这个算法比较多的应用就是比较两次结果之间差别有多大

posted on 2012-11-14 14:44  Van Pan  阅读(207)  评论(0)  编辑  收藏  举报