LeetCode-Edit Distance

编辑距离,很常见的题目,貌似去年google笔试就考了这道题,

典型的DP,dp[i][j]表示word2[i]到word1[j]的最小编辑距离;

当word2[i]与word1[j]不相同时有三种方式:

1.改变字符,dp[i][j] = dp[i - 1][j- 1] + 1;

2.插入字符,dp[i][j] = dp[i ][j - 1]  + 1;

3.删除字符,dp[i][j] = dp[i - 1][j] + 1;

故dp[i][j] = min(1,2,3);

当word2[i]与word1[j]相同时:

dp[i][j] = dp[i - 1][j - 1];

 1 class Solution {
 2 public:
 3     int minDistance(string word1, string word2) {
 4         // Start typing your C/C++ solution below
 5         // DO NOT write int main() function
 6         int m = word1.size(), n = word2.size();
 7         vector<vector<int> > dp(n + 1, vector<int>(m + 1));
 8         for (int i = 0; i <= n; ++i)
 9             dp[i][0] = i;
10         for (int j = 0; j <= m; ++j)
11             dp[0][j] = j;
12         for (int i = 1; i <= n; ++i)
13             for (int j = 1; j <= m; ++j) {
14                 if (word2[i - 1] == word1[j - 1])
15                     dp[i][j] = dp[i - 1][j - 1];
16                 else 
17                     dp[i][j] = min(dp[i - 1][j - 1], min(dp[i][j - 1], dp[i - 1][j])) + 1;
18             }
19         return dp[n][m];
20     }
21 };

不过看到还有更好的方法,可以把空间复杂度降低到O(n),

n = word2.length();

dp[n + 1], dp[i]记录到word2[i]的最小编辑距离,

动态更新的过程要巧妙一点,从word1的开始逐步更新,

计算word1的(0, word1[i])到word2[j]的最小编辑距离,

更新dp[j];

递推过程:

当更新word1的第i个字符时,dp[j]中存的是上一步的值,即word[i - 1]与word2[j]的距离;

相当于前一种方法中的dp[i - 1][j],

按0<= j <=n 遍历word2,

dp[j]相当于dp[i - 1][j];

dp[j - 1]相当于dp[i - 1][j - 1];

在更新dp[j]为当前这一步(即遍历到word1[i])的值时,

当字符相同时:

当前的距离cur = dp[i - 1][j - 1] = dp[j - 1],

由于要用到上一步的dp[j - 1],所以使用之后才能更新;

当字符不同时:

1.改变字符,cur = dp[i - 1][j- 1] + 1;

2.插入字符,cur = dp[i ][j - 1]  + 1;

3.删除字符,cur = dp[i - 1][j] + 1;

1,3都要用到上一步的dp[j - 1], dp[j];

2为当前这一步已经更新了的dp[j - 1],

所以这里无法用dp[j - 1]表示两个值,故可以用一个变量pre记录当前上一次的值pre = dp[i][j - 1];

当执行到j时,

更新dp[j -1] = pre,然后令 pre = cur = dp[j];

 1 class Solution {
 2 public:
 3     int minDistance(string word1, string word2) {
 4         // Start typing your C/C++ solution below
 5         // DO NOT write int main() function
 6         if (word1.empty()) {
 7             return word2.size();
 8         }
 9         if (word2.empty()) {
10             return word1.size();
11         }
12         int m = word1.size(), n = word2.size();
13         int i = 0;
14         vector<int> dp(n + 1, 0);
15         for (int i = 0; i <= n; ++i)
16             dp[i] = i;
17         for (int i = 1; i <= m; ++i) {
18             int pre = i;
19             int cur = i;
20             for (int j = 1; j <= n; ++j) {
21                 if (word1[i - 1] == word2[j - 1])
22                     cur = dp[j - 1];
23                 else
24                     cur = min(min(dp[j - 1], dp[j]), pre) + 1;            
25                 dp[j - 1] = pre;
26                 pre = cur;
27             }
28             dp[n] = cur;
29         }
30         return dp[n];
31     }
32 };
原文地址:https://www.cnblogs.com/chasuner/p/editdist.html