# Sweet Snippet 之 字符串编辑距离

• 删除某一字符
• 增加某一字符

(这里我们不允许变更某一字符,注意一下)

$C(i, j)$ : $a$ 的(前缀)子串(长度为 $i$) 与 $b$ 的(前缀)子串(长度为 $j$) 的字符串编辑距离.

$$
C(i, j) =
\begin{cases}
% 0, & \text{if } i = 0 \text{ and } j = 0 \\
i, & \text{if } j = 0 \\
j, & \text{if } i = 0 \\
C(i - 1, j - 1), & \text{if } a[i] = b[j] \\
\min(C(i - 1, j),\ C(i, j - 1)) + 1, & \text{otherwise}
\end{cases}
$$

-- Build the string key that identifies table cell (m, n).
-- The two indices are joined with "_" so that e.g. (1, 23) and (12, 3)
-- map to different keys ("1_23" vs "12_3").
function get_key(m, n)
  local suffix = "_" .. n
  return m .. suffix
end

-- Bottom-up computation of the insert/delete-only edit distance between
-- the first m characters of a and the first n characters of b.
--
-- Recurrence (substitution is not allowed):
--   C(i, 0) = i
--   C(0, j) = j
--   C(i, j) = C(i - 1, j - 1)                    if a[i] == b[j]
--   C(i, j) = min(C(i - 1, j), C(i, j - 1)) + 1  otherwise
--
-- Row i depends only on row i - 1, so two integer-indexed rows are kept
-- and reused instead of a full m x n table addressed through string keys.
-- This needs O(n) memory and avoids building a key string per cell access.
--
-- a, b: the strings to compare
-- m, n: prefix lengths to consider (expected 0 <= m, 0 <= n; normally #a, #b)
-- returns: C(m, n)
function edit_dist_iter(a, b, m, n)
  -- prev[j] holds C(i - 1, j); it starts as row 0, where C(0, j) = j.
  local prev, cur = {}, {}
  for j = 0, n do
    prev[j] = j
  end

  for i = 1, m do
    -- a[i] does not change while j varies, so fetch it once per row.
    local ac = a:sub(i, i)
    cur[0] = i -- C(i, 0) = i
    for j = 1, n do
      if ac == b:sub(j, j) then
        cur[j] = prev[j - 1]
      else
        cur[j] = math.min(prev[j], cur[j - 1]) + 1
      end
    end
    -- The row just filled becomes "previous"; the old one is overwritten next.
    prev, cur = cur, prev
  end

  return prev[n]
end

-- Edit distance between the whole strings a and b, computed by the
-- iterative solver over their full lengths.
function edit_dist(a, b)
  local len_a, len_b = #a, #b
  return edit_dist_iter(a, b, len_a, len_b)
end

-- Map a pair of indices (m, n) to the string key used by the memo table,
-- in the form "<m>_<n>".
function get_key(m, n)
  local sep = "_"
  return m .. sep .. n
end

-- Top-down (memoized) insert/delete-only edit distance between the first
-- m characters of a and the first n characters of b.
--
-- buffer is the memo table: results for non-trivial cells are stored under
-- get_key(m, n). Cells with m <= 0 or n <= 0 are answered directly and are
-- never written to the buffer.
function edit_dist_recur(a, b, m, n, buffer)
  -- Trivial cells: one prefix is empty, so the distance is the other length.
  if m <= 0 then
    return n
  end
  if n <= 0 then
    return m
  end

  local dist
  if a:sub(m, m) == b:sub(n, n) then
    -- Last characters match: same distance as the two shorter prefixes.
    dist = buffer[get_key(m - 1, n - 1)]
      or edit_dist_recur(a, b, m - 1, n - 1, buffer)
  else
    -- Mismatch: drop the last character of a or of b, whichever is cheaper.
    local without_a = buffer[get_key(m - 1, n)]
      or edit_dist_recur(a, b, m - 1, n, buffer)
    local without_b = buffer[get_key(m, n - 1)]
      or edit_dist_recur(a, b, m, n - 1, buffer)
    dist = math.min(without_a, without_b) + 1
  end

  buffer[get_key(m, n)] = dist
  return dist
end

-- Edit distance between the whole strings a and b, computed by the
-- memoized recursive solver. Each call starts with a fresh, empty memo table.
function edit_dist(a, b)
  local memo = {}
  local len_a, len_b = #a, #b
  return edit_dist_recur(a, b, len_a, len_b, memo)
end

