-
Notifications
You must be signed in to change notification settings - Fork 1
/
levenshtein.py
executable file
·76 lines (60 loc) · 2.5 KB
/
levenshtein.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
#!/usr/bin/env python
#
# levenshtein - calculate the Levenshtein distance between two strings
#
# Copyright (C) 2015 Michael Davies <[email protected]>
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License as
# published by the Free Software Foundation; either version 2 of the
# License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
# 02111-1307, USA.
#
import os
import sys
def levenshtein(first_str, second_str, first_idx=None,
second_idx=None):
if first_idx is None:
first_idx = len(first_str)
if second_idx is None:
second_idx = len(second_str)
if first_idx == 0:
return second_idx
if second_idx == 0:
return first_idx
if first_str[first_idx-1] == second_str[second_idx-1]:
cost = 0
else:
cost = 1
return min(levenshtein(first_str, second_str, first_idx-1, second_idx) + 1,
levenshtein(first_str, second_str, first_idx, second_idx-1) + 1,
levenshtein(first_str, second_str, first_idx-1,
second_idx-1) + cost)
if __name__ == '__main__':
progname = os.path.basename(__file__)
if len(sys.argv) == 2 and sys.argv[1] == "test":
import unittest
class TestLevenshtein(unittest.TestCase):
def test_simple(self):
self.assertEqual(3, levenshtein('Saturday', 'Sunday'))
self.assertEqual(1, levenshtein('Suzie', 'Susie'))
def test_symmetry(self):
self.assertEqual(3, levenshtein('kitten', 'sitting'))
self.assertEqual(3, levenshtein('sitting', 'kitten'))
def test_emptyness(self):
self.assertEqual(4, levenshtein('', 'fred'))
self.assertEqual(4, levenshtein('fred', ''))
unittest.main()
elif len(sys.argv) != 3:
sys.exit('Usage: %s first-string second-string' % progname)
print("The Levenshtein distance between '%s' and '%s' is %s" %
(sys.argv[1], sys.argv[2], levenshtein(sys.argv[1], sys.argv[2])))