|
@@ -26,26 +26,12 @@ from .jaccard import Jaccard
|
|
class TestJaccard(unittest.TestCase):
|
|
class TestJaccard(unittest.TestCase):
|
|
|
|
|
|
def test_jaccard(self):
|
|
def test_jaccard(self):
|
|
- a = Jaccard(1)
|
|
|
|
- s0 = ""
|
|
|
|
- s1 = ""
|
|
|
|
- s2 = "上海"
|
|
|
|
- s3 = "上海市"
|
|
|
|
- distance_format = "distance: {:.4}\t between {} and {}"
|
|
|
|
- similarity_format = "similarity: {:.4}\t between {} and {}"
|
|
|
|
- print(distance_format.format(str(a.distance(s0, s1)), s0, s1))
|
|
|
|
- print(distance_format.format(str(a.distance(s0, s2)), s0, s2))
|
|
|
|
- print(distance_format.format(str(a.distance(s0, s3)), s0, s3))
|
|
|
|
- print(distance_format.format(str(a.distance(s1, s2)), s1, s2))
|
|
|
|
- print(distance_format.format(str(a.distance(s1, s3)), s1, s3))
|
|
|
|
- print(distance_format.format(str(a.distance(s2, s3)), s2, s3))
|
|
|
|
-
|
|
|
|
- print(similarity_format.format(str(a.similarity(s0, s1)), s0, s1))
|
|
|
|
- print(similarity_format.format(str(a.similarity(s0, s2)), s0, s2))
|
|
|
|
- print(similarity_format.format(str(a.similarity(s0, s3)), s0, s3))
|
|
|
|
- print(similarity_format.format(str(a.similarity(s1, s2)), s1, s2))
|
|
|
|
- print(similarity_format.format(str(a.similarity(s1, s3)), s1, s3))
|
|
|
|
- print(similarity_format.format(str(a.similarity(s2, s3)), s2, s3))
|
|
|
|
|
|
+ jaccard = Jaccard(1)
|
|
|
|
+ s = ['', ' ', 'Shanghai', 'ShangHai', 'Shang Hai']
|
|
|
|
+ for i in range(len(s)):
|
|
|
|
+ for j in range(i, len(s)):
|
|
|
|
+ print('dis between \'%s\' and \'%s\': %.4f' % (s[i], s[j], jaccard.distance(s[i], s[j])))
|
|
|
|
+ print('sim between \'%s\' and \'%s\': %.4f' % (s[i], s[j], jaccard.similarity(s[i], s[j])))
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
if __name__ == "__main__":
|