| 123456789101112131415161718192021222324252627282930313233 |
- import numpy as np
- from .string_distance import StringDistance
class LongestCommonSubsequence(StringDistance):
    """Edit distance based on the longest common subsequence (LCS).

    The distance between two sequences is
    ``len(s0) + len(s1) - 2 * LCS(s0, s1)``, i.e. the number of elements
    that are not part of the longest common subsequence.
    """

    def distance(self, s0, s1):
        """Return the LCS distance between ``s0`` and ``s1``.

        Args:
            s0: First sequence (anything supporting ``len`` and iteration).
            s1: Second sequence (anything supporting ``len`` and iteration).

        Returns:
            ``0.0`` when the arguments compare equal, otherwise
            ``len(s0) + len(s1) - 2 * self.length(s0, s1)``.

        Raises:
            TypeError: If ``s0`` or ``s1`` is ``None``.
        """
        if s0 is None:
            raise TypeError("Argument s0 is NoneType.")
        if s1 is None:
            raise TypeError("Argument s1 is NoneType.")
        # Equal inputs need no dynamic programming at all.
        if s0 == s1:
            return 0.0
        return len(s0) + len(s1) - 2 * self.length(s0, s1)

    @staticmethod
    def length(s0, s1):
        """Return the length of the longest common subsequence.

        Only the previous and the current row of the dynamic-programming
        table are kept, so memory use is proportional to ``len(s1)``
        instead of ``len(s0) * len(s1)``.

        Args:
            s0: First sequence.
            s1: Second sequence.

        Returns:
            The LCS length as a ``numpy.float64``. The float type is kept
            for backward compatibility: the earlier implementation read the
            result out of a ``np.zeros`` matrix, which is float64 by default.

        Raises:
            TypeError: If ``s0`` or ``s1`` is ``None``.
        """
        if s0 is None:
            raise TypeError("Argument s0 is NoneType.")
        if s1 is None:
            raise TypeError("Argument s1 is NoneType.")

        # previous[j] holds the LCS length of the s0 prefix processed so far
        # and the first j elements of s1; column 0 is the empty prefix.
        previous = [0] * (len(s1) + 1)
        for left in s0:
            current = [0]
            for j, right in enumerate(s1, start=1):
                if left == right:
                    # Matching elements extend the diagonal neighbour.
                    current.append(previous[j - 1] + 1)
                else:
                    # Otherwise carry over the better of left / upper cell.
                    current.append(max(current[j - 1], previous[j]))
            previous = current

        return np.float64(previous[-1])
|