import numpy as np

from .string_distance import StringDistance


class LongestCommonSubsequence(StringDistance):
    """Distance based on the longest common subsequence (LCS) of two sequences.

    The distance is ``len(s0) + len(s1) - 2 * LCS(s0, s1)``, i.e. the number
    of elements of both inputs that are not part of the common subsequence.
    """

    def distance(self, s0, s1):
        """Return the LCS distance between ``s0`` and ``s1`` as a float.

        Args:
            s0: First sequence (anything supporting ``len`` and iteration,
                typically a ``str``).
            s1: Second sequence.

        Returns:
            ``0.0`` when the inputs compare equal, otherwise
            ``len(s0) + len(s1) - 2 * self.length(s0, s1)`` as a float.

        Raises:
            TypeError: If ``s0`` or ``s1`` is ``None``.
        """
        if s0 is None:
            raise TypeError("Argument s0 is NoneType.")
        if s1 is None:
            raise TypeError("Argument s1 is NoneType.")
        if s0 == s1:
            # Equal inputs share everything; skip the quadratic table.
            return 0.0
        # length() yields an int; convert so every path returns a float,
        # consistent with the 0.0 shortcut above.
        return float(len(s0) + len(s1) - 2 * self.length(s0, s1))

    @staticmethod
    def length(s0, s1):
        """Return the length of the longest common subsequence as an int.

        Fills an ``(len(s0) + 1) x (len(s1) + 1)`` table where cell
        ``[i, j]`` holds the LCS length of the first ``i`` elements of ``s0``
        and the first ``j`` elements of ``s1``.

        Args:
            s0: First sequence.
            s1: Second sequence.

        Returns:
            The number of elements in the longest common subsequence.

        Raises:
            TypeError: If ``s0`` or ``s1`` is ``None``.
        """
        if s0 is None:
            raise TypeError("Argument s0 is NoneType.")
        if s1 is None:
            raise TypeError("Argument s1 is NoneType.")

        s0_len, s1_len = len(s0), len(s1)
        # Integer dtype: the table stores counts, so the result should not
        # come back as a floating-point value. Row 0 and column 0 stay zero
        # and represent the empty prefix.
        matrix = np.zeros((s0_len + 1, s1_len + 1), dtype=int)

        for i, left in enumerate(s0, start=1):
            for j, right in enumerate(s1, start=1):
                if left == right:
                    # Matching elements extend the LCS of both shorter prefixes.
                    matrix[i, j] = matrix[i - 1, j - 1] + 1
                else:
                    # Otherwise carry over the better result from dropping
                    # one element from either side.
                    matrix[i, j] = max(matrix[i, j - 1], matrix[i - 1, j])

        # Convert the numpy scalar to a built-in int for callers.
        return int(matrix[s0_len, s1_len])