X-Git-Url: https://git.kaliko.me/?a=blobdiff_plain;f=sima%2Flib%2Fsimastr.py;fp=sima%2Flib%2Fsimastr.py;h=9dacc45d1ea3af6302a1f56b08c9e6049b117a9b;hb=e73aeec41c2065c852294253a8ed85a5d0958f76;hp=c7162144cd95cb3b3d65b793e3e18871ed16e220;hpb=50a7a9b43940155f8b0a3b81bb91a79585104eb9;p=mpd-sima.git diff --git a/sima/lib/simastr.py b/sima/lib/simastr.py index c716214..9dacc45 100644 --- a/sima/lib/simastr.py +++ b/sima/lib/simastr.py @@ -80,6 +80,8 @@ class SimaStr(str): Specific string object for artist names and song titles. Here follows some class variables for regex to run on strings. """ + diafilter = True + leven_ratio = 0.82 regexp_dict = dict() # Leading patterns: The Le Les @@ -105,7 +107,8 @@ class SimaStr(str): self.stripped = str(fuzzstr.strip()) # fuzzy computation self._get_root() - self.remove_diacritics() + if self.__class__.diafilter: + self.remove_diacritics() def __new__(cls, fuzzstr): return super(SimaStr, cls).__new__(cls, fuzzstr) @@ -145,7 +148,7 @@ class SimaStr(str): other.stripped.lower()) if hash(self) == hash(other): return True - return levenr >= 0.82 + return levenr >= self.__class__.leven_ratio def __ne__(self, other): if not isinstance(other, SimaStr):