From 052027fb503220294e5709d9cc0a0e591cb0d3c7 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E6=B6=B5=E6=9B=A6?=
Date: Wed, 13 Nov 2024 23:28:10 +0800
Subject: [PATCH] =?UTF-8?q?feat:=20=E6=96=B0=E5=A2=9E=E6=A8=A1=E7=B3=8A?=
 =?UTF-8?q?=E5=8C=B9=E9=85=8D=E6=B5=8B=E8=AF=95=E7=94=A8=E4=BE=8B?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
Reviewer notes. They sit after the "---" separator, so they are commentary
only: not part of the commit message and not part of the file this patch
creates.

* The RFC 2047-encoded subject reads, in English:
  "feat: add fuzzy-matching test cases".
* The patch adds exactly one new file, test/test_difflib.py
  (33 lines, mode 100644). No existing file is modified.
* Everything the new file does is under `if __name__ == "__main__":`.
  It defines no functions and contains no assert statements; every result
  is only printed, so the script has to be run directly and read by eye.
  NOTE(review): with no test functions in it, a test runner would
  presumably collect nothing from this file - confirm that is intended.
* Step 1 scores two candidate titles against the query string with
  difflib.SequenceMatcher(None, candidate, query).ratio() and prints each
  candidate next to its score.
  NOTE(review): both candidates contain the 4-character query in full and
  differ only in length (13 vs 11 characters), so by the documented
  2*M/T ratio formula the scores should come out as 8/17 and 8/15, i.e.
  the shorter title scores higher - confirm by running the script.
* Step 2 calls keyword_detection(query, candidates, n=10) on a three-item
  list (the shorter title, the longer title, then an unrelated string),
  unpacks the result into two values and prints them.
* Step 3 builds a dict mapping the keys "1", "2", "3" to the three strings
  and passes it as extra_search_index to
  find_best_match(query, candidates, cutoff=0.4, n=100, ...), then prints
  the result.
* keyword_detection and find_best_match are imported from xiaomusic.utils
  and are not defined in this patch; what they return, and how
  extra_search_index is interpreted, cannot be told from here.

 test/test_difflib.py | 33 +++++++++++++++++++++++++++++++++
 1 file changed, 33 insertions(+)
 create mode 100644 test/test_difflib.py

diff --git a/test/test_difflib.py b/test/test_difflib.py
new file mode 100644
index 0000000..95a862a
--- /dev/null
+++ b/test/test_difflib.py
@@ -0,0 +1,33 @@
+import difflib
+
+from xiaomusic.utils import (
+    keyword_detection,
+    find_best_match,
+)
+
+if __name__ == "__main__":
+    user_input = "八年的爱"
+    s1 = "冰冰超人 - 八年的爱新版"
+    s2 = "冰冰超人 - 八年的爱"
+    r1 = difflib.SequenceMatcher(None, s1, user_input).ratio()
+    r2 = difflib.SequenceMatcher(None, s2, user_input).ratio()
+    print(s1, r1)
+    print(s2, r2)
+
+    s3 = "其他"
+    str_list = [s2, s1, s3]
+    matches, remains = keyword_detection(user_input, str_list, n=10)
+    print(matches, remains)
+
+    extra_search_index = {}
+    extra_search_index["1"] = s1
+    extra_search_index["2"] = s2
+    extra_search_index["3"] = s3
+    real_names = find_best_match(
+        user_input,
+        str_list,
+        cutoff=0.4,
+        n=100,
+        extra_search_index=extra_search_index,
+    )
+    print(real_names)