diff --git a/工具/局部相似题目检测.py b/工具/局部相似题目检测.py index 8ed35a58..e1e77252 100644 --- a/工具/局部相似题目检测.py +++ b/工具/局部相似题目检测.py @@ -1,9 +1,9 @@ import os,re,difflib,Levenshtein,time,json # 重要!!! 新旧题目的范围(有重复默认为新题) -id_new_problems = "30000:39999" +id_new_problems = "15311:15331" id_old_problems = "1:50000" -threshold = 0.99 +threshold = 0.85 #生成数码列表, 逗号分隔每个区块, 区块内部用:表示整数闭区间 def generate_number_set(string): diff --git a/题库0.3/Problems.json b/题库0.3/Problems.json index 98b281d2..f4902e82 100644 --- a/题库0.3/Problems.json +++ b/题库0.3/Problems.json @@ -6485,7 +6485,9 @@ "same": [ "008818" ], - "related": [], + "related": [ + "015318" + ], "remark": "", "space": "12ex" }, @@ -6863,7 +6865,9 @@ "20220624\t王伟叶, 余利成" ], "same": [], - "related": [], + "related": [ + "015319" + ], "remark": "", "space": "12ex" }, @@ -60960,7 +60964,9 @@ "20220625\t王伟叶" ], "same": [], - "related": [], + "related": [ + "015311" + ], "remark": "", "space": "" }, @@ -267959,7 +267965,9 @@ "same": [ "008901" ], - "related": [], + "related": [ + "015316" + ], "remark": "", "space": "12ex" }, @@ -378093,7 +378101,9 @@ "20230420\t王伟叶" ], "same": [], - "related": [], + "related": [ + "002174" + ], "remark": "", "space": "" }, @@ -378114,7 +378124,9 @@ "20230420\t王伟叶" ], "same": [], - "related": [], + "related": [ + "031210" + ], "remark": "", "space": "" }, @@ -378198,7 +378210,9 @@ "20230420\t王伟叶" ], "same": [], - "related": [], + "related": [ + "010677" + ], "remark": "", "space": "" }, @@ -378240,7 +378254,9 @@ "20230420\t王伟叶" ], "same": [], - "related": [], + "related": [ + "000246" + ], "remark": "", "space": "" }, @@ -378261,7 +378277,9 @@ "20230420\t王伟叶" ], "same": [], - "related": [], + "related": [ + "000260" + ], "remark": "", "space": "" }, @@ -457349,7 +457367,8 @@ ], "same": [], "related": [ - "009985" + "009985", + "015312" ], "remark": "", "space": ""