修改database_tools中的两个函数, 排除OBSOLETE的题目被选入的可能

This commit is contained in:
weiye.wang 2023-07-09 16:13:27 +08:00
parent c1740186d8
commit b0a90fcf75
1 changed file with 2 additions and 2 deletions

View File

@@ -61,7 +61,7 @@ def detectmaxsim(currentid,excludelist,adict): #检测与已知题目关联程
maxsim = -1
argmaxsim = "000000"
for id in adict:
-if not id in excludelist:
+if not id in excludelist and not "OBSOLETE" in adict[id]["content"]:
simrate = Levenshtein.jaro(adict[id]["content"],adict[currentid]["content"])
if simrate > maxsim:
maxsim = simrate
@@ -76,7 +76,7 @@ def generate_sim_group(startingids,prodict,max_size,threshold): #生成与已知
while continue_flag:
appending_id_list = []
for oldid in id_list:
-for newid in [id for id in prodict if not id in id_list and not id in output_list]:
+for newid in [id for id in prodict if not id in id_list and not id in output_list and not "OBSOLETE" in treated_dict[id]["content"]]:
simrate = Levenshtein.jaro(treated_dict[oldid]["content"],treated_dict[newid]["content"])
if simrate >= threshold:
appending_id_list.append(newid)