修改database_tools中的RefineMathpix, 适配mathpix新出现的$\qquad$字符
This commit is contained in:
parent
1dec369099
commit
e096f3c069
|
|
@ -1507,6 +1507,7 @@ def RefineMathpix(raw_string): # 进一步修改mathpix得到的字符串
|
|||
string = re.sub(r"[\.;](\}\{|\}\n)",lambda matchobj: matchobj.group(1),string) #去除选择题选项最末尾的句号或分号
|
||||
string = re.sub(r"\n\s+","\n",string) #删除多余的回车
|
||||
string = re.sub(r"\\q+uad","",string) #删除\quad,\qquad等
|
||||
string = re.sub(r"\$\\q+uad\$","",string)#删除两边有$的\quad,\qquad等
|
||||
string = re.sub(r"~","",string) #删除~
|
||||
string = re.sub(r"\s*\([\s]{,10}\)",r"\\bracket{20}",string)
|
||||
string = re.sub(r"\s*\\bracket\{20\}\s*\n",r"\\bracket{20}.\n",string)#行末无内容括号的处理
|
||||
|
|
@ -1541,6 +1542,8 @@ def RefineMathpix(raw_string): # 进一步修改mathpix得到的字符串
|
|||
string = RefineChineseComma(string) #改顿号
|
||||
string = RefineInterval(string) #改错误的dollars符号和括号的顺序
|
||||
string = string.replace("$$"," ")
|
||||
string = re.sub(r"\s+\\blank\{50\}",r"\\blank{50}",string)
|
||||
string = re.sub(r"\s+\\bracket\{20\}",r"\\bracket{20}",string)
|
||||
|
||||
|
||||
return string
|
||||
|
|
|
|||
Reference in New Issue