This repository has been archived on 2024-06-23. You can view files and clone it, but cannot push or open issues or pull requests.
mathdeptv2/工具/批量添加题库字段数据.ipynb

198 lines
11 KiB
Plaintext

{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"题号: 012508 , 字段: ans 中已有该数据: $(-2,0]$\n",
"题号: 012509 , 字段: ans 中已有该数据: $4$\n",
"题号: 012510 , 字段: ans 中已有该数据: $36\\pi$\n",
"题号: 012511 , 字段: ans 中已有该数据: $35$\n",
"题号: 012512 , 字段: ans 中已有该数据: $2$\n",
"题号: 012513 , 字段: ans 中已有该数据: $3$\n",
"题号: 012514 , 字段: ans 中已有该数据: $y=3x-1$\n",
"题号: 012515 , 字段: ans 中已有该数据: $\\dfrac 25$\n",
"题号: 012516 , 字段: ans 中已有该数据: $-1$\n",
"题号: 012517 , 字段: ans 中已有该数据: $\\cos(4x+\\dfrac \\pi 3)$\n",
"题号: 012518 , 字段: ans 中已有该数据: $\\dfrac{49}{24}\\sqrt{6}$\n",
"题号: 012519 , 字段: ans 中已有该数据: \\textcircled{1}\\textcircled{4}\n",
"题号: 012520 , 字段: ans 中已有该数据: A\n",
"题号: 012521 , 字段: ans 中已有该数据: D\n",
"题号: 012522 , 字段: ans 中已有该数据: B\n",
"题号: 012523 , 字段: ans 中已有该数据: C\n",
"题号: 012524 , 字段: ans 中已有该数据: (1) $\\dfrac \\pi 3$; (2) 证明略\n",
"题号: 012525 , 字段: ans 中已有该数据: (1) $a_n=2n$; (2) $6$\n",
"题号: 012526 , 字段: ans 中已有该数据: (1) 证明略; (2) $\\dfrac{2\\sqrt{42}}7$; (3) 存在, $|A_1E|=1$\n",
"题号: 012527 , 字段: ans 中已有该数据: (1) $X\\sim \\begin{pmatrix} 155 & 165 & 175 & 185 & 195 & 205\\\\ 0.22 & 0.27 & 0.25 & 0.15 & 0.1 & 0.01\\end{pmatrix}$, $E[X]=171.7$; (2) $0.0312$; (3) $27.25$\n",
"题号: 012528 , 字段: ans 中已有该数据: (1) 在$(-\\infty,2-\\dfrac{\\sqrt{3a}}3]$上是严格增函数, 在$[2-\\dfrac{\\sqrt{3a}}3,2+\\dfrac{\\sqrt{3a}}3]$上是严格减函数, 在$[2+\\dfrac{\\sqrt{3a}}3,+\\infty)$上是严格增函数; (2) 是定值$6$; (3) $\\{4,12\\}$\n",
"题号: 012676 , 字段: ans 中已有该数据: $(-2,1)$\n",
"题号: 012677 , 字段: ans 中已有该数据: $4$\n",
"题号: 012678 , 字段: ans 中已有该数据: $(-\\infty,2)$\n",
"题号: 012679 , 字段: ans 中已有该数据: $80$\n",
"题号: 012680 , 字段: ans 中已有该数据: $\\dfrac\\pi 2$\n",
"题号: 012681 , 字段: ans 中已有该数据: $-7$\n",
"题号: 012682 , 字段: ans 中已有该数据: $0.36$\n",
"题号: 012683 , 字段: ans 中已有该数据: $12$\n",
"题号: 012684 , 字段: ans 中已有该数据: $\\dfrac{18}{35}$\n",
"题号: 012685 , 字段: ans 中已有该数据: $8$\n",
"题号: 012686 , 字段: ans 中已有该数据: $(-\\pi,-\\dfrac\\pi 2)$和$(0,\\dfrac\\pi 2)$\n",
"题号: 012687 , 字段: ans 中已有该数据: $9$\n",
"题号: 012688 , 字段: ans 中已有该数据: B\n",
"题号: 012689 , 字段: ans 中已有该数据: D\n",
"题号: 012690 , 字段: ans 中已有该数据: B\n",
"题号: 012691 , 字段: ans 中已有该数据: D\n",
"题号: 012692 , 字段: ans 中已有该数据: (1) $a_n=5-n$; (2) $n=4$或$5$\n",
"题号: 012693 , 字段: ans 中已有该数据: (1) 证明略; (2) $\\dfrac 14$\n",
"题号: 012694 , 字段: ans 中已有该数据: (1) $247.4$米; (2) $AB=AD=100\\sqrt{5}$米, $\\angle C=\\dfrac\\pi 2$\n",
"题号: 012695 , 字段: ans 中已有该数据: (1) $F_1(-\\sqrt{3},0)$, $F_2(\\sqrt{3},0)$, $e_1=\\dfrac{\\sqrt{3}}2$; (2) $2$; (3) 证明略\n",
"题号: 012696 , 字段: ans 中已有该数据: (1) $f_1(x)$不是$T(1)$函数, $f_2(x)$是$T(1)$函数; (2) 存在, $b$的取值范围为$(1-\\dfrac 1{\\mathrm{e}},+\\infty)$; (3) 证明略\n",
"题号: 012697 , 字段: ans 中已修改数据: $\\{0,1\\}$\n",
"题号: 012698 , 字段: ans 中已修改数据: $-3$\n",
"题号: 012699 , 字段: ans 中已修改数据: $-3$\n",
"题号: 012700 , 字段: ans 中已修改数据: $14$\n",
"题号: 012701 , 字段: ans 中已修改数据: $\\sqrt{5}$\n",
"题号: 012702 , 字段: ans 中已修改数据: $1$\n",
"题号: 012703 , 字段: ans 中已修改数据: $462$\n",
"题号: 012704 , 字段: ans 中已修改数据: $4.8$\n",
"题号: 012705 , 字段: ans 中已修改数据: $\\dfrac 6{35}$\n",
"题号: 012706 , 字段: ans 中已修改数据: $2$\n",
"题号: 012707 , 字段: ans 中已修改数据: $\\dfrac{\\sqrt{5}-1}2$\n",
"题号: 012708 , 字段: ans 中已修改数据: $200$\n",
"题号: 012709 , 字段: ans 中已修改数据: D\n",
"题号: 012710 , 字段: ans 中已修改数据: B\n",
"题号: 012711 , 字段: ans 中已修改数据: A\n",
"题号: 012712 , 字段: ans 中已修改数据: B\n",
"题号: 012713 , 字段: ans 中已修改数据: (1) 最小正周期为$\\pi$, $f(x)=-\\sin 2x$; (2) $\\dfrac{4-3\\sqrt{3}}{10}$\n",
"题号: 012714 , 字段: ans 中已修改数据: (1) 证明略; (2) 图略, $\\dfrac{3\\sqrt{17}}{17}$\n",
"题号: 012715 , 字段: ans 中已修改数据: (1) 大约$9.46\\times 10^5\\text{hm}^2$; (2) 到$2021$年底这个地区的沙漠面积首次小于$8\\times 10^5\\text{hm}^2$\n",
"题号: 012716 , 字段: ans 中已修改数据: (1) $\\dfrac{x^2}{4}+y^2=1$; (2) $M(\\dfrac 65,\\dfrac 45)$; (3) $(0,1)$\n",
"题号: 012717 , 字段: ans 中已修改数据: (1) $y=x-1$; (2) 存在极小值点$x=\\sqrt{m}$, 无极大值点; (3) $[\\dfrac 12,+\\infty)$\n"
]
}
],
"source": [
"import os,re,json\n",
"\n",
"# --- Data file location ---\n",
"# Records are separated by blank lines; inside a record, list items are separated by single newlines; the first line of the file is the field name.\n",
"datafile = \"文本文件/metadata.txt\"\n",
"# --- End of data file location ---\n",
"\n",
"def trim(string):\n",
"    \"\"\"Return `string` with leading and trailing spaces, tabs and newlines removed.\"\"\"\n",
"    # Only these three characters are stripped; other whitespace such as \"\\r\" is kept.\n",
"    return string.strip(\" \\t\\n\")\n",
"def FloatToInt(string):\n",
"    \"\"\"Parse `string` as a number, returning an int when it lies within 0.01 of a whole number.\n",
"\n",
"    Otherwise the parsed float is returned unchanged.\n",
"    \"\"\"\n",
"    value = float(string)\n",
"    nearest = round(value)\n",
"    return nearest if abs(value - nearest) < 0.01 else value\n",
"\n",
"# Read the whole data file: its first line names the target field, the rest holds the records.\n",
"with open(datafile, \"r\", encoding=\"utf8\") as data_fp:\n",
"    data = data_fp.read()\n",
"pos = data.index(\"\\n\")\n",
"field, appending_data = data[:pos].strip(), data[pos:]\n",
"\n",
"# Load the problem database and the LessonObj.json table (used to validate `objs` entries).\n",
"with open(r\"../题库0.3/Problems.json\", \"r\", encoding=\"utf8\") as problems_fp:\n",
"    pro_dict = json.load(problems_fp)\n",
"with open(r\"../题库0.3/LessonObj.json\", \"r\", encoding=\"utf8\") as objs_fp:\n",
"    obj_dict = json.load(objs_fp)\n",
"\n",
"# NOTE: this list of known fields may need to be updated.\n",
"fields = [\"content\",\"objs\",\"tags\",\"genre\",\"ans\",\"solution\",\"duration\",\"usages\",\"origin\",\"edit\",\"same\",\"related\",\"remark\",\"space\"]\n",
"# String fields whose value is replaced by the new data; every other string field is appended to.\n",
"replace_fields = (\"ans\", \"space\")\n",
"\n",
"if field not in fields:\n",
"    # An unknown field name used to be ignored silently; report it instead.\n",
"    print(\"字段:\",field,\"不在字段列表中.\")\n",
"else:\n",
"    # The type of this field in problem \"000001\" decides how every record is applied.\n",
"    field_type = type(pro_dict[\"000001\"][field])\n",
"    datalist = [record.strip() for record in appending_data.split(\"\\n\\n\") if len(trim(record)) > 0]\n",
"    for record in datalist:\n",
"        # A record is a problem number immediately followed by the data for that problem.\n",
"        id_match = re.match(r\"\\d+\", record)\n",
"        if id_match is None:\n",
"            # Without this guard a record lacking a leading number raised IndexError.\n",
"            print(\"记录缺少题号, 已跳过:\",record)\n",
"            continue\n",
"        # `pro_id` instead of `id`, so the builtin id() is not shadowed in the kernel.\n",
"        pro_id = id_match.group().zfill(6)\n",
"        value = record[id_match.end():].strip()\n",
"        if pro_id not in pro_dict:\n",
"            print(\"题号:\",pro_id,\"不在数据库中.\")\n",
"            # Processing stops at the first unknown problem number (behavior kept unchanged).\n",
"            break\n",
"        current = pro_dict[pro_id][field]\n",
"\n",
"        # String fields\n",
"        if field_type == str:\n",
"            if field in replace_fields:\n",
"                # Replace mode compares whole values: a substring test would skip an update\n",
"                # whose new value happens to be contained in the old one.\n",
"                # Empty data is still reported as already present so it never erases a value.\n",
"                if value == current or value == \"\":\n",
"                    print(\"题号:\",pro_id,\", 字段:\",field,\"中已有该数据:\",value)\n",
"                else:\n",
"                    pro_dict[pro_id][field] = value\n",
"                    print(\"题号:\",pro_id,\", 字段:\",field,\"中已修改数据:\",value)\n",
"            elif value in current:\n",
"                print(\"题号:\",pro_id,\", 字段:\",field,\"中已有该数据:\",value)\n",
"            else:\n",
"                # Append mode: the new data goes on its own line after the existing text.\n",
"                pro_dict[pro_id][field] = trim(current + \"\\n\" + value)\n",
"                print(\"题号:\",pro_id,\", 字段:\",field,\"中已添加数据:\",value)\n",
"\n",
"        # Numeric fields (checked by type, so a non-string \"space\" field is no longer\n",
"        # overwritten with raw text as the unparenthesized `and ... or` condition allowed).\n",
"        elif field_type == int or field_type == float:\n",
"            difference = abs(float(value) - current)\n",
"            if difference < 0.01:\n",
"                print(\"题号:\",pro_id,\", 字段:\",field,\"中已有该数据:\",FloatToInt(value))\n",
"            elif difference >= 0.01:\n",
"                # NaN satisfies neither comparison and therefore leaves the field untouched.\n",
"                pro_dict[pro_id][field] = FloatToInt(value)\n",
"                print(\"题号:\",pro_id,\", 字段:\",field,\"中已修改数据:\",FloatToInt(value))\n",
"\n",
"        # List fields: one entry per line of the record's data\n",
"        elif field_type == list:\n",
"            for cell_data in (d.strip() for d in value.split(\"\\n\")):\n",
"                if cell_data == \"\":\n",
"                    # A record without data would otherwise append an empty entry.\n",
"                    continue\n",
"                if cell_data in current:\n",
"                    print(\"题号:\",pro_id,\", 字段:\",field,\"中已有该数据:\",cell_data)\n",
"                elif field != \"objs\":\n",
"                    current.append(cell_data)\n",
"                    print(\"题号:\",pro_id,\", 字段:\",field,\"中已添加数据:\",cell_data)\n",
"                elif cell_data not in obj_dict and cell_data.upper() != \"KNONE\":\n",
"                    # `objs` entries must be a key of obj_dict or the placeholder KNONE.\n",
"                    print(\"题号:\",pro_id,\", 字段:\",field,\"目标编号有误:\",cell_data)\n",
"                else:\n",
"                    current.append(cell_data.upper())\n",
"                    print(\"题号:\",pro_id,\", 字段:\",field,\"中已添加数据:\",cell_data.upper())\n",
"\n",
"# Serialize before opening the file: opening with \"w\" truncates it, so a json.dumps\n",
"# failure inside the `with` block would leave the database empty.\n",
"serialized = json.dumps(pro_dict,indent=4,ensure_ascii=False)\n",
"with open(r\"../题库0.3/Problems.json\",\"w\",encoding = \"utf8\") as f:\n",
"    f.write(serialized)"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "mathdept",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.15"
},
"orig_nbformat": 4,
"vscode": {
"interpreter": {
"hash": "ff3c292c316ba85de6f1ad75f19c731e79d694e741b6f515ec18f14996fe48dc"
}
}
},
"nbformat": 4,
"nbformat_minor": 2
}