This repository has been archived on 2024-06-23. You can view files and clone it, but cannot push or open issues or pull requests.
mathdeptv2/工具/批量添加题库字段数据.ipynb

198 lines
11 KiB
Plaintext

{
"cells": [
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"题号: 012613 , 字段: ans 中已有该数据: $\\{2,4\\}$\n",
"题号: 012614 , 字段: ans 中已有该数据: $(1,2)$\n",
"题号: 012615 , 字段: ans 中已有该数据: $\\dfrac{\\sqrt{2}}2$\n",
"题号: 012616 , 字段: ans 中已有该数据: $3$\n",
"题号: 012617 , 字段: ans 中已有该数据: $3$\n",
"题号: 012618 , 字段: ans 中已有该数据: \\textcircled{1}\\textcircled{4}\n",
"题号: 012619 , 字段: ans 中已有该数据: $180$\n",
"题号: 012620 , 字段: ans 中已有该数据: $4$\n",
"题号: 012621 , 字段: ans 中已有该数据: $\\dfrac 52$\n",
"题号: 012622 , 字段: ans 中已有该数据: $\\dfrac\\pi 4$\n",
"题号: 012623 , 字段: ans 中已有该数据: $\\dfrac{8\\sqrt{2}\\pi}3$\n",
"题号: 012624 , 字段: ans 中已有该数据: $\\dfrac{8\\sqrt{3}}3$\n",
"题号: 012625 , 字段: ans 中已有该数据: A\n",
"题号: 012626 , 字段: ans 中已有该数据: C\n",
"题号: 012627 , 字段: ans 中已有该数据: D\n",
"题号: 012628 , 字段: ans 中已有该数据: C\n",
"题号: 012629 , 字段: ans 中已有该数据: (1) $b_n=3^{n-1}$; (2) $-8$\n",
"题号: 012630 , 字段: ans 中已有该数据: (1) $\\dfrac \\pi 4$; (2) $1$\n",
"题号: 012631 , 字段: ans 中已有该数据: (1) 证明略; (2) 证明略; (3) $\\dfrac\\pi 4$\n",
"题号: 012632 , 字段: ans 中已有该数据: (1) $\\sqrt{2}$; (2) $y=x+1$; (3) 过定点$(-3,0)$和$(1,0)$\n",
"题号: 012633 , 字段: ans 中已有该数据: (1) $y=x-1$; (2) 单调减区间为$(\\dfrac 12 1)$; 极小值为$-2$; (3) 证明略\n",
"题号: 012571 , 字段: ans 中已有该数据: $\\{1\\}$\n",
"题号: 012572 , 字段: ans 中已有该数据: $-1$\n",
"题号: 012573 , 字段: ans 中已有该数据: $\\dfrac\\pi 6$\n",
"题号: 012574 , 字段: ans 中已有该数据: $2$\n",
"题号: 012575 , 字段: ans 中已有该数据: $16\\pi$\n",
"题号: 012576 , 字段: ans 中已有该数据: $2800$, $31$\n",
"题号: 012577 , 字段: ans 中已有该数据: $2$\n",
"题号: 012578 , 字段: ans 中已有该数据: $(-\\infty,1)\\cup (1,3]$\n",
"题号: 012579 , 字段: ans 中已有该数据: $5$\n",
"题号: 012580 , 字段: ans 中已有该数据: $[\\dfrac 32,2]$\n",
"题号: 012581 , 字段: ans 中已有该数据: $(\\dfrac 72,0,\\dfrac 72)$\n",
"题号: 012582 , 字段: ans 中已有该数据: $\\dfrac{\\sqrt{3}}{20}v$\n",
"题号: 012583 , 字段: ans 中已有该数据: A\n",
"题号: 012584 , 字段: ans 中已有该数据: D\n",
"题号: 012585 , 字段: ans 中已有该数据: C\n",
"题号: 012586 , 字段: ans 中已有该数据: C\n",
"题号: 012587 , 字段: ans 中已有该数据: (1) 证明略; (2) $\\dfrac{3\\sqrt{22}}{11}$\n",
"题号: 012588 , 字段: ans 中已有该数据: (1) $\\dfrac 12$; (2) $a_n=\\dfrac{18}{2n+1}$\n",
"题号: 012589 , 字段: ans 中已有该数据: (1) 例如: 非通勤时段的车辆使用情况; 油价和电价的变化; 工作单位能否提供免费充电; 电动车的国家减免政策的变化; 车辆的外观、内饰与品牌效应; 车牌费用等; (2) 解答略\n",
"题号: 012590 , 字段: ans 中已有该数据: (1) $\\dfrac{x^2}4+\\dfrac{y^2}3=1$($y\\le 0$); (2) $P(-\\dfrac 32,\\dfrac{\\sqrt{3}}2)$, $Q(\\dfrac 32, \\dfrac{\\sqrt{3}}2)$; (3) $[\\sqrt{3}-1,\\sqrt{2}+1]$\n",
"题号: 012591 , 字段: ans 中已有该数据: (1) 导数为$y'=\\dfrac{1-\\ln x}{x^2}$, 单调性证明略; (2) 判断$89^{99}>99^{89}$, 证明略, 推广可以是:``对于实数$a,b$, 若$\\mathrm{e}<a<b$, 则$a^b>b^a$; (3) 证明略\n",
"题号: 010965 , 字段: ans 中已修改数据: $[0,2]$\n",
"题号: 010966 , 字段: ans 中已修改数据: $(-\\infty,0)$\n",
"题号: 030023 , 字段: ans 中已修改数据: $\\dfrac{3n^2-5n}2$\n",
"题号: 010968 , 字段: ans 中已修改数据: $\\dfrac{8\\pi}3$\n",
"题号: 010969 , 字段: ans 中已修改数据: $2(x+2)-(y-1)=0$\n",
"题号: 010970 , 字段: ans 中已修改数据: $\\dfrac 32$\n",
"题号: 030025 , 字段: ans 中已修改数据: $[0,\\dfrac 34]$\n",
"题号: 010972 , 字段: ans 中已修改数据: $25$\n",
"题号: 030024 , 字段: ans 中已修改数据: $\\dfrac 23(\\dfrac 1{4^n}-1)$\n",
"题号: 010974 , 字段: ans 中已修改数据: $[1,+\\infty)$\n",
"题号: 010975 , 字段: ans 中已修改数据: $\\sqrt{3}$\n",
"题号: 010976 , 字段: ans 中已修改数据: $3-\\sqrt{3}$\n",
"题号: 010977 , 字段: ans 中已修改数据: B\n",
"题号: 002745 , 字段: ans 中已修改数据: C\n",
"题号: 010979 , 字段: ans 中已修改数据: C\n",
"题号: 010980 , 字段: ans 中已修改数据: B\n",
"题号: 010981 , 字段: ans 中已修改数据: (1) $\\dfrac 23$; (2) $\\arctan {2\\sqrt{5}}5$\n",
"题号: 010982 , 字段: ans 中已修改数据: (1) $\\log_2 3$; (2) $a=2b\\ne 0$\n",
"题号: 010983 , 字段: ans 中已修改数据: (1) $\\sqrt{7}$千米; (2) 有$\\dfrac{8-\\sqrt{15}}7$小时, 两人不能通话\n",
"题号: 010984 , 字段: ans 中已修改数据: (1) $y^2=4\\sqrt{5} x$或$y^2=-4\\sqrt{5} x$; (2) $M$的坐标为$(0,0)$或$(-\\dfrac{4\\sqrt{5}}5,0)$; (3) 证明略\n",
"题号: 010985 , 字段: ans 中已修改数据: (1) $\\{-6,-3,-2,-1,0,1,2,3,4\\}$; (2) 证明略; (3) 元素个数为$\\dfrac 12 n(n+1)$; 元素之和为$\\dfrac{n+1}2(3^{n+1}-3)$\n"
]
}
],
"source": [
"import os,re,json\n",
"\n",
"\"\"\"---明确数据文件位置---\"\"\"\n",
"datafile = \"文本文件/metadata.txt\"\n",
"# 双回车分隔,记录内单回车分隔列表,首行为字段名\n",
"\"\"\"---文件位置结束---\"\"\"\n",
"\n",
"def trim(string):\n",
" string = re.sub(r\"^[ \\t\\n]*\",\"\",string)\n",
" string = re.sub(r\"[ \\t\\n]*$\",\"\",string)\n",
" return string\n",
"def FloatToInt(string):\n",
" f = float(string)\n",
" if abs(f-round(f))<0.01:\n",
" f = round(f)\n",
" return f\n",
"\n",
"with open(datafile,\"r\",encoding=\"utf8\") as f:\n",
" data = f.read()\n",
"pos = data.index(\"\\n\")\n",
"field = data[:pos].strip()\n",
"appending_data = data[pos:]\n",
"\n",
"with open(r\"../题库0.3/Problems.json\",\"r\",encoding = \"utf8\") as f:\n",
" database = f.read()\n",
"pro_dict = json.loads(database)\n",
"with open(r\"../题库0.3/LessonObj.json\",\"r\",encoding = \"utf8\") as f:\n",
" database = f.read()\n",
"obj_dict = json.loads(database)\n",
"\n",
"#该字段列表可能需要更新\n",
"fields = [\"content\",\"objs\",\"tags\",\"genre\",\"ans\",\"solution\",\"duration\",\"usages\",\"origin\",\"edit\",\"same\",\"related\",\"remark\",\"space\"]\n",
"\n",
"if field in fields:\n",
" field_type = type(pro_dict[\"000001\"][field])\n",
" datalist = [record.strip() for record in appending_data.split(\"\\n\\n\") if len(trim(record)) > 0]\n",
" for record in datalist:\n",
" id = re.findall(r\"^[\\d]{1,}\",record)[0]\n",
" data = record[len(id):].strip()\n",
" id = id.zfill(6)\n",
" if not id in pro_dict:\n",
" print(\"题号:\",id,\"不在数据库中.\")\n",
" break\n",
" \n",
" #字符串类型字段添加数据\n",
" elif field_type == str and data in pro_dict[id][field]:\n",
" print(\"题号:\",id,\", 字段:\",field,\"中已有该数据:\",data)\n",
" elif field_type == str and not data in pro_dict[id][field] and not field == \"ans\" and not field == \"space\":\n",
" origin_data = pro_dict[id][field]\n",
" new_data = trim(origin_data + \"\\n\" + data)\n",
" pro_dict[id][field] = new_data\n",
" print(\"题号:\",id,\", 字段:\",field,\"中已添加数据:\",data)\n",
" elif field_type == str and not data in pro_dict[id][field] and field == \"ans\" or field == \"space\":\n",
" pro_dict[id][field] = data\n",
" print(\"题号:\",id,\", 字段:\",field,\"中已修改数据:\",data)\n",
" \n",
" #数值类型字段添加数据\n",
" elif (field_type == int or field_type == float) and abs(float(data) - pro_dict[id][field])<0.01:\n",
" print(\"题号:\",id,\", 字段:\",field,\"中已有该数据:\",FloatToInt(data))\n",
" elif (field_type == int or field_type == float) and abs(float(data) - pro_dict[id][field])>=0.01:\n",
" pro_dict[id][field] = FloatToInt(data)\n",
" print(\"题号:\",id,\", 字段:\",field,\"中已修改数据:\",FloatToInt(data))\n",
" \n",
" #列表类型字段添加数据\n",
" elif field_type == list:\n",
" cell_data_list = [d.strip() for d in data.split(\"\\n\")]\n",
" for cell_data in cell_data_list:\n",
" if cell_data in pro_dict[id][field]:\n",
" print(\"题号:\",id,\", 字段:\",field,\"中已有该数据:\",cell_data)\n",
" elif not field == \"objs\":\n",
" pro_dict[id][field].append(cell_data)\n",
" print(\"题号:\",id,\", 字段:\",field,\"中已添加数据:\",cell_data)\n",
" else:\n",
" if not cell_data in obj_dict and not cell_data.upper() == \"KNONE\":\n",
" print(\"题号:\",id,\", 字段:\",field,\"目标编号有误:\",cell_data)\n",
" else:\n",
" pro_dict[id][field].append(cell_data.upper())\n",
" print(\"题号:\",id,\", 字段:\",field,\"中已添加数据:\",cell_data.upper())\n",
"\n",
"with open(r\"../题库0.3/Problems.json\",\"w\",encoding = \"utf8\") as f:\n",
" f.write(json.dumps(pro_dict,indent=4,ensure_ascii=False))"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "mathdept",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.15"
},
"orig_nbformat": 4,
"vscode": {
"interpreter": {
"hash": "ff3c292c316ba85de6f1ad75f19c731e79d694e741b6f515ec18f14996fe48dc"
}
}
},
"nbformat": 4,
"nbformat_minor": 2
}