{"id":713,"date":"2025-06-21T21:57:51","date_gmt":"2025-06-21T13:57:51","guid":{"rendered":"\/?p=713"},"modified":"2025-06-21T21:58:54","modified_gmt":"2025-06-21T13:58:54","slug":"python%e5%a4%84%e7%90%86%e5%ad%a6%e4%b9%a0%e9%80%9a%e9%a2%98%e7%9b%ae","status":"publish","type":"post","link":"\/?p=713","title":{"rendered":"Python\u5904\u7406\u5b66\u4e60\u901a\u9898\u76ee"},"content":{"rendered":"\n<p>1.\u5bfc\u51fa\u5b66\u4e60\u901a\u9898\u76eehtml\u6587\u4ef6<\/p>\n\n\n\n<p>2.\u6539\u540d<\/p>\n\n\n\n<figure class=\"wp-block-image size-large\"><div class='fancybox-wrapper lazyload-container-unload' data-fancybox='post-images' href='\/wp-content\/uploads\/2025\/06\/Snipaste_2025-06-21_21-58-26-1024x474.png'><img class=\"lazyload lazyload-style-7\" src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"474\" data-original=\"\/wp-content\/uploads\/2025\/06\/Snipaste_2025-06-21_21-58-26-1024x474.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-716\"  sizes=\"(max-width: 1024px) 100vw, 1024px\" \/><\/div><\/figure>\n\n\n\n<p>3.\u8fd0\u884c\u7a0b\u5e8f<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>from bs4 import BeautifulSoup\nimport re\nfrom docx import Document\nfrom pathlib import Path\n\nfile_path = Path(\"output.docx\")\nif file_path.exists():\n    if file_path.is_file():  # \u7cbe\u786e\u5224\u65ad\u6587\u4ef6\n        print(\"\u6e90\u6587\u4ef6\u5b58\u5728\")\n        doc = Document(\"output.docx\")\n    else:\n        print(\"\u8def\u5f84\u5b58\u5728\uff0c\u4f46\u975e\u6587\u4ef6\")\nelse:\n    print(\"\u6e90\u6587\u4ef6\u4e0d\u5b58\u5728\")\n    doc = Document()\n\ndef extract_fill_in_questions(html_content):\n    soup = BeautifulSoup(html_content, 'html.parser')\n    # \u63d0\u53d6\u6240\u6709\u586b\u7a7a\u9898\n    fill_questions = soup.select(\"div.mark_item\")\n    for a in fill_questions:\n        c = a.select(\"div.aiArea\")\n        for d in c:\n            name = d.select(\"h3.mark_name\")\n            letter = d.select(\"ul.mark_letter\")\n            anser = d.select(\".rightAnswerContent\")\n            for i in name:\n                print(i.get_text())\n                # \u5199\u5165\u5230doc\u4e2d\n                doc.add_paragraph(i.get_text())\n            if letter:\n                for j in letter:\n                    print(j.get_text())\n                    doc.add_paragraph(j.get_text())\n            for k in anser:\n                print(k.get_text())\n                doc.add_paragraph(k.get_text())\n            print(\"===========================================================\")\n    doc.save('output.docx')\n\n# \u4f7f\u7528\u793a\u4f8b\nif __name__ == \"__main__\":\n    with open('222.html', 'r', encoding='utf-8') as f:\n        html_content = f.read()\n    extract_fill_in_questions(html_content)\n<\/code><\/pre>\n","protected":false},"excerpt":{"rendered":"<p>1.\u5bfc\u51fa\u5b66\u4e60\u901a\u9898\u76eehtml\u6587\u4ef6 2.\u6539\u540d 3.\u8fd0\u884c\u7a0b\u5e8f<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[18],"tags":[],"class_list":["post-713","post","type-post","status-publish","format-standard","hentry","category-python"],"_links":{"self":[{"href":"\/index.php?rest_route=\/wp\/v2\/posts\/713"}],"collection":[{"href":"\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=713"}],"version-history":[{"count":3,"href":"\/index.php?rest_route=\/wp\/v2\/posts\/713\/revisions"}],"predecessor-version":[{"id":717,"href":"\/index.php?rest_route=\/wp\/v2\/posts\/713\/revisions\/717"}],"wp:attachment":[{"href":"\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=713"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=713"},{"taxonomy":"post_tag","embeddable":true,"href":"\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=713"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}