{"id":5909,"date":"2024-09-01T01:38:03","date_gmt":"2024-08-31T17:38:03","guid":{"rendered":"https:\/\/www.aisharenet.com\/?p=5909"},"modified":"2024-09-10T02:03:13","modified_gmt":"2024-09-09T18:03:13","slug":"magic-html","status":"publish","type":"post","link":"https:\/\/www.kdjingpai.com\/de\/magic-html\/","title":{"rendered":"magic-html\uff1a\u4eceHTML\u7f51\u5740\u4e2d\u63d0\u53d6\u4e3b\u4f53\u6570\u636e\uff0c\u8f93\u51fa\u7eaf\u6587\u672c\/markdown"},"content":{"rendered":"<div class=\"el-h2\" data-heading=\"\u7f51\u9875\u6807\u9898\" data-tag-name=\"h2\"><\/div>\n<div class=\"el-h2\" data-heading=\"\u7efc\u5408\u4ecb\u7ecd\" data-tag-name=\"h2\">\n<h2 dir=\"auto\" data-heading=\"\u7efc\u5408\u4ecb\u7ecd\">\u7efc\u5408\u4ecb\u7ecd<\/h2>\n<\/div>\n<div class=\"el-p\" data-tag-name=\"p\">\n<p dir=\"auto\">magic-html\u662f\u4e00\u4e2aPython\u5e93\uff0c\u65e8\u5728\u7b80\u5316\u4eceHTML\u4e2d\u63d0\u53d6\u4e3b\u4f53\u533a\u57df\u5185\u5bb9\u7684\u8fc7\u7a0b\u3002\u65e0\u8bba\u5904\u7406\u7684\u662f\u590d\u6742\u7684HTML\u7ed3\u6784\u8fd8\u662f\u7b80\u5355\u7684\u7f51\u9875\uff0c\u8fd9\u4e2a\u5e93\u90fd\u65e8\u5728\u4e3a\u7528\u6237\u63d0\u4f9b\u4e00\u4e2a\u4fbf\u6377\u9ad8\u6548\u7684\u63a5\u53e3\u3002\u5b83\u652f\u6301\u591a\u6a21\u6001\u62bd\u53d6\uff0c\u652f\u6301\u591a\u79cd\u7248\u9762extractor\uff0c\u5305\u62ec\u6587\u7ae0\u3001\u8bba\u575b\u548c\u5fae\u4fe1\u6587\u7ae0\uff0c\u8fd8\u652f\u6301latex\u516c\u5f0f\u63d0\u53d6\u8f6c\u6362\u3002<\/p>\n<p dir=\"auto\">\n<\/div>\n<div class=\"el-h2\" data-heading=\"\u529f\u80fd\u5217\u8868\" data-tag-name=\"h2\">\n<h2 dir=\"auto\" data-heading=\"\u529f\u80fd\u5217\u8868\">\u529f\u80fd\u5217\u8868<\/h2>\n<\/div>\n<div class=\"el-ul\" data-tag-name=\"ul\">\n<ul class=\"has-list-bullet\">\n<li dir=\"auto\" data-line=\"0\">\u63d0\u53d6HTML\u4e3b\u4f53\u533a\u57df\u5185\u5bb9<\/li>\n<li dir=\"auto\" data-line=\"1\">\u652f\u6301\u591a\u6a21\u6001\u62bd\u53d6<\/li>\n<li dir=\"auto\" data-line=\"2\">\u652f\u6301\u6587\u7ae0\u3001\u8bba\u575b\u548c\u5fae\u4fe1\u6587\u7ae0\u7248\u9762<\/li>\n<li dir=\"auto\" data-line=\"3\">\u652f\u6301latex\u516c\u5f0f\u63d0\u53d6\u8f6c\u6362<\/li>\n<li dir=\"auto\" data-line=\"4\">\u81ea\u5b9a\u4e49\u8f93\u51fa\u7eaf\u6587\u672c\u6216markdown\u683c\u5f0f<\/li>\n<\/ul>\n<\/div>\n<p>&nbsp;<\/p>\n<div class=\"el-h2\" data-heading=\"\u4f7f\u7528\u5e2e\u52a9\" data-tag-name=\"h2\">\n<h2 dir=\"auto\" data-heading=\"\u4f7f\u7528\u5e2e\u52a9\">\u4f7f\u7528\u5e2e\u52a9<\/h2>\n<\/div>\n<div class=\"el-h3\" data-heading=\"\u5b89\u88c5\" data-tag-name=\"h3\">\n<h3 dir=\"auto\" data-heading=\"\u5b89\u88c5\">\u5b89\u88c5<\/h3>\n<\/div>\n<div class=\"el-p\" data-tag-name=\"p\">\n<p dir=\"auto\">\u8981\u5b89\u88c5magic-html\uff0c\u53ef\u4ee5\u4f7f\u7528pip\u547d\u4ee4\uff1a<\/p>\n<\/div>\n<div class=\"el-pre\" data-tag-name=\"pre\">\n<pre class=\"language-bash\" tabindex=\"0\"><code class=\"language-bash is-loaded\">pip <span class=\"token function\">install<\/span> magic-html\r\n<\/code><\/pre>\n<\/div>\n<div class=\"el-h3\" data-heading=\"\u4f7f\u7528\" data-tag-name=\"h3\">\n<h3 dir=\"auto\" data-heading=\"\u4f7f\u7528\">\u4f7f\u7528<\/h3>\n<\/div>\n<div class=\"el-p\" data-tag-name=\"p\">\n<p dir=\"auto\">\u5b89\u88c5\u5b8c\u6210\u540e\uff0c\u53ef\u4ee5\u901a\u8fc7\u4ee5\u4e0b\u4ee3\u7801\u8fdb\u884c\u4f7f\u7528\uff1a<\/p>\n<\/div>\n<div class=\"el-pre\" data-tag-name=\"pre\">\n<pre class=\"language-python\" tabindex=\"0\"><code class=\"language-python is-loaded\"><span class=\"token keyword\">from<\/span> magic_html <span class=\"token keyword\">import<\/span> GeneralExtractor\r\n\r\n<span class=\"token comment\"># \u521d\u59cb\u5316\u63d0\u53d6\u5668<\/span>\r\nextractor <span class=\"token operator\">=<\/span> GeneralExtractor<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span>\r\n\r\n<span class=\"token comment\"># \u793a\u4f8bHTML\u5185\u5bb9<\/span>\r\nhtml <span class=\"token operator\">=<\/span> <span class=\"token triple-quoted-string string\">\"\"\"\r\n&lt;!doctype html&gt;\r\n&lt;html&gt;\r\n&lt;head&gt;\r\n    &lt;title&gt;Example Domain&lt;\/title&gt;\r\n    &lt;meta charset=\"utf-8\" \/&gt;\r\n    &lt;meta http-equiv=\"Content-type\" content=\"text\/html; charset=utf-8\" \/&gt;\r\n    &lt;meta name=\"viewport\" content=\"width=device-width, initial-scale=1\" \/&gt;\r\n&lt;\/head&gt;\r\n&lt;body&gt;\r\n&lt;div&gt;\r\n    &lt;h1&gt;Example Domain&lt;\/h1&gt;\r\n    &lt;p&gt;This domain is for use in illustrative examples in documents. You may use this domain in literature without prior coordination or asking for permission.&lt;\/p&gt;\r\n    &lt;p&gt;&lt;a href=\"https:\/\/www.iana.org\/domains\/example\"&gt;More information...&lt;\/a&gt;&lt;\/p&gt;\r\n&lt;\/div&gt;\r\n&lt;\/body&gt;\r\n&lt;\/html&gt;\r\n\"\"\"<\/span>\r\n\r\n<span class=\"token comment\"># \u63d0\u53d6\u6570\u636e<\/span>\r\ndata <span class=\"token operator\">=<\/span> extractor<span class=\"token punctuation\">.<\/span>extract<span class=\"token punctuation\">(<\/span>html<span class=\"token punctuation\">)<\/span>\r\n<span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span>data<span class=\"token punctuation\">)<\/span>\r\n<\/code><\/pre>\n<\/div>\n<div class=\"el-h3\" data-heading=\"\u529f\u80fd\u64cd\u4f5c\u6d41\u7a0b\" data-tag-name=\"h3\">\n<h3 dir=\"auto\" data-heading=\"\u529f\u80fd\u64cd\u4f5c\u6d41\u7a0b\">\u529f\u80fd\u64cd\u4f5c\u6d41\u7a0b<\/h3>\n<\/div>\n<div class=\"el-ol\" data-tag-name=\"ol\">\n<ol>\n<li dir=\"auto\" data-line=\"0\"><strong>\u521d\u59cb\u5316\u63d0\u53d6\u5668<\/strong>\uff1a\u9996\u5148\u9700\u8981\u5bfc\u5165magic-html\u5e93\u5e76\u521d\u59cb\u5316\u63d0\u53d6\u5668\u3002<\/li>\n<li dir=\"auto\" data-line=\"1\"><strong>\u51c6\u5907HTML\u5185\u5bb9<\/strong>\uff1a\u5c06\u9700\u8981\u63d0\u53d6\u5185\u5bb9\u7684HTML\u4ee3\u7801\u51c6\u5907\u597d\uff0c\u53ef\u4ee5\u662f\u5b57\u7b26\u4e32\u5f62\u5f0f\u3002<\/li>\n<li dir=\"auto\" data-line=\"2\"><strong>\u8c03\u7528\u63d0\u53d6\u65b9\u6cd5<\/strong>\uff1a\u4f7f\u7528<code>extract<\/code>\u65b9\u6cd5\u63d0\u53d6\u4e3b\u4f53\u5185\u5bb9\u3002\u53ef\u4ee5\u6839\u636e\u9700\u8981\u6307\u5b9a\u4e0d\u540c\u7684HTML\u7c7b\u578b\uff0c\u5982\u6587\u7ae0\u3001\u8bba\u575b\u6216\u5fae\u4fe1\u6587\u7ae0\u3002<\/li>\n<li dir=\"auto\" data-line=\"3\"><strong>\u8f93\u51fa\u7ed3\u679c<\/strong>\uff1a\u63d0\u53d6\u7ed3\u679c\u53ef\u4ee5\u662f\u7eaf\u6587\u672c\u6216markdown\u683c\u5f0f\uff0c\u5177\u4f53\u53d6\u51b3\u4e8e\u7528\u6237\u7684\u9700\u6c42\u3002<\/li>\n<\/ol>\n<\/div>\n<div class=\"el-h3\" data-heading=\"\u793a\u4f8b\" data-tag-name=\"h3\">\n<h3 dir=\"auto\" data-heading=\"\u793a\u4f8b\">\u793a\u4f8b<\/h3>\n<\/div>\n<div class=\"el-p\" data-tag-name=\"p\">\n<p dir=\"auto\">\u4ee5\u4e0b\u662f\u4e00\u4e2a\u5b8c\u6574\u7684\u793a\u4f8b\uff0c\u5c55\u793a\u5982\u4f55\u4ece\u4e00\u4e2a\u7b80\u5355\u7684HTML\u9875\u9762\u4e2d\u63d0\u53d6\u4e3b\u4f53\u5185\u5bb9\uff1a<\/p>\n<\/div>\n<div class=\"el-pre\" data-tag-name=\"pre\">\n<pre class=\"language-python\" tabindex=\"0\"><code class=\"language-python is-loaded\"><span class=\"token keyword\">from<\/span> magic_html <span class=\"token keyword\">import<\/span> GeneralExtractor\r\n\r\n<span class=\"token comment\"># \u521d\u59cb\u5316\u63d0\u53d6\u5668<\/span>\r\nextractor <span class=\"token operator\">=<\/span> GeneralExtractor<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span>\r\n\r\n<span class=\"token comment\"># \u793a\u4f8bHTML\u5185\u5bb9<\/span>\r\nhtml <span class=\"token operator\">=<\/span> <span class=\"token triple-quoted-string string\">\"\"\"\r\n&lt;!doctype html&gt;\r\n&lt;html&gt;\r\n&lt;head&gt;\r\n    &lt;title&gt;Example Domain&lt;\/title&gt;\r\n    &lt;meta charset=\"utf-8\" \/&gt;\r\n    &lt;meta http-equiv=\"Content-type\" content=\"text\/html; charset=utf-8\" \/&gt;\r\n    &lt;meta name=\"viewport\" content=\"width=device-width, initial-scale=1\" \/&gt;\r\n&lt;\/head&gt;\r\n&lt;body&gt;\r\n&lt;div&gt;\r\n    &lt;h1&gt;Example Domain&lt;\/h1&gt;\r\n    &lt;p&gt;This domain is for use in illustrative examples in documents. You may use this domain in literature without prior coordination or asking for permission.&lt;\/p&gt;\r\n    &lt;p&gt;&lt;a href=\"https:\/\/www.iana.org\/domains\/example\"&gt;More information...&lt;\/a&gt;&lt;\/p&gt;\r\n&lt;\/div&gt;\r\n&lt;\/body&gt;\r\n&lt;\/html&gt;\r\n\"\"\"<\/span>\r\n\r\n<span class=\"token comment\"># \u63d0\u53d6\u6570\u636e<\/span>\r\ndata <span class=\"token operator\">=<\/span> extractor<span class=\"token punctuation\">.<\/span>extract<span class=\"token punctuation\">(<\/span>html<span class=\"token punctuation\">)<\/span>\r\n<span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span>data<span class=\"token punctuation\">)<\/span><\/code><\/pre>\n<\/div>\n","protected":false},"excerpt":{"rendered":"<p>\u7efc\u5408\u4ecb\u7ecd magic-html\u662f\u4e00\u4e2aPython\u5e93\uff0c\u65e8\u5728\u7b80\u5316\u4eceHTML\u4e2d\u63d0\u53d6\u4e3b\u4f53\u533a\u57df\u5185\u5bb9\u7684\u8fc7\u7a0b\u3002\u65e0\u8bba\u5904\u7406\u7684\u662f\u590d\u6742\u7684HTML\u7ed3\u6784\u8fd8\u662f\u7b80\u5355\u7684\u7f51\u9875\uff0c\u8fd9\u4e2a\u5e93\u90fd\u65e8\u5728\u4e3a\u7528\u6237\u63d0\u4f9b\u4e00\u4e2a\u4fbf\u6377\u9ad8\u6548\u7684\u63a5\u53e3\u3002\u5b83\u652f\u6301\u591a\u6a21\u6001\u62bd\u53d6\uff0c\u652f\u6301\u591a\u79cd\u7248\u9762extractor\uff0c\u5305\u62ec\u6587&#8230;<\/p>\n","protected":false},"author":1,"featured_media":60951,"comment_status":"open","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[20],"tags":[230],"class_list":["post-5909","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-tool","tag-aikaiyuanxiangmu"],"_links":{"self":[{"href":"https:\/\/www.kdjingpai.com\/de\/wp-json\/wp\/v2\/posts\/5909","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.kdjingpai.com\/de\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.kdjingpai.com\/de\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.kdjingpai.com\/de\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/www.kdjingpai.com\/de\/wp-json\/wp\/v2\/comments?post=5909"}],"version-history":[{"count":0,"href":"https:\/\/www.kdjingpai.com\/de\/wp-json\/wp\/v2\/posts\/5909\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.kdjingpai.com\/de\/wp-json\/wp\/v2\/media\/60951"}],"wp:attachment":[{"href":"https:\/\/www.kdjingpai.com\/de\/wp-json\/wp\/v2\/media?parent=5909"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.kdjingpai.com\/de\/wp-json\/wp\/v2\/categories?post=5909"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.kdjingpai.com\/de\/wp-json\/wp\/v2\/tags?post=5909"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}