{"id":771,"date":"2025-01-05T22:59:44","date_gmt":"2025-01-05T14:59:44","guid":{"rendered":"https:\/\/www.laixuexila.com\/?p=771"},"modified":"2025-01-11T16:12:06","modified_gmt":"2025-01-11T08:12:06","slug":"%e5%a6%82%e4%bd%95%e7%ae%80%e5%8c%96python-%e6%b5%8f%e8%a7%88%e5%99%a8%e8%87%aa%e5%8a%a8%e5%8c%96%e7%9a%84%e6%a8%a1%e5%bc%8f%ef%bc%9f","status":"publish","type":"post","link":"https:\/\/www.laixuexila.com\/index.php\/2025\/01\/05\/%e5%a6%82%e4%bd%95%e7%ae%80%e5%8c%96python-%e6%b5%8f%e8%a7%88%e5%99%a8%e8%87%aa%e5%8a%a8%e5%8c%96%e7%9a%84%e6%a8%a1%e5%bc%8f%ef%bc%9f\/","title":{"rendered":"\u5982\u4f55\u7b80\u5316 Python \u6d4f\u89c8\u5668\u81ea\u52a8\u5316\u64cd\u4f5c\uff1f\u5b9e\u7528\u6280\u5de7\u4e0e\u65b9\u6cd5"},"content":{"rendered":"\n<blockquote class=\"wp-block-quote is-layout-flow wp-block-quote-is-layout-flow\">\n<p class=\"wp-block-paragraph\">Python \u6d4f\u89c8\u5668\u81ea\u52a8\u5316\u901a\u5e38\u7528\u4e8e\u7f51\u9875\u6d4b\u8bd5\u3001\u722c\u53d6\u6570\u636e\u6216\u4e0e\u7f51\u9875\u4ea4\u4e92\u3002\u7b80\u5316\u6d4f\u89c8\u5668\u81ea\u52a8\u5316\u7684\u6a21\u5f0f\u53ef\u4ee5\u4f7f\u5f00\u53d1\u8fc7\u7a0b\u66f4\u9ad8\u6548\u3001\u66f4\u6613\u4e8e\u7ef4\u62a4\u3002\u4e0b\u9762\u662f Python \u6d4f\u89c8\u5668\u81ea\u52a8\u5316\u7684\u4e09\u79cd\u5e38\u89c1\u7b80\u5316\u6a21\u5f0f\uff1a<\/p>\n<\/blockquote>\n\n\n\n<hr class=\"wp-block-separator has-alpha-channel-opacity\"\/>\n\n\n\n<h3 class=\"wp-block-heading\">1. <strong>\u4f7f\u7528 Selenium + WebDriver<\/strong><\/h3>\n\n\n\n<p class=\"wp-block-paragraph\"><strong>Selenium<\/strong> \u662f\u4e00\u4e2a\u5f3a\u5927\u7684\u6d4f\u89c8\u5668\u81ea\u52a8\u5316\u5de5\u5177\uff0c\u5e7f\u6cdb\u7528\u4e8e\u81ea\u52a8\u5316\u7f51\u9875\u7684\u64cd\u4f5c\u3002\u5b83\u652f\u6301\u591a\u79cd\u6d4f\u89c8\u5668\uff08\u5982 Chrome\u3001Firefox \u7b49\uff09\uff0c\u5e76\u63d0\u4f9b\u4e86\u4e00\u4e2a\u7edf\u4e00\u7684\u63a5\u53e3\u6765\u4e0e\u7f51\u9875\u8fdb\u884c\u4ea4\u4e92\u3002<code>Selenium WebDriver<\/code> \u662f\u4e00\u79cd\u63a7\u5236\u6d4f\u89c8\u5668\u7684\u5de5\u5177\uff0c\u53ef\u4ee5\u6a21\u62df\u4eba\u7c7b\u5728\u6d4f\u89c8\u5668\u4e2d\u7684\u64cd\u4f5c\u3002<\/p>\n\n\n\n<h4 class=\"wp-block-heading\">\u5b89\u88c5 Selenium\uff1a<\/h4>\n\n\n\n<pre class=\"wp-block-code\"><code>pip install selenium<\/code><\/pre>\n\n\n\n<h4 class=\"wp-block-heading\">\u7b80\u5355\u7684 Web \u81ea\u52a8\u5316\u6d41\u7a0b\uff1a<\/h4>\n\n\n\n<pre class=\"wp-block-code\"><code>from selenium import webdriver\nfrom selenium.webdriver.common.keys import Keys\n\n# \u8bbe\u7f6e\u6d4f\u89c8\u5668\u9a71\u52a8\ndriver = webdriver.Chrome(executable_path='\/path\/to\/chromedriver')\n\n# \u6253\u5f00\u7f51\u9875\ndriver.get(\"https:\/\/www.example.com\")\n\n# \u67e5\u627e\u5143\u7d20\u5e76\u6267\u884c\u64cd\u4f5c\nsearch_box = driver.find_element_by_name(\"q\")\nsearch_box.send_keys(\"Python\")\nsearch_box.send_keys(Keys.RETURN)\n\n# \u83b7\u53d6\u7f51\u9875\u6807\u9898\nprint(driver.title)\n\n# \u5173\u95ed\u6d4f\u89c8\u5668\ndriver.quit()<\/code><\/pre>\n\n\n\n<h4 class=\"wp-block-heading\">\u7b80\u5316\u4f7f\u7528\uff1a<\/h4>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>\u6d4f\u89c8\u5668\u542f\u52a8\u4e0e\u5173\u95ed<\/strong>\uff1a\u901a\u8fc7 <code>webdriver.Chrome()<\/code> \u542f\u52a8\uff0c\u4f7f\u7528 <code>quit()<\/code> \u6216 <code>close()<\/code> \u5173\u95ed\u6d4f\u89c8\u5668\u3002<\/li>\n\n\n\n<li><strong>\u5143\u7d20\u5b9a\u4f4d<\/strong>\uff1a\u53ef\u4ee5\u901a\u8fc7 <code>find_element_by_name()<\/code>, <code>find_element_by_xpath()<\/code> \u7b49\u65b9\u6cd5\u67e5\u627e\u5143\u7d20\u3002<\/li>\n<\/ul>\n\n\n\n<hr class=\"wp-block-separator has-alpha-channel-opacity\"\/>\n\n\n\n<h3 class=\"wp-block-heading\">2. <strong>\u4f7f\u7528 Playwright<\/strong><\/h3>\n\n\n\n<p class=\"wp-block-paragraph\"><code>Playwright<\/code> \u662f\u4e00\u4e2a\u73b0\u4ee3\u5316\u7684\u6d4f\u89c8\u5668\u81ea\u52a8\u5316\u5e93\uff0c\u5b83\u7531 Microsoft \u63d0\u4f9b\uff0c\u652f\u6301 Chromium\u3001Firefox \u548c WebKit\u3002\u4e0e Selenium \u76f8\u6bd4\uff0cPlaywright \u5177\u6709\u66f4\u5feb\u7684\u6027\u80fd\u548c\u66f4\u591a\u7684\u529f\u80fd\uff0c\u9002\u7528\u4e8e\u73b0\u4ee3 Web \u5e94\u7528\u7684\u81ea\u52a8\u5316\u3002<\/p>\n\n\n\n<h4 class=\"wp-block-heading\">\u5b89\u88c5 Playwright\uff1a<\/h4>\n\n\n\n<pre class=\"wp-block-code\"><code>pip install playwright\npython -m playwright install<\/code><\/pre>\n\n\n\n<h4 class=\"wp-block-heading\">\u7b80\u5355\u7684 Web \u81ea\u52a8\u5316\u6d41\u7a0b\uff1a<\/h4>\n\n\n\n<pre class=\"wp-block-code\"><code>from playwright.sync_api import sync_playwright\n\nwith sync_playwright() as p:\n    # \u542f\u52a8\u6d4f\u89c8\u5668\n    browser = p.chromium.launch(headless=False)  # headless=False \u663e\u793a\u6d4f\u89c8\u5668\u754c\u9762\n    page = browser.new_page()\n\n    # \u6253\u5f00\u7f51\u9875\n    page.goto(\"https:\/\/www.example.com\")\n\n    # \u67e5\u627e\u5e76\u64cd\u4f5c\u5143\u7d20\n    search_box = page.locator(\"input&#91;name='q']\")\n    search_box.fill(\"Python\")\n    search_box.press(\"Enter\")\n\n    # \u83b7\u53d6\u9875\u9762\u6807\u9898\n    print(page.title())\n\n    # \u5173\u95ed\u6d4f\u89c8\u5668\n    browser.close()<\/code><\/pre>\n\n\n\n<h4 class=\"wp-block-heading\">\u7b80\u5316\u4f7f\u7528\uff1a<\/h4>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>\u6d4f\u89c8\u5668\u542f\u52a8\u4e0e\u5173\u95ed<\/strong>\uff1a\u901a\u8fc7 <code>p.chromium.launch()<\/code> \u542f\u52a8\uff0c\u4f7f\u7528 <code>browser.close()<\/code> \u5173\u95ed\u3002<\/li>\n\n\n\n<li><strong>\u5143\u7d20\u64cd\u4f5c<\/strong>\uff1a\u4f7f\u7528 <code>locator()<\/code> \u5b9a\u4f4d\u5143\u7d20\uff0c\u652f\u6301\u66f4\u591a\u7c7b\u578b\u7684\u5143\u7d20\u4ea4\u4e92\uff08\u5982 <code>fill()<\/code>, <code>press()<\/code>\uff09\u3002<\/li>\n<\/ul>\n\n\n\n<hr class=\"wp-block-separator has-alpha-channel-opacity\"\/>\n\n\n\n<h3 class=\"wp-block-heading\">3. <strong>\u4f7f\u7528 Pyppeteer<\/strong><\/h3>\n\n\n\n<p class=\"wp-block-paragraph\"><code>Pyppeteer<\/code> \u662f Python \u7248\u7684 <code>Puppeteer<\/code>\uff0c\u7528\u4e8e\u901a\u8fc7 Chromium \u6d4f\u89c8\u5668\u6267\u884c\u81ea\u52a8\u5316\u4efb\u52a1\u3002<code>Pyppeteer<\/code> \u5177\u6709\u8f83\u4f4e\u7684\u5b66\u4e60\u66f2\u7ebf\uff0c\u9002\u5408\u5feb\u901f\u542f\u52a8\u548c\u6267\u884c\u6d4f\u89c8\u5668\u64cd\u4f5c\uff0c\u7279\u522b\u662f\u5728\u722c\u866b\u548c\u81ea\u52a8\u5316\u6d4b\u8bd5\u573a\u666f\u4e2d\u5e94\u7528\u5e7f\u6cdb\u3002<\/p>\n\n\n\n<h4 class=\"wp-block-heading\">\u5b89\u88c5 Pyppeteer\uff1a<\/h4>\n\n\n\n<pre class=\"wp-block-code\"><code>pip install pyppeteer<\/code><\/pre>\n\n\n\n<h4 class=\"wp-block-heading\">\u7b80\u5355\u7684 Web \u81ea\u52a8\u5316\u6d41\u7a0b\uff1a<\/h4>\n\n\n\n<pre class=\"wp-block-code\"><code>import asyncio\nfrom pyppeteer import launch\n\nasync def main():\n    # \u542f\u52a8\u6d4f\u89c8\u5668\n    browser = await launch(headless=False)\n    page = await browser.newPage()\n\n    # \u6253\u5f00\u7f51\u9875\n    await page.goto(\"https:\/\/www.example.com\")\n\n    # \u67e5\u627e\u5e76\u64cd\u4f5c\u5143\u7d20\n    await page.type('input&#91;name=\"q\"]', \"Python\")\n    await page.keyboard.press(\"Enter\")\n\n    # \u83b7\u53d6\u9875\u9762\u6807\u9898\n    title = await page.title()\n    print(title)\n\n    # \u5173\u95ed\u6d4f\u89c8\u5668\n    await browser.close()\n\n# \u8fd0\u884c\u5f02\u6b65\u4efb\u52a1\nasyncio.get_event_loop().run_until_complete(main())<\/code><\/pre>\n\n\n\n<h4 class=\"wp-block-heading\">\u7b80\u5316\u4f7f\u7528\uff1a<\/h4>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>\u6d4f\u89c8\u5668\u542f\u52a8\u4e0e\u5173\u95ed<\/strong>\uff1a\u901a\u8fc7 <code>launch()<\/code> \u542f\u52a8\uff0c\u4f7f\u7528 <code>browser.close()<\/code> \u5173\u95ed\u3002<\/li>\n\n\n\n<li><strong>\u5f02\u6b65\u64cd\u4f5c<\/strong>\uff1a<code>Pyppeteer<\/code> \u4f7f\u7528 <code>async\/await<\/code> \u8fdb\u884c\u5f02\u6b65\u64cd\u4f5c\uff0c\u66f4\u9002\u5408\u9700\u8981\u9ad8\u5e76\u53d1\u5904\u7406\u7684\u573a\u666f\u3002<\/li>\n<\/ul>\n\n\n\n<hr class=\"wp-block-separator has-alpha-channel-opacity\"\/>\n\n\n\n<h3 class=\"wp-block-heading\">4. <strong>\u5bf9\u6bd4\u4e0e\u603b\u7ed3<\/strong><\/h3>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th>\u7279\u6027<\/th><th>Selenium<\/th><th>Playwright<\/th><th>Pyppeteer<\/th><\/tr><\/thead><tbody><tr><td><strong>\u652f\u6301\u7684\u6d4f\u89c8\u5668<\/strong><\/td><td>Chrome, Firefox, Safari, Edge<\/td><td>Chromium, Firefox, WebKit<\/td><td>Chromium<\/td><\/tr><tr><td><strong>\u5f02\u6b65\u652f\u6301<\/strong><\/td><td>\u6709\uff08\u901a\u8fc7 WebDriverWait \u7b49\uff09<\/td><td>\u5b8c\u5168\u652f\u6301\uff08\u9ed8\u8ba4\u5f02\u6b65\uff09<\/td><td>\u5b8c\u5168\u652f\u6301\uff08\u5f02\u6b65\u6a21\u5f0f\uff09<\/td><\/tr><tr><td><strong>\u6027\u80fd<\/strong><\/td><td>\u8f83\u6162\uff0c\u9002\u5408\u901a\u7528\u573a\u666f<\/td><td>\u8f83\u5feb\uff0c\u9002\u5408\u73b0\u4ee3 Web<\/td><td>\u5feb\uff0c\u9002\u5408\u722c\u866b\u573a\u666f<\/td><\/tr><tr><td><strong>API \u8bbe\u8ba1<\/strong><\/td><td>\u7b80\u5355\uff0c\u4f46\u67d0\u4e9b\u64cd\u4f5c\u590d\u6742<\/td><td>\u66f4\u73b0\u4ee3\u5316\u4e14\u6613\u7528<\/td><td>\u7b80\u5355\uff0c\u7c7b\u4f3c Puppeteer<\/td><\/tr><tr><td><strong>\u529f\u80fd\u652f\u6301<\/strong><\/td><td>\u5f3a\u5927\u7684\u529f\u80fd\uff0c\u4f46\u6709\u4e9b\u64cd\u4f5c\u8f83\u7e41\u7410<\/td><td>\u5f3a\u5927\u7684\u73b0\u4ee3 Web \u652f\u6301<\/td><td>\u805a\u7126\u4e8e\u6d4f\u89c8\u5668\u81ea\u52a8\u5316\uff0c\u529f\u80fd\u8f83\u5355\u4e00<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<hr class=\"wp-block-separator has-alpha-channel-opacity\"\/>\n\n\n\n<h3 class=\"wp-block-heading\">5. <strong>\u9009\u62e9\u5408\u9002\u7684\u5de5\u5177<\/strong><\/h3>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>Selenium<\/strong> \u9002\u5408\u4e8e\u529f\u80fd\u5168\u9762\u3001\u9700\u8981\u652f\u6301\u591a\u79cd\u6d4f\u89c8\u5668\u7684\u5e94\u7528\u573a\u666f\uff0c\u7279\u522b\u662f\u9700\u8981\u517c\u5bb9\u4f20\u7edf\u6d4f\u89c8\u5668\u7684\u6d4b\u8bd5\u65f6\u3002<\/li>\n\n\n\n<li><strong>Playwright<\/strong> \u9002\u7528\u4e8e\u5bf9\u6027\u80fd\u548c\u73b0\u4ee3\u6d4f\u89c8\u5668\u652f\u6301\u8981\u6c42\u8f83\u9ad8\u7684\u9879\u76ee\uff0c\u5c24\u5176\u662f\u9700\u8981\u591a\u6d4f\u89c8\u5668\u6d4b\u8bd5\u65f6\u3002<\/li>\n\n\n\n<li><strong>Pyppeteer<\/strong> \u662f <code>Puppeteer<\/code> \u7684 Python \u5b9e\u73b0\uff0c\u9002\u7528\u4e8e\u9700\u8981\u9ad8\u6548\u722c\u866b\u548c Web \u81ea\u52a8\u5316\u7684\u573a\u666f\uff0c\u7279\u522b\u662f\u5728\u5904\u7406\u73b0\u4ee3 Web \u5e94\u7528\u65f6\u8868\u73b0\u4f18\u79c0\u3002<\/li>\n<\/ul>\n\n\n\n<h3 class=\"wp-block-heading\">\u603b\u7ed3\uff1a<\/h3>\n\n\n\n<p class=\"wp-block-paragraph\">\u901a\u8fc7\u8fd9\u4e9b\u5de5\u5177\uff0c\u4f60\u53ef\u4ee5\u66f4\u7b80\u5355\u548c\u9ad8\u6548\u5730\u5b9e\u73b0 Python \u6d4f\u89c8\u5668\u81ea\u52a8\u5316\u3002\u9009\u62e9\u5408\u9002\u7684\u81ea\u52a8\u5316\u5de5\u5177\u80fd\u591f\u663e\u8457\u63d0\u5347\u5f00\u53d1\u6548\u7387\u3002<\/p>\n","protected":false},"excerpt":{"rendered":"<p>Python \u6d4f\u89c8\u5668\u81ea\u52a8\u5316\u901a\u5e38\u7528\u4e8e\u7f51\u9875\u6d4b\u8bd5\u3001\u722c\u53d6\u6570\u636e\u6216\u4e0e\u7f51\u9875\u4ea4\u4e92\u3002\u7b80\u5316\u6d4f\u89c8\u5668\u81ea\u52a8\u5316\u7684\u6a21\u5f0f\u53ef\u4ee5\u4f7f\u5f00\u53d1\u8fc7\u7a0b\u66f4\u9ad8\u6548\u3001 [&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[54],"tags":[],"class_list":["post-771","post","type-post","status-publish","format-standard","hentry","category-python"],"_links":{"self":[{"href":"https:\/\/www.laixuexila.com\/index.php\/wp-json\/wp\/v2\/posts\/771","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.laixuexila.com\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.laixuexila.com\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.laixuexila.com\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/www.laixuexila.com\/index.php\/wp-json\/wp\/v2\/comments?post=771"}],"version-history":[{"count":2,"href":"https:\/\/www.laixuexila.com\/index.php\/wp-json\/wp\/v2\/posts\/771\/revisions"}],"predecessor-version":[{"id":897,"href":"https:\/\/www.laixuexila.com\/index.php\/wp-json\/wp\/v2\/posts\/771\/revisions\/897"}],"wp:attachment":[{"href":"https:\/\/www.laixuexila.com\/index.php\/wp-json\/wp\/v2\/media?parent=771"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.laixuexila.com\/index.php\/wp-json\/wp\/v2\/categories?post=771"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.laixuexila.com\/index.php\/wp-json\/wp\/v2\/tags?post=771"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}