{"id":1117777,"date":"2025-01-08T18:29:15","date_gmt":"2025-01-08T10:29:15","guid":{"rendered":"https:\/\/docs.pingcode.com\/ask\/ask-ask\/1117777.html"},"modified":"2025-01-08T18:29:17","modified_gmt":"2025-01-08T10:29:17","slug":"python%e5%a6%82%e4%bd%95%e5%a4%9a%e7%ba%bf%e7%a8%8b%e7%88%ac%e8%99%ab%e4%b8%8d%e9%87%8d%e5%a4%8d%e6%95%b0%e6%8d%ae","status":"publish","type":"post","link":"https:\/\/docs.pingcode.com\/ask\/1117777.html","title":{"rendered":"python\u5982\u4f55\u591a\u7ebf\u7a0b\u722c\u866b\u4e0d\u91cd\u590d\u6570\u636e"},"content":{"rendered":"<p style=\"text-align:center;\" ><img decoding=\"async\" src=\"https:\/\/cdn-kb.worktile.com\/kb\/wp-content\/uploads\/2024\/04\/25081546\/a00008a1-6084-4c9e-81ac-8d8ea7387b67.webp\" alt=\"python\u5982\u4f55\u591a\u7ebf\u7a0b\u722c\u866b\u4e0d\u91cd\u590d\u6570\u636e\" \/><\/p>\n<p><p> \u5728Python\u4e2d\u4f7f\u7528\u591a\u7ebf\u7a0b\u722c\u866b\u4ee5\u907f\u514d\u91cd\u590d\u6570\u636e\u7684\u65b9\u6cd5\u5305\u62ec\uff1a<strong>\u4f7f\u7528\u7ebf\u7a0b\u9501\u3001\u4f7f\u7528\u96c6\u5408\u53bb\u91cd\u3001\u4f7f\u7528\u53bb\u91cd\u961f\u5217<\/strong>\u3002\u5176\u4e2d<strong>\u4f7f\u7528\u7ebf\u7a0b\u9501<\/strong>\u662f\u6700\u91cd\u8981\u7684\uff0c\u5b83\u53ef\u4ee5\u786e\u4fdd\u5728\u591a\u7ebf\u7a0b\u73af\u5883\u4e0b\u5bf9\u5171\u4eab\u8d44\u6e90\u7684\u8bbf\u95ee\u662f\u5b89\u5168\u7684\u3002<\/p>\n<\/p>\n<p><h3>\u4e00\u3001\u4f7f\u7528\u7ebf\u7a0b\u9501<\/h3>\n<\/p>\n<p><p>\u7ebf\u7a0b\u9501\uff08Thread 
Lock\uff09\u662f\u591a\u7ebf\u7a0b\u7f16\u7a0b\u4e2d\u5e38\u7528\u7684\u540c\u6b65\u539f\u8bed\u3002\u5b83\u80fd\u786e\u4fdd\u5728\u4efb\u610f\u65f6\u523b\u53ea\u6709\u4e00\u4e2a\u7ebf\u7a0b\u80fd\u8bbf\u95ee\u5171\u4eab\u8d44\u6e90\uff0c\u4ece\u800c\u907f\u514d\u6570\u636e\u7ade\u4e89\u548c\u6570\u636e\u91cd\u590d\u3002\u4ee5\u4e0b\u662f\u4f7f\u7528\u7ebf\u7a0b\u9501\u6765\u907f\u514d\u6570\u636e\u91cd\u590d\u7684\u5b9e\u73b0\u6b65\u9aa4\uff1a<\/p>\n<\/p>\n<p><h4>1.1 \u521b\u5efa\u7ebf\u7a0b\u9501<\/h4>\n<\/p>\n<p><p>\u9996\u5148\uff0c\u5728\u4e3b\u7a0b\u5e8f\u4e2d\u521b\u5efa\u4e00\u4e2a\u7ebf\u7a0b\u9501\u3002Python\u7684<code>threading<\/code>\u6a21\u5757\u63d0\u4f9b\u4e86<code>Lock<\/code>\u7c7b\u6765\u5b9e\u73b0\u7ebf\u7a0b\u9501\uff1a<\/p>\n<\/p>\n<p><pre><code class=\"language-python\">import threading<\/p>\n<p>lock = threading.Lock()<\/p>\n<p><\/code><\/pre>\n<\/p>\n<p><h4>1.2 \u5728\u5173\u952e\u4ee3\u7801\u6bb5\u4e2d\u4f7f\u7528\u7ebf\u7a0b\u9501<\/h4>\n<\/p>\n<p><p>\u5728\u9700\u8981\u8bbf\u95ee\u5171\u4eab\u8d44\u6e90\u7684\u4ee3\u7801\u6bb5\u524d\u540e\u4f7f\u7528<code>lock.acquire()<\/code>\u548c<code>lock.release()<\/code>\u6765\u4e0a\u9501\u548c\u89e3\u9501\uff1b\u4e5f\u53ef\u4ee5\u4f7f\u7528<code>with lock:<\/code>\u4e0a\u4e0b\u6587\u7ba1\u7406\u5668\u81ea\u52a8\u4e0a\u9501\u548c\u89e3\u9501\u3002\u4ee5\u4e0b\u662f\u4e00\u4e2a\u4f7f\u7528\u4e0a\u4e0b\u6587\u7ba1\u7406\u5668\u7684\u793a\u4f8b\uff1a<\/p>\n<\/p>\n<p><pre><code class=\"language-python\">import threading<\/p>\n<p>import requests<\/p>\n<p>urls = [&quot;http:\/\/example.com\/page1&quot;, &quot;http:\/\/example.com\/page2&quot;]  # \u793a\u4f8bURL\u5217\u8868<\/p>\n<p>visited_urls = set()  # \u7528\u4e8e\u5b58\u50a8\u5df2\u8bbf\u95ee\u7684URL<\/p>\n<p>lock = threading.Lock()<\/p>\n<p>def fetch_url(url):<\/p>\n<p>    global visited_urls<\/p>\n<p>    with lock:  # \u4f7f\u7528\u4e0a\u4e0b\u6587\u7ba1\u7406\u5668\u81ea\u52a8\u4e0a\u9501\u548c\u89e3\u9501<\/p>\n<p>        if url in visited_urls:<\/p>\n<p>            return<\/p>\n<p>        visited_urls.add(url)<\/p>\n<p>    response = requests.get(url)<\/p>\n<p>    print(f&quot;Fetched {url}: 
{response.status_code}&quot;)<\/p>\n<p>threads = []<\/p>\n<p>for url in urls:<\/p>\n<p>    t = threading.Thread(target=fetch_url, args=(url,))<\/p>\n<p>    threads.append(t)<\/p>\n<p>    t.start()<\/p>\n<p>for t in threads:<\/p>\n<p>    t.join()<\/p>\n<p><\/code><\/pre>\n<\/p>\n<p><p>\u5728\u8fd9\u4e2a\u793a\u4f8b\u4e2d\uff0c<code>visited_urls<\/code>\u96c6\u5408\u7528\u4e8e\u5b58\u50a8\u5df2\u8bbf\u95ee\u7684URL\u3002<code>lock<\/code>\u7528\u4e8e\u5728\u8bbf\u95ee\u548c\u4fee\u6539<code>visited_urls<\/code>\u65f6\u786e\u4fdd\u7ebf\u7a0b\u5b89\u5168\u3002<\/p>\n<\/p>\n<p><h3>\u4e8c\u3001\u4f7f\u7528\u96c6\u5408\u53bb\u91cd<\/h3>\n<\/p>\n<p><p>\u96c6\u5408\uff08Set\uff09\u662f\u4e00\u79cd\u65e0\u5e8f\u4e14\u4e0d\u91cd\u590d\u7684\u6570\u636e\u7ed3\u6784\uff0c\u4f7f\u7528\u96c6\u5408\u5b58\u50a8\u5df2\u8bbf\u95ee\u7684URL\u53ef\u4ee5\u81ea\u52a8\u5b9e\u73b0\u53bb\u91cd\u3002<\/p>\n<\/p>\n<p><h4>2.1 \u521b\u5efa\u96c6\u5408<\/h4>\n<\/p>\n<p><p>\u5728\u4e3b\u7a0b\u5e8f\u4e2d\u521b\u5efa\u4e00\u4e2a\u96c6\u5408\uff0c\u7528\u4e8e\u5b58\u50a8\u5df2\u8bbf\u95ee\u7684URL\uff1a<\/p>\n<\/p>\n<p><pre><code class=\"language-python\">visited_urls = set()<\/p>\n<p><\/code><\/pre>\n<\/p>\n<p><h4>2.2 \u5728\u8bbf\u95ee\u524d\u68c0\u67e5\u96c6\u5408<\/h4>\n<\/p>\n<p><p>\u5728\u722c\u53d6\u6bcf\u4e2aURL\u4e4b\u524d\uff0c\u68c0\u67e5\u8be5URL\u662f\u5426\u5df2\u5728\u96c6\u5408\u4e2d\u3002\u5982\u679c\u4e0d\u5728\uff0c\u5219\u8fdb\u884c\u722c\u53d6\uff0c\u5e76\u5c06\u5176\u6dfb\u52a0\u5230\u96c6\u5408\u4e2d\uff1a<\/p>\n<\/p>\n<p><pre><code class=\"language-python\">def fetch_url(url):<\/p>\n<p>    global visited_urls<\/p>\n<p>    if url in visited_urls:<\/p>\n<p>        return<\/p>\n<p>    visited_urls.add(url)<\/p>\n<p>    response = requests.get(url)<\/p>\n<p>    print(f&quot;Fetched {url}: 
{response.status_code}&quot;)<\/p>\n<p><\/code><\/pre>\n<\/p>\n<p><p>\u7ed3\u5408\u7ebf\u7a0b\u9501\u548c\u96c6\u5408\uff0c\u53ef\u4ee5\u786e\u4fdd\u591a\u7ebf\u7a0b\u73af\u5883\u4e0b\u7684\u6570\u636e\u4e0d\u91cd\u590d\u3002<\/p>\n<\/p>\n<p><h3>\u4e09\u3001\u4f7f\u7528\u53bb\u91cd\u961f\u5217<\/h3>\n<\/p>\n<p><p>\u961f\u5217\uff08Queue\uff09\u662f\u4e00\u79cd\u7ebf\u7a0b\u5b89\u5168\u7684\u6570\u636e\u7ed3\u6784\uff0c\u53ef\u4ee5\u7528\u4e8e\u5b58\u50a8\u5f85\u722c\u53d6\u7684URL\u3002\u901a\u8fc7\u4f7f\u7528\u53bb\u91cd\u961f\u5217\uff0c\u53ef\u4ee5\u907f\u514d\u591a\u7ebf\u7a0b\u73af\u5883\u4e0b\u7684\u91cd\u590d\u722c\u53d6\u3002<\/p>\n<\/p>\n<p><h4>3.1 \u4f7f\u7528\u961f\u5217\u5b58\u50a8\u5f85\u722c\u53d6URL<\/h4>\n<\/p>\n<p><p>\u4f7f\u7528<code>queue.Queue<\/code>\u521b\u5efa\u4e00\u4e2a\u961f\u5217\uff0c\u5e76\u5c06\u5f85\u722c\u53d6\u7684URL\u653e\u5165\u961f\u5217\u4e2d\uff1a<\/p>\n<\/p>\n<p><pre><code class=\"language-python\">import queue<\/p>\n<p>url_queue = queue.Queue()<\/p>\n<p>for url in urls:<\/p>\n<p>    url_queue.put(url)<\/p>\n<p><\/code><\/pre>\n<\/p>\n<p><h4>3.2 \u4ece\u961f\u5217\u4e2d\u53d6\u51faURL\u8fdb\u884c\u722c\u53d6<\/h4>\n<\/p>\n<p><p>\u5728\u6bcf\u4e2a\u7ebf\u7a0b\u4e2d\uff0c\u4ece\u961f\u5217\u4e2d\u53d6\u51faURL\u8fdb\u884c\u722c\u53d6\uff1a<\/p>\n<\/p>\n<p><pre><code class=\"language-python\">def fetch_url():<\/p>\n<p>    while not url_queue.empty():<\/p>\n<p>        url = url_queue.get()<\/p>\n<p>        if url in visited_urls:<\/p>\n<p>            continue<\/p>\n<p>        visited_urls.add(url)<\/p>\n<p>        response = requests.get(url)<\/p>\n<p>        print(f&quot;Fetched {url}: {response.status_code}&quot;)<\/p>\n<p>        
url_queue.task_done()<\/p>\n<p><\/code><\/pre>\n<\/p>\n<p><h3>\u56db\u3001\u5b8c\u6574\u793a\u4f8b<\/h3>\n<\/p>\n<p><p>\u4ee5\u4e0b\u662f\u4e00\u4e2a\u5b8c\u6574\u7684\u793a\u4f8b\uff0c\u5c55\u793a\u4e86\u5982\u4f55\u4f7f\u7528\u591a\u7ebf\u7a0b\u722c\u866b\u5e76\u907f\u514d\u91cd\u590d\u6570\u636e\uff1a<\/p>\n<\/p>\n<p><pre><code class=\"language-python\">import threading<\/p>\n<p>import queue<\/p>\n<p>import requests<\/p>\n<p>urls = [&quot;http:\/\/example.com\/page1&quot;, &quot;http:\/\/example.com\/page2&quot;]  # \u793a\u4f8bURL\u5217\u8868<\/p>\n<p>visited_urls = set()  # \u7528\u4e8e\u5b58\u50a8\u5df2\u8bbf\u95ee\u7684URL<\/p>\n<p>url_queue = queue.Queue()  # \u7528\u4e8e\u5b58\u50a8\u5f85\u722c\u53d6\u7684URL<\/p>\n<p>lock = threading.Lock()<\/p>\n<p>for url in urls:<\/p>\n<p>    url_queue.put(url)<\/p>\n<p>def fetch_url():<\/p>\n<p>    while not url_queue.empty():<\/p>\n<p>        url = url_queue.get()<\/p>\n<p>        with lock:<\/p>\n<p>            if url in visited_urls:<\/p>\n<p>                url_queue.task_done()<\/p>\n<p>                continue<\/p>\n<p>            visited_urls.add(url)<\/p>\n<p>        response = requests.get(url)<\/p>\n<p>        print(f&quot;Fetched {url}: {response.status_code}&quot;)<\/p>\n<p>        url_queue.task_done()<\/p>\n<p>threads = []<\/p>\n<p>for _ in range(5):  # \u521b\u5efa5\u4e2a\u7ebf\u7a0b<\/p>\n<p>    t = threading.Thread(target=fetch_url)<\/p>\n<p>    threads.append(t)<\/p>\n<p>    t.start()<\/p>\n<p>for t in threads:<\/p>\n<p>    
t.join()<\/p>\n<p><\/code><\/pre>\n<\/p>\n<p><p>\u5728\u8fd9\u4e2a\u793a\u4f8b\u4e2d\uff0c\u6211\u4eec\u521b\u5efa\u4e86\u4e00\u4e2a\u7ebf\u7a0b\u9501\u3001\u4e00\u4e2a\u96c6\u5408\u548c\u4e00\u4e2a\u961f\u5217\uff0c\u5e76\u4f7f\u7528\u591a\u7ebf\u7a0b\u6765\u722c\u53d6URL\u3002\u901a\u8fc7\u5728\u5173\u952e\u4ee3\u7801\u6bb5\u4e2d\u4f7f\u7528\u7ebf\u7a0b\u9501\uff0c\u786e\u4fdd\u4e86\u591a\u7ebf\u7a0b\u73af\u5883\u4e0b\u7684\u7ebf\u7a0b\u5b89\u5168\uff0c\u4ece\u800c\u907f\u514d\u4e86\u6570\u636e\u7684\u91cd\u590d\u722c\u53d6\u3002<\/p>\n<\/p>\n<p><h3>\u4e94\u3001\u603b\u7ed3<\/h3>\n<\/p>\n<p><p>\u5728Python\u4e2d\u4f7f\u7528\u591a\u7ebf\u7a0b\u722c\u866b\u4ee5\u907f\u514d\u91cd\u590d\u6570\u636e\u7684\u65b9\u6cd5\u4e3b\u8981\u5305\u62ec\u4f7f\u7528\u7ebf\u7a0b\u9501\u3001\u4f7f\u7528\u96c6\u5408\u53bb\u91cd\u548c\u4f7f\u7528\u53bb\u91cd\u961f\u5217\u3002\u7ebf\u7a0b\u9501\u662f\u786e\u4fdd\u591a\u7ebf\u7a0b\u73af\u5883\u4e0b\u7ebf\u7a0b\u5b89\u5168\u7684\u5173\u952e\uff0c\u901a\u8fc7\u7ed3\u5408\u4f7f\u7528\u96c6\u5408\u548c\u961f\u5217\uff0c\u53ef\u4ee5\u6709\u6548\u5730\u907f\u514d\u6570\u636e\u91cd\u590d\u3002\u5e0c\u671b\u672c\u6587\u5bf9\u60a8\u7406\u89e3\u548c\u5b9e\u73b0\u591a\u7ebf\u7a0b\u722c\u866b\u6709\u6240\u5e2e\u52a9\u3002<\/p>\n<\/p>\n<h2><strong>\u76f8\u5173\u95ee\u7b54FAQs\uff1a<\/strong><\/h2>\n<p> <strong>\u5982\u4f55\u786e\u4fdd\u5728Python\u591a\u7ebf\u7a0b\u722c\u866b\u4e2d\u4e0d\u91cd\u590d\u6293\u53d6\u6570\u636e\uff1f<\/strong><br 
\/>\u4e3a\u4e86\u907f\u514d\u91cd\u590d\u6293\u53d6\uff0c\u9996\u5148\u8981\u5efa\u7acb\u4e00\u4e2a\u6570\u636e\u5b58\u50a8\u673a\u5236\uff0c\u53ef\u4ee5\u4f7f\u7528\u96c6\u5408\u6216\u6570\u636e\u5e93\u6765\u8bb0\u5f55\u5df2\u6293\u53d6\u7684URL\u3002\u5728\u6bcf\u6b21\u53d1\u9001\u8bf7\u6c42\u4e4b\u524d\uff0c\u68c0\u67e5\u8be5URL\u662f\u5426\u5df2\u7ecf\u5728\u8bb0\u5f55\u4e2d\u3002\u5982\u679c\u5df2\u5b58\u5728\uff0c\u5219\u8df3\u8fc7\u6293\u53d6\uff1b\u5982\u679c\u4e0d\u5b58\u5728\uff0c\u5219\u8fdb\u884c\u6293\u53d6\u5e76\u5c06\u8be5URL\u6dfb\u52a0\u5230\u8bb0\u5f55\u4e2d\u3002\u5728\u591a\u7ebf\u7a0b\u73af\u5883\u4e0b\uff0c\u68c0\u67e5\u548c\u6dfb\u52a0\u9700\u8981\u4f7f\u7528\u540c\u4e00\u4e2a\u7ebf\u7a0b\u9501\u6765\u540c\u6b65\uff0c\u4ece\u800c\u786e\u4fdd\u6bcf\u4e2aURL\u53ea\u6709\u4e00\u4e2a\u7ebf\u7a0b\u8fdb\u884c\u6293\u53d6\u3002\u8fd9\u6837\u53ef\u4ee5\u6709\u6548\u51cf\u5c11\u91cd\u590d\u6570\u636e\u7684\u4ea7\u751f\u3002<\/p>\n<p><strong>\u4f7f\u7528\u54ea\u4e9b\u5e93\u53ef\u4ee5\u5b9e\u73b0Python\u591a\u7ebf\u7a0b\u722c\u866b\uff1f<\/strong><br \/>Python\u63d0\u4f9b\u4e86\u591a\u4e2a\u5e93\u6765\u5b9e\u73b0\u591a\u7ebf\u7a0b\u722c\u866b\uff0c\u6bd4\u5982<code>threading<\/code>\u548c<code>concurrent.futures<\/code>\u3002<code>threading<\/code>\u5e93\u53ef\u4ee5\u521b\u5efa\u591a\u4e2a\u7ebf\u7a0b\u6765\u5e76\u53d1\u5904\u7406\u8bf7\u6c42\uff0c\u800c<code>concurrent.futures<\/code>\u63d0\u4f9b\u4e86\u66f4\u9ad8\u7ea7\u7684\u63a5\u53e3\uff0c\u53ef\u4ee5\u66f4\u65b9\u4fbf\u5730\u7ba1\u7406\u7ebf\u7a0b\u6c60\u548c\u4efb\u52a1\u3002\u6b64\u5916\uff0c<code>requests<\/code>\u5e93\u901a\u5e38\u4e0e\u8fd9\u4e9b\u591a\u7ebf\u7a0b\u5e93\u7ed3\u5408\u4f7f\u7528\uff0c\u4fbf\u4e8e\u8fdb\u884c\u7f51\u7edc\u8bf7\u6c42\u3002<\/p>\n<p><strong>\u5728\u591a\u7ebf\u7a0b\u722c\u866b\u4e2d\u5982\u4f55\u7ba1\u7406\u8bf7\u6c42\u9891\u7387\u4ee5\u9632\u6b62\u88ab\u5c01\u7981\uff1f<\/strong><br 
\/>\u5408\u7406\u63a7\u5236\u8bf7\u6c42\u9891\u7387\u662f\u975e\u5e38\u91cd\u8981\u7684\uff0c\u53ef\u4ee5\u901a\u8fc7\u8bbe\u7f6e\u5ef6\u8fdf\u6765\u964d\u4f4e\u8bf7\u6c42\u7684\u9891\u7387\u3002\u4f8b\u5982\uff0c\u5728\u6bcf\u6b21\u53d1\u9001\u8bf7\u6c42\u540e\u53ef\u4ee5\u4f7f\u7528<code>time.sleep()<\/code>\u65b9\u6cd5\u6765\u6682\u505c\u4e00\u6bb5\u65f6\u95f4\u3002\u6b64\u5916\uff0c\u968f\u673a\u5316\u8bf7\u6c42\u95f4\u9694\u4e5f\u662f\u4e00\u79cd\u6709\u6548\u7684\u7b56\u7565\uff0c\u8fd9\u6837\u53ef\u4ee5\u51cf\u5c11\u88ab\u76ee\u6807\u7f51\u7ad9\u68c0\u6d4b\u5230\u7684\u98ce\u9669\u3002\u4f7f\u7528\u4ee3\u7406IP\u4e5f\u662f\u4e00\u79cd\u5e38\u89c1\u7684\u9632\u5c01\u7981\u63aa\u65bd\uff0c\u5c24\u5176\u662f\u5728\u8fdb\u884c\u5927\u89c4\u6a21\u6293\u53d6\u65f6\u3002<\/p>\n","protected":false},"excerpt":{"rendered":"\u5728Python\u4e2d\u4f7f\u7528\u591a\u7ebf\u7a0b\u722c\u866b\u4ee5\u907f\u514d\u91cd\u590d\u6570\u636e\u7684\u65b9\u6cd5\u5305\u62ec\uff1a\u4f7f\u7528\u7ebf\u7a0b\u9501\u3001\u4f7f\u7528\u96c6\u5408\u53bb\u91cd\u3001\u4f7f\u7528\u53bb\u91cd\u961f\u5217\u3002\u7ebf\u7a0b\u9501\u3001\u96c6\u5408\u53bb 
[&hellip;]","protected":false},"author":3,"featured_media":1117783,"comment_status":"closed","ping_status":"","sticky":false,"template":"","format":"standard","meta":{"_acf_changed":false,"footnotes":""},"categories":[37],"tags":[],"acf":[],"_links":{"self":[{"href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/posts\/1117777"}],"collection":[{"href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/users\/3"}],"replies":[{"embeddable":true,"href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/comments?post=1117777"}],"version-history":[{"count":"1","href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/posts\/1117777\/revisions"}],"predecessor-version":[{"id":1117786,"href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/posts\/1117777\/revisions\/1117786"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/media\/1117783"}],"wp:attachment":[{"href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/media?parent=1117777"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/categories?post=1117777"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/docs.pingcode.com\/wp-json\/wp\/v2\/tags?post=1117777"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}