From 0a17218181ea9c32577b33ead501336fa998dbf8 Mon Sep 17 00:00:00 2001 From: nubotz Date: Fri, 11 Nov 2016 17:23:21 +0800 Subject: [PATCH 1/2] Update crawl_proxy_servers.py It seems the proxy website added one more div with class="table-container". --- crawl_proxy_servers.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/crawl_proxy_servers.py b/crawl_proxy_servers.py index 909f2e7..27572e2 100644 --- a/crawl_proxy_servers.py +++ b/crawl_proxy_servers.py @@ -28,7 +28,7 @@ def crawl_proxy_servers(): if page.status_code == requests.codes.ok: bsobj = BeautifulSoup(page.text, 'html.parser') try: - proxy_table = bsobj.find('div', {'class': 'table-container'}) + proxy_table = bsobj.findAll('div', {'class': 'table-container'})[1] proxy_body = proxy_table.find('table').find('tbody') for tr in proxy_body.findAll('tr'): proxy_info = tr.findAll('td') From bda46debebfd4c947d435161dd5a136f5719b8d1 Mon Sep 17 00:00:00 2001 From: nubotz Date: Sun, 26 Feb 2017 12:24:05 +0800 Subject: [PATCH 2/2] Update crawl_proxy_servers.py --- crawl_proxy_servers.py | 1 - 1 file changed, 1 deletion(-) diff --git a/crawl_proxy_servers.py b/crawl_proxy_servers.py index 27572e2..55f74a1 100644 --- a/crawl_proxy_servers.py +++ b/crawl_proxy_servers.py @@ -47,7 +47,6 @@ def crawl_proxy_servers(): def test_proxy_server(proxy): proxies = {'http': proxy} - try: response = requests.get(test_url, proxies=proxies, timeout=10) if response.status_code == requests.codes.ok: