done proxy.py
This commit is contained in:
parent
c205e1b627
commit
de56ecb253
27
proxy.py
27
proxy.py
@ -1,8 +1,12 @@
|
||||
from selenium import webdriver
|
||||
import re
|
||||
import random
|
||||
|
||||
|
||||
# TODO: export path with geckodriver or chromedriver automatically and put driver in project files
|
||||
# TODO: automatically download geckodriver or chromedriver
|
||||
class Proxy():
|
||||
def __init__(self, proxies = None):
|
||||
def __init__(self, proxies=None):
|
||||
"docstring"
|
||||
self.proxies = [] if proxies is None else proxies
|
||||
|
||||
@ -10,21 +14,32 @@ class Proxy():
|
||||
driver = webdriver.Chrome()
|
||||
driver.maximize_window()
|
||||
driver.get('http://www.gatherproxy.com/proxylist/anonymity/?t=elite')
|
||||
full_list_button = driver.find_element_by_xpath('//input[@type="submit" and @value="Show Full List"]')
|
||||
full_list_button = driver.find_element_by_xpath(
|
||||
'//input[@type="submit" and @value="Show Full List"]')
|
||||
full_list_button.click()
|
||||
print(driver.page_source)
|
||||
for match in re.finditer('<a href="#(.*?)" class="inactive" onclick="gp.pageClick', driver.page_source):
|
||||
for match in re.finditer(
|
||||
'<a href="#(.*?)" class="inactive" onclick="gp.pageClick',
|
||||
driver.page_source):
|
||||
pass
|
||||
pages_nr = int(match.group(1))
|
||||
for i in range(2, pages_nr+1):
|
||||
for i in range(1, pages_nr + 1):
|
||||
self._get_proxies(driver.page_source)
|
||||
driver.execute_script('gp.pageClick(' + str(i) + ')')
|
||||
print(i)
|
||||
|
||||
def random(self):
|
||||
return random.choice(self.proxies)
|
||||
|
||||
def _get_proxies(self, html):
|
||||
for match in re.findall("<td><script>document.write\('(.*?)'[\w\W]*?<td><script>document.write\(gp.dep\('(.*?)'", html):
|
||||
proxy = (match[0], str(int(match[1],16)))
|
||||
for match in re.findall(
|
||||
"<td><script>document.write\('(.*?)'[\w\W]*?<td><script>document.write\(gp.dep\('(.*?)'",
|
||||
html):
|
||||
proxy = (match[0], str(int(match[1], 16)))
|
||||
self.proxies.append(proxy)
|
||||
|
||||
|
||||
if __name__ == '__main__':
|
||||
p = Proxy()
|
||||
p.download()
|
||||
print(p.random())
|
||||
|
Loading…
Reference in New Issue
Block a user