Source code for scylla.providers.cool_proxy_provider
import re
from requests_html import HTML
from scylla.database import ProxyIP
from .base_provider import BaseProvider
[docs]class CoolProxyProvider(BaseProvider):
[docs] def parse(self, html: HTML) -> [ProxyIP]:
ip_list: [ProxyIP] = []
for ip_row in html.find('table tr'):
ip_element = ip_row.find('td:nth-child(1)', first=True)
port_element = ip_row.find('td:nth-child(2)', first=True)
if ip_element and port_element:
p = ProxyIP(ip=re.sub(r'document\.write\(.+\)', '', ip_element.text), port=port_element.text)
ip_list.append(p)
return ip_list
[docs] def urls(self) -> [str]:
return [
'https://www.cool-proxy.net/proxies/http_proxy_list/country_code:/port:/anonymous:1',
'https://www.cool-proxy.net/proxies/http_proxy_list/country_code:/port:/anonymous:1/page:2',
'https://www.cool-proxy.net/proxies/http_proxy_list/country_code:/port:/anonymous:1/page:3',
]
[docs] @staticmethod
def should_render_js() -> bool:
return True