Mirror of https://github.com/simon987/vanwanet_scrape.git (synced 2025-04-19 18:36:47 +00:00)
Add logging
This commit is contained in:
parent
ec03e5e412
commit
1c86a781e3
2
setup.py
2
setup.py
@@ -2,7 +2,7 @@ from setuptools import setup
|
|||||||
|
|
||||||
setup(
|
setup(
|
||||||
name="vanwanet_scrape",
|
name="vanwanet_scrape",
|
||||||
version="1.0",
|
version="1.1",
|
||||||
description="VanwaTech DDoS protection bypass",
|
description="VanwaTech DDoS protection bypass",
|
||||||
author="simon987",
|
author="simon987",
|
||||||
author_email="me@simon987.net",
|
author_email="me@simon987.net",
|
||||||
|
@@ -15,10 +15,11 @@ SUB_PATTRN = re.compile(r'document\.cookie="(.+)";location.+$')
|
|||||||
|
|
||||||
class Scraper:
|
class Scraper:
|
||||||
|
|
||||||
def __init__(self, domains: list, headers=None, proxies=None):
|
def __init__(self, domains: list, headers=None, proxies=None, logger=None):
|
||||||
self._session = requests.session()
|
self._session = requests.session()
|
||||||
self._domains = domains
|
self._domains = domains
|
||||||
self._session.cookies = CookieJar()
|
self._session.cookies = CookieJar()
|
||||||
|
self.logger = logger
|
||||||
|
|
||||||
if headers:
|
if headers:
|
||||||
self._session.headers = headers
|
self._session.headers = headers
|
||||||
@@ -32,10 +33,13 @@ class Scraper:
|
|||||||
r = self._get(url, **kwargs)
|
r = self._get(url, **kwargs)
|
||||||
|
|
||||||
if Scraper._is_challenge_page(r):
|
if Scraper._is_challenge_page(r):
|
||||||
cookie = Scraper._execute_challenge(Scraper._transform_js(Scraper._get_js(r)))
|
cookie_str = Scraper._execute_challenge(Scraper._transform_js(Scraper._get_js(r)))
|
||||||
|
|
||||||
|
if self.logger:
|
||||||
|
self.logger.debug("Executed challenge, got %s" % (cookie_from_string(cookie_str, ""),))
|
||||||
|
|
||||||
for domain in self._domains:
|
for domain in self._domains:
|
||||||
self._session.cookies.set_cookie(cookie_from_string(cookie, domain))
|
self._session.cookies.set_cookie(cookie_from_string(cookie_str, domain))
|
||||||
|
|
||||||
return self.get(url, **kwargs)
|
return self.get(url, **kwargs)
|
||||||
return r
|
return r
|
||||||
|
Loading…
x
Reference in New Issue
Block a user