kopia lustrzana https://github.com/dgtlmoon/changedetection.io
Playwright - Bypass CSP for more reliable JS scraping, disable accept downloads
rodzic
e3e022b0f4
commit
9d742446ab
|
@ -277,8 +277,13 @@ class base_html_playwright(Fetcher):
|
||||||
# Use the default one configured in the App.py model that's passed from fetch_site_status.py
|
# Use the default one configured in the App.py model that's passed from fetch_site_status.py
|
||||||
context = browser.new_context(
|
context = browser.new_context(
|
||||||
user_agent=request_headers['User-Agent'] if request_headers.get('User-Agent') else 'Mozilla/5.0',
|
user_agent=request_headers['User-Agent'] if request_headers.get('User-Agent') else 'Mozilla/5.0',
|
||||||
proxy=self.proxy
|
proxy=self.proxy,
|
||||||
|
# This is needed to enable JavaScript execution on GitHub and others
|
||||||
|
bypass_csp=True,
|
||||||
|
# Should never be needed
|
||||||
|
accept_downloads=False
|
||||||
)
|
)
|
||||||
|
|
||||||
page = context.new_page()
|
page = context.new_page()
|
||||||
try:
|
try:
|
||||||
# Bug - never set viewport size BEFORE page.goto
|
# Bug - never set viewport size BEFORE page.goto
|
||||||
|
|
Ładowanie…
Reference in New Issue