Add files via upload
This commit is contained in:
parent
3d3d1aeca8
commit
d7a826db47
|
@ -0,0 +1,271 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
888 888 d8b
|
||||||
|
888 888 Y8P
|
||||||
|
888 888
|
||||||
|
.d8888b 88888b. 888d888 .d88b. 88888b.d88b. .d88b. .d88888 888d888 888 888 888 .d88b. 888d888
|
||||||
|
d88P" 888 "88b 888P" d88""88b 888 "888 "88b d8P Y8b d88" 888 888P" 888 888 888 d8P Y8b 888P"
|
||||||
|
888 888 888 888 888 888 888 888 888 88888888 888 888 888 888 Y88 88P 88888888 888
|
||||||
|
Y88b. 888 888 888 Y88..88P 888 888 888 Y8b. Y88b 888 888 888 Y8bd8P Y8b. 888
|
||||||
|
"Y8888P 888 888 888 "Y88P" 888 888 888 "Y8888 "Y88888 888 888 Y88P "Y8888 888 88888888
|
||||||
|
|
||||||
|
888 d8b 888 888
|
||||||
|
888 Y8P 888 888
|
||||||
|
888 888 888
|
||||||
|
88888b. 888 .d88888 .d88888 .d88b. 88888b.
|
||||||
|
888 "88b 888 d88" 888 d88" 888 d8P Y8b 888 "88b
|
||||||
|
888 888 888 888 888 888 888 88888888 888 888
|
||||||
|
888 888 888 Y88b 888 Y88b 888 Y8b. 888 888
|
||||||
|
888 888 888 "Y88888 "Y88888 "Y8888 888 888
|
||||||
|
|
||||||
|
BY ULTRAFUNKAMSTERDAM (https://github.com/ultrafunkamsterdam)
|
||||||
|
|
||||||
|
|
||||||
|
##################################################################
|
||||||
|
|
||||||
|
Optimized Selenium Chromedriver patch which does not trigger anti-bot services like Distill Network.
|
||||||
|
Automatically downloads the driver binary and patches it.
|
||||||
|
|
||||||
|
Not tested on Chrome higher than 79!
|
||||||
|
|
||||||
|
#################################################################
|
||||||
|
|
||||||
|
|
||||||
|
USAGE
|
||||||
|
|
||||||
|
# 1- by far the easiest
|
||||||
|
|
||||||
|
from undetected_chromedriver import Chrome, ChromeOptions
|
||||||
|
driver = Chrome()
|
||||||
|
driver.get('https://distilnetworks.com')
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
# 2- patches current selenium instance (for current session)
|
||||||
|
|
||||||
|
import undetected_chromedriver
|
||||||
|
undetected_chromedriver.install()
|
||||||
|
|
||||||
|
from selenium.webdriver import Chrome
|
||||||
|
driver = Chrome()
|
||||||
|
driver.get('https://distilnetworks.com')
|
||||||
|
|
||||||
|
|
||||||
|
# 3 - Customized
|
||||||
|
|
||||||
|
import undetected_chromedriver
|
||||||
|
|
||||||
|
#specify chromedriver version to download and patch
|
||||||
|
undetected_chromedriver.TARGET_VERSION = 78
|
||||||
|
|
||||||
|
# or specify your own chromedriver binary to patch
|
||||||
|
undetected_chromedriver.install(
|
||||||
|
executable_path='c:/users/user1/chromedriver.exe',
|
||||||
|
target_version=78
|
||||||
|
)
|
||||||
|
|
||||||
|
from selenium.webdriver import Chrome, ChromeOptions
|
||||||
|
opts = ChromeOptions()
|
||||||
|
opts.add_argument(f'--proxy-server=socks5://127.0.0.1:9050')
|
||||||
|
driver = Chrome(options=opts)
|
||||||
|
driver.get('https://distilnetworks.com')
|
||||||
|
|
||||||
|
|
||||||
|
a combination of function(s) from this module :)
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
import io
|
||||||
|
import logging
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
import zipfile
|
||||||
|
from urllib.request import urlopen, urlretrieve
|
||||||
|
|
||||||
|
from selenium.webdriver import Chrome as _Chrome
|
||||||
|
from selenium.webdriver import ChromeOptions as _ChromeOptions
|
||||||
|
|
||||||
|
|
||||||
|
_DL_BASE = "https://chromedriver.storage.googleapis.com/"
|
||||||
|
TARGET_VERSION = 79
|
||||||
|
__is_patched__ = 0
|
||||||
|
|
||||||
|
|
||||||
|
class Chrome:
|
||||||
|
def __new__(cls, *args, **kwargs):
|
||||||
|
if not ChromeDriverManager.installed:
|
||||||
|
ChromeDriverManager(*args, **kwargs).install()
|
||||||
|
if not ChromeDriverManager.selenium_patched:
|
||||||
|
ChromeDriverManager(*args, **kwargs).patch_selenium_webdriver()
|
||||||
|
instance = object.__new__(_Chrome)
|
||||||
|
instance.__init__(*args, **kwargs)
|
||||||
|
instance.execute_cdp_cmd(
|
||||||
|
"Page.addScriptToEvaluateOnNewDocument",
|
||||||
|
{
|
||||||
|
"source": """
|
||||||
|
Object.defineProperty(navigator, 'webdriver', {
|
||||||
|
get: () => undefined
|
||||||
|
})
|
||||||
|
"""
|
||||||
|
},
|
||||||
|
)
|
||||||
|
original_user_agent_string = instance.execute_script(
|
||||||
|
"return navigator.userAgent"
|
||||||
|
)
|
||||||
|
instance.execute_cdp_cmd(
|
||||||
|
"Network.setUserAgentOverride",
|
||||||
|
{
|
||||||
|
"userAgent": original_user_agent_string.replace("Headless", ""),
|
||||||
|
"platform": "Windows",
|
||||||
|
},
|
||||||
|
)
|
||||||
|
print(f"starting webdriver instance Chrome({args}, {kwargs})")
|
||||||
|
return instance
|
||||||
|
|
||||||
|
|
||||||
|
class ChromeOptions:
|
||||||
|
def __new__(cls, *args, **kwargs):
|
||||||
|
if not ChromeDriverManager.installed:
|
||||||
|
ChromeDriverManager(*args, **kwargs).install()
|
||||||
|
if not ChromeDriverManager.selenium_patched:
|
||||||
|
ChromeDriverManager(*args, **kwargs).patch_selenium_webdriver()
|
||||||
|
instance = object.__new__(_ChromeOptions)
|
||||||
|
instance.__init__()
|
||||||
|
print(f"starting options instance ChromeOptions({args}, {kwargs})")
|
||||||
|
return instance
|
||||||
|
|
||||||
|
# return _ChromeOptions()
|
||||||
|
|
||||||
|
|
||||||
|
class ChromeDriverManager(object):
|
||||||
|
installed = False
|
||||||
|
selenium_patched = False
|
||||||
|
|
||||||
|
def __init__(self, executable_path=None, target_version=None, *args, **kwargs):
|
||||||
|
self.executable_path = executable_path or "chromedriver.exe"
|
||||||
|
self.platform = sys.platform
|
||||||
|
self.target_version = target_version
|
||||||
|
|
||||||
|
def patch_selenium_webdriver(self_):
|
||||||
|
"""
|
||||||
|
Patches existing webdriver path on <executable_path> OR if executable_path is None, will download
|
||||||
|
and patch a new webdriver binary for chrome <version_int> (automatically finds latest release of main version)
|
||||||
|
|
||||||
|
:param str executable_path: OPTIONAL path to existing chromedriver executable to patch
|
||||||
|
:param int version_int: OPTIONAL target chrome main version. default 79
|
||||||
|
:return:
|
||||||
|
"""
|
||||||
|
import selenium.webdriver.chrome.service
|
||||||
|
import selenium.webdriver
|
||||||
|
|
||||||
|
# Monkeypatching ChromeDriver Service
|
||||||
|
if self_.__class__.selenium_patched:
|
||||||
|
return
|
||||||
|
|
||||||
|
Service__init__ = selenium.webdriver.chrome.service.Service.__init__
|
||||||
|
|
||||||
|
def patched_Service__init__(self, *a, **k):
|
||||||
|
logging.warning("Using patched ChromeDriver Service class")
|
||||||
|
Service__init__(self, self_.executable_path, **k)
|
||||||
|
|
||||||
|
selenium.webdriver.chrome.service.Service.__init__ = patched_Service__init__
|
||||||
|
|
||||||
|
# monkeypatching ChromeOptions
|
||||||
|
ChromeOptions__init__ = selenium.webdriver.ChromeOptions.__init__
|
||||||
|
|
||||||
|
def patched_ChromeOptions__init__(self):
|
||||||
|
logging.warning("Using patched ChromeOptions class")
|
||||||
|
ChromeOptions__init__(self)
|
||||||
|
self.add_argument("start-maximized")
|
||||||
|
self.add_experimental_option("excludeSwitches", ["enable-automation"])
|
||||||
|
self.add_experimental_option("useAutomationExtension", False)
|
||||||
|
|
||||||
|
selenium.webdriver.ChromeOptions.__init__ = patched_ChromeOptions__init__
|
||||||
|
logging.warning(
|
||||||
|
"Now it is safe to import Chrome and ChromeOptions from selenium"
|
||||||
|
)
|
||||||
|
self_.__class__.selenium_patched = True
|
||||||
|
|
||||||
|
def install(self, patch_selenium=True):
|
||||||
|
"""
|
||||||
|
Initialize the patch
|
||||||
|
|
||||||
|
This will:
|
||||||
|
download chromedriver if not present
|
||||||
|
patch the downloaded chromedriver
|
||||||
|
patch selenium package if <patch_selenium> is True (default)
|
||||||
|
|
||||||
|
:param patch_selenium: patch selenium webdriver classes for Chrome and ChromeDriver (for current python session)
|
||||||
|
:return:
|
||||||
|
"""
|
||||||
|
if (
|
||||||
|
not self.__class__.installed
|
||||||
|
or not __is_patched__
|
||||||
|
or not os.path.exists(self.executable_path)
|
||||||
|
):
|
||||||
|
self.fetch_chromedriver()
|
||||||
|
self.patch_binary()
|
||||||
|
self.__class__.installed = True
|
||||||
|
|
||||||
|
if patch_selenium:
|
||||||
|
self.patch_selenium_webdriver()
|
||||||
|
|
||||||
|
def get_release_version_number(self):
|
||||||
|
"""
|
||||||
|
Gets the latest major version available, or the latest major version of self.target_version if set explicitly.
|
||||||
|
|
||||||
|
:return: version string
|
||||||
|
"""
|
||||||
|
path = (
|
||||||
|
"LATEST_RELEASE"
|
||||||
|
if not self.target_version
|
||||||
|
else f"LATEST_RELEASE_{self.target_version}"
|
||||||
|
)
|
||||||
|
return urlopen(_DL_BASE + path).read().decode()
|
||||||
|
|
||||||
|
def fetch_chromedriver(self):
|
||||||
|
"""
|
||||||
|
Downloads ChromeDriver from source and unpacks the executable
|
||||||
|
|
||||||
|
:return: on success, name of the unpacked executable
|
||||||
|
"""
|
||||||
|
base_ = "chromedriver{}"
|
||||||
|
exe_name = base_.format(".exe")
|
||||||
|
zip_name = base_.format(".zip")
|
||||||
|
ver = self.get_release_version_number()
|
||||||
|
urlretrieve(
|
||||||
|
f"{_DL_BASE}{ver}/{base_.format(f'_{self.platform}')}.zip",
|
||||||
|
filename=zip_name,
|
||||||
|
)
|
||||||
|
with zipfile.ZipFile(zip_name) as zf:
|
||||||
|
zf.extract(exe_name)
|
||||||
|
os.remove(zip_name)
|
||||||
|
return exe_name
|
||||||
|
|
||||||
|
def patch_binary(self):
|
||||||
|
"""
|
||||||
|
Patches the ChromeDriver binary
|
||||||
|
|
||||||
|
:return: False on failure, binary name on success
|
||||||
|
"""
|
||||||
|
if self.__class__.installed:
|
||||||
|
return
|
||||||
|
|
||||||
|
with io.open(self.executable_path, "r+b") as binary:
|
||||||
|
for line in iter(lambda: binary.readline(), b""):
|
||||||
|
if b"cdc_" in line:
|
||||||
|
binary.seek(-len(line), 1)
|
||||||
|
line = b" var key = '$azc_abcdefghijklmnopQRstuv_';\n"
|
||||||
|
binary.write(line)
|
||||||
|
__is_patched__ = 1
|
||||||
|
break
|
||||||
|
else:
|
||||||
|
return False
|
||||||
|
return True
|
||||||
|
|
||||||
|
|
||||||
|
def install(executable_path=None, target_version=TARGET_VERSION, *args, **kwargs):
|
||||||
|
ChromeDriverManager(executable_path, target_version, *args, **kwargs).install()
|
Loading…
Reference in New Issue