SeleniumBase/seleniumbase/undetected/cdp_driver/tab.py

1361 lines
51 KiB
Python

from __future__ import annotations
import asyncio
import base64
import datetime
import logging
import pathlib
import urllib.parse
import warnings
from typing import Dict, List, Union, Optional, Tuple
from . import browser as cdp_browser
from . import element
from . import cdp_util as util
from .config import PathLike
from .connection import Connection, ProtocolException
import mycdp as cdp
logger = logging.getLogger(__name__)
class Tab(Connection):
"""
:ref:`tab` is the controlling mechanism/connection to a 'target',
for most of us 'target' can be read as 'tab'. However it could also
be an iframe, serviceworker or background script for example,
although there isn't much to control for those.
If you open a new window by using
:py:meth:`browser.get(..., new_window=True)`
Your url will open a new window. This window is a 'tab'.
When you browse to another page, the tab will be the same (browser view).
It's important to keep some reference to tab objects, in case you're
done interacting with elements and want to operate on the page level again.
Custom CDP commands
---------------------------
Tab object provide many useful and often-used methods. It is also possible
to utilize the included cdp classes to to something totally custom.
The cdp package is a set of so-called "domains" with each having methods,
events and types.
To send a cdp method, for example :py:obj:`cdp.page.navigate`,
you'll have to check whether the method accepts any parameters
and whether they are required or not.
You can use:
```python
await tab.send(cdp.page.navigate(url='https://Your-URL-Here'))
```
So tab.send() accepts a generator object,
which is created by calling a cdp method.
This way you can build very detailed and customized commands.
(Note: Finding correct command combos can be a time-consuming task.
A whole bunch of useful methods have been added,
preferably having the same apis or lookalikes, as in selenium.)
Some useful, often needed and simply required methods
===================================================================
:py:meth:`~find` | find(text)
----------------------------------------
Finds and returns a single element by text match.
By default, returns the first element found.
Much more powerful is the best_match flag,
although also much more expensive.
When no match is found, it will retry for <timeout> seconds (default: 10),
so this is also suitable to use as wait condition.
:py:meth:`~find` | find(text, best_match=True) or find(text, True)
-----------------------------------------------------------------------
Much more powerful (and expensive) than the above is
the use of the `find(text, best_match=True)` flag.
It will still return 1 element, but when multiple matches are found,
it picks the one having the most similar text length.
How would that help?
For example, you search for "login",
you'd probably want the "login" button element,
and not thousands of scripts/meta/headings,
which happens to contain a string of "login".
When no match is found, it will retry for <timeout> seconds (default: 10),
so this is also suitable to use as wait condition.
:py:meth:`~select` | select(selector)
----------------------------------------
Finds and returns a single element by css selector match.
When no match is found, it will retry for <timeout> seconds (default: 10),
so this is also suitable to use as wait condition.
:py:meth:`~select_all` | select_all(selector)
------------------------------------------------
Finds and returns all elements by css selector match.
When no match is found, it will retry for <timeout> seconds (default: 10),
so this is also suitable to use as wait condition.
await :py:obj:`Tab`
---------------------------
Calling `await tab` will do a lot of stuff under the hood,
and ensures all references are up to date.
Also it allows for the script to "breathe",
as it is oftentime faster than your browser or webpage.
So whenever you get stuck and things crashes or element could not be found,
you should probably let it "breathe" by calling `await page`
and/or `await page.sleep()`.
It ensures :py:obj:`~url` will be updated to the most recent one,
which is quite important in some other methods.
Using other and custom CDP commands
======================================================
Using the included cdp module, you can easily craft commands,
which will always return an generator object.
This generator object can be easily sent to the :py:meth:`~send` method.
:py:meth:`~send`
---------------------------
This is probably the most important method,
although you won't ever call it, unless you want to go really custom.
The send method accepts a :py:obj:`cdp` command.
Each of which can be found in the cdp section.
When you import * from this package, cdp will be in your namespace,
and contains all domains/actions/events you can act upon.
"""
browser: cdp_browser.Browser
_download_behavior: List[str] = None
def __init__(
self,
websocket_url: str,
target: cdp.target.TargetInfo,
browser: Optional["cdp_browser.Browser"] = None,
**kwargs,
):
super().__init__(websocket_url, target, browser, **kwargs)
self.browser = browser
self._dom = None
self._window_id = None
@property
def inspector_url(self):
"""
Get the inspector url.
This url can be used in another browser to show you
the devtools interface for current tab.
Useful for debugging and headless mode.
"""
return f"http://{self.browser.config.host}:{self.browser.config.port}/devtools/inspector.html?ws={self.websocket_url[5:]}" # noqa
def inspector_open(self):
import webbrowser
webbrowser.open(self.inspector_url, new=2)
async def open_external_inspector(self):
"""
Opens the system's browser containing the devtools inspector page
for this tab. Could be handy, especially to debug in headless mode.
"""
import webbrowser
webbrowser.open(self.inspector_url)
async def find(
self,
text: str,
best_match: bool = False,
return_enclosing_element: bool = True,
timeout: Union[int, float] = 10,
):
"""
Find single element by text.
Can also be used to wait for such element to appear.
:param text:
Text to search for. Note: Script contents are also considered text.
:type text: str
:param best_match: :param best_match:
When True (default), it will return the element which has the most
comparable string length. This could help a lot. Eg:
If you search for "login", you probably want the login button element,
and not thousands of tags/scripts containing a "login" string.
When False, it returns just the first match (but is way faster).
:type best_match: bool
:param return_enclosing_element:
Since we deal with nodes instead of elements,
the find function most often returns so called text nodes,
which is actually a element of plain text,
which is the somehow imaginary "child" of a "span", "p", "script"
or any other elements which have text between their opening
and closing tags.
Most often when we search by text, we actually aim for the
element containing the text instead of a lousy plain text node,
so by default the containing element is returned.
There are exceptions. Eg:
Elements that use the "placeholder=" property.
:type return_enclosing_element: bool
:param timeout:
Raise timeout exception when after this many seconds nothing is found.
:type timeout: float,int
"""
loop = asyncio.get_running_loop()
start_time = loop.time()
text = text.strip()
item = None
try:
item = await self.find_element_by_text(
text, best_match, return_enclosing_element
)
except (Exception, TypeError):
pass
while not item:
await self
item = await self.find_element_by_text(
text, best_match, return_enclosing_element
)
if loop.time() - start_time > timeout:
raise asyncio.TimeoutError(
"Time ran out while waiting for: {%s}" % text
)
await self.sleep(0.5)
return item
async def select(
self,
selector: str,
timeout: Union[int, float] = 10,
) -> element.Element:
"""
Find a single element by css selector.
Can also be used to wait for such an element to appear.
:param selector: css selector,
eg a[href], button[class*=close], a > img[src]
:type selector: str
:param timeout:
Raise timeout exception when after this many seconds nothing is found.
:type timeout: float,int
"""
loop = asyncio.get_running_loop()
start_time = loop.time()
selector = selector.strip()
item = None
try:
item = await self.query_selector(selector)
except (Exception, TypeError):
pass
while not item:
await self
item = await self.query_selector(selector)
if loop.time() - start_time > timeout:
raise asyncio.TimeoutError(
"Time ran out while waiting for: {%s}" % selector
)
await self.sleep(0.5)
return item
async def find_all(
self,
text: str,
timeout: Union[int, float] = 10,
) -> List[element.Element]:
"""
Find multiple elements by text.
Can also be used to wait for such elements to appear.
:param text: Text to search for.
Note: Script contents are also considered text.
:type text: str
:param timeout:
Raise timeout exception when after this many seconds nothing is found.
:type timeout: float,int
"""
loop = asyncio.get_running_loop()
now = loop.time()
text = text.strip()
items = []
try:
items = await self.find_elements_by_text(text)
except (Exception, TypeError):
pass
while not items:
await self
items = await self.find_elements_by_text(text)
if loop.time() - now > timeout:
raise asyncio.TimeoutError(
"Time ran out while waiting for: {%s}" % text
)
await self.sleep(0.5)
return items
async def select_all(
self,
selector: str,
timeout: Union[int, float] = 10,
include_frames=False,
) -> List[element.Element]:
"""
Find multiple elements by CSS Selector.
Can also be used to wait for such elements to appear.
:param selector: css selector,
eg a[href], button[class*=close], a > img[src]
:type selector: str
:param timeout:
Raise timeout exception when after this many seconds nothing is found.
:type timeout: float,int
:param include_frames: Whether to include results in iframes.
:type include_frames: bool
"""
loop = asyncio.get_running_loop()
now = loop.time()
selector = selector.strip()
items = []
if include_frames:
frames = await self.query_selector_all("iframe")
# Unfortunately, asyncio.gather is not an option here
for fr in frames:
items.extend(await fr.query_selector_all(selector))
items.extend(await self.query_selector_all(selector))
while not items:
await self
items = await self.query_selector_all(selector)
if loop.time() - now > timeout:
raise asyncio.TimeoutError(
"Time ran out while waiting for: {%s}" % selector
)
await self.sleep(0.5)
return items
async def get(
self,
url="about:blank",
new_tab: bool = False,
new_window: bool = False,
):
"""
Top level get. Utilizes the first tab to retrieve the given url.
This is a convenience function known from selenium.
This function handles waits/sleeps and detects when DOM events fired,
so it's the safest way of navigating.
:param url: the url to navigate to
:param new_tab: open new tab
:param new_window: open new window
:return: Page
"""
if not self.browser:
raise AttributeError(
"This page/tab has no browser attribute, "
"so you can't use get()"
)
if new_window and not new_tab:
new_tab = True
if new_tab:
return await self.browser.get(url, new_tab, new_window)
else:
frame_id, loader_id, *_ = await self.send(cdp.page.navigate(url))
await self
return self
async def query_selector_all(
self,
selector: str,
_node: Optional[Union[cdp.dom.Node, "element.Element"]] = None,
):
"""
Equivalent of JavaScript "document.querySelectorAll".
This is considered one of the main methods to use in this package.
It returns all matching :py:obj:`element.Element` objects.
:param selector: css selector.
(first time? => https://www.w3schools.com/cssref/css_selectors.php )
:type selector: str
:param _node: internal use
"""
if not _node:
doc: cdp.dom.Node = await self.send(cdp.dom.get_document(-1, True))
else:
doc = _node
if _node.node_name == "IFRAME":
doc = _node.content_document
node_ids = []
try:
node_ids = await self.send(
cdp.dom.query_selector_all(doc.node_id, selector)
)
except ProtocolException as e:
if _node is not None:
if "could not find node" in e.message.lower():
if getattr(_node, "__last", None):
del _node.__last
return []
# If the supplied node is not found,
# then the DOM has changed since acquiring the element.
# Therefore, we need to update our node, and try again.
await _node.update()
_node.__last = (
True # Make sure this isn't turned into infinite loop.
)
return await self.query_selector_all(selector, _node)
else:
await self.send(cdp.dom.disable())
raise
if not node_ids:
return []
items = []
for nid in node_ids:
node = util.filter_recurse(doc, lambda n: n.node_id == nid)
# Pass along the retrieved document tree to improve performance.
if not node:
continue
elem = element.create(node, self, doc)
items.append(elem)
return items
async def query_selector(
self,
selector: str,
_node: Optional[Union[cdp.dom.Node, element.Element]] = None,
):
"""
Find a single element based on a CSS Selector string.
:param selector: CSS Selector(s)
:type selector: str
"""
selector = selector.strip()
if not _node:
doc: cdp.dom.Node = await self.send(cdp.dom.get_document(-1, True))
else:
doc = _node
if _node.node_name == "IFRAME":
doc = _node.content_document
node_id = None
try:
node_id = await self.send(
cdp.dom.query_selector(doc.node_id, selector)
)
except ProtocolException as e:
if _node is not None:
if "could not find node" in e.message.lower():
if getattr(_node, "__last", None):
del _node.__last
return []
# If supplied node is not found,
# the dom has changed since acquiring the element,
# therefore, update our passed node and try again.
await _node.update()
_node.__last = (
True # Make sure this isn't turned into infinite loop.
)
return await self.query_selector(selector, _node)
else:
await self.send(cdp.dom.disable())
raise
if not node_id:
return
node = util.filter_recurse(doc, lambda n: n.node_id == node_id)
if not node:
return
return element.create(node, self, doc)
async def find_elements_by_text(
self,
text: str,
) -> List[element.Element]:
"""
Returns element which match the given text.
Note: This may (or will) also return any other element
(like inline scripts), which happen to contain that text.
:param text:
"""
text = text.strip()
doc = await self.send(cdp.dom.get_document(-1, True))
search_id, nresult = await self.send(
cdp.dom.perform_search(text, True)
)
if nresult:
node_ids = await self.send(
cdp.dom.get_search_results(search_id, 0, nresult)
)
else:
node_ids = []
await self.send(cdp.dom.discard_search_results(search_id))
items = []
for nid in node_ids:
node = util.filter_recurse(doc, lambda n: n.node_id == nid)
if not node:
node = await self.send(cdp.dom.resolve_node(node_id=nid))
if not node:
continue
# remote_object = await self.send(
# cdp.dom.resolve_node(backend_node_id=node.backend_node_id)
# )
# node_id = await self.send(
# cdp.dom.request_node(object_id=remote_object.object_id)
# )
try:
elem = element.create(node, self, doc)
except BaseException:
continue
if elem.node_type == 3:
# If found element is a text node (which is plain text,
# and useless for our purpose), we return the parent element
# of the node (which is often a tag which can have text
# between their opening and closing tags (that is most tags,
# except for example "img" and "video", "br").
if not elem.parent:
# Check if parent actually has a parent
# and update it to be absolutely sure.
await elem.update()
items.append(
elem.parent or elem
) # When there's no parent, use the text node itself.
continue
else:
# Add the element itself.
items.append(elem)
# Since we already fetched the entire doc, including shadow and frames,
# let's also search through the iframes.
iframes = util.filter_recurse_all(
doc, lambda node: node.node_name == "IFRAME"
)
if iframes:
iframes_elems = [
element.create(iframe, self, iframe.content_document)
for iframe in iframes
]
for iframe_elem in iframes_elems:
if iframe_elem.content_document:
iframe_text_nodes = util.filter_recurse_all(
iframe_elem,
lambda node: node.node_type == 3 # noqa
and text.lower() in node.node_value.lower(),
)
if iframe_text_nodes:
iframe_text_elems = [
element.create(text_node, self, iframe_elem.tree)
for text_node in iframe_text_nodes
]
items.extend(
text_node.parent for text_node in iframe_text_elems
)
await self.send(cdp.dom.disable())
return items or []
async def find_element_by_text(
self,
text: str,
best_match: Optional[bool] = False,
return_enclosing_element: Optional[bool] = True,
) -> Union[element.Element, None]:
"""
Finds and returns the first element containing <text>, or best match.
:param text:
:param best_match:
When True, which is MUCH more expensive (thus much slower),
will find the closest match based on length.
When searching for "login", you probably want the button element,
and not thousands of tags/scripts containing the "login" string.
:type best_match: bool
:param return_enclosing_element:
"""
doc = await self.send(cdp.dom.get_document(-1, True))
text = text.strip()
search_id, nresult = await self.send(
cdp.dom.perform_search(text, True)
)
node_ids = await self.send(
cdp.dom.get_search_results(search_id, 0, nresult)
)
await self.send(cdp.dom.discard_search_results(search_id))
if not node_ids:
node_ids = []
items = []
for nid in node_ids:
node = util.filter_recurse(doc, lambda n: n.node_id == nid)
try:
elem = element.create(node, self, doc)
except BaseException:
continue
if elem.node_type == 3:
# If found element is a text node
# (which is plain text, and useless for our purpose),
# then return the parent element of the node
# (which is often a tag which can have text between their
# opening and closing tags (that is most tags,
# except for example "img" and "video", "br").
if not elem.parent:
# Check if parent has a parent, and update it to be sure.
await elem.update()
items.append(
elem.parent or elem
) # When it really has no parent, use the text node itself
continue
else:
# Add the element itself
items.append(elem)
# Since the entire doc is already fetched, including shadow and frames,
# also search through the iframes.
iframes = util.filter_recurse_all(
doc, lambda node: node.node_name == "IFRAME"
)
if iframes:
iframes_elems = [
element.create(iframe, self, iframe.content_document)
for iframe in iframes
]
for iframe_elem in iframes_elems:
iframe_text_nodes = util.filter_recurse_all(
iframe_elem,
lambda node: node.node_type == 3 # noqa
and text.lower() in node.node_value.lower(),
)
if iframe_text_nodes:
iframe_text_elems = [
element.create(text_node, self, iframe_elem.tree)
for text_node in iframe_text_nodes
]
items.extend(
text_node.parent for text_node in iframe_text_elems
)
try:
if not items:
return
if best_match:
closest_by_length = min(
items, key=lambda el: abs(len(text) - len(el.text_all))
)
elem = closest_by_length or items[0]
return elem
else:
# Return the first result
for elem in items:
if elem:
return elem
finally:
await self.send(cdp.dom.disable())
async def back(self):
"""History back"""
await self.send(cdp.runtime.evaluate("window.history.back()"))
async def forward(self):
"""History forward"""
await self.send(cdp.runtime.evaluate("window.history.forward()"))
async def get_navigation_history(self):
"""Get Navigation History"""
return await self.send(cdp.page.get_navigation_history())
async def reload(
self,
ignore_cache: Optional[bool] = True,
script_to_evaluate_on_load: Optional[str] = None,
):
"""
Reloads the page
:param ignore_cache: When set to True (default),
it ignores cache, and re-downloads the items.
:param script_to_evaluate_on_load: Script to run on load.
"""
await self.send(
cdp.page.reload(
ignore_cache=ignore_cache,
script_to_evaluate_on_load=script_to_evaluate_on_load,
),
)
async def evaluate(
self, expression: str, await_promise=False, return_by_value=True
):
remote_object, errors = await self.send(
cdp.runtime.evaluate(
expression=expression,
user_gesture=True,
await_promise=await_promise,
return_by_value=return_by_value,
allow_unsafe_eval_blocked_by_csp=True,
)
)
if errors:
raise ProtocolException(errors)
if remote_object:
if return_by_value:
if remote_object.value:
return remote_object.value
else:
return remote_object, errors
async def js_dumps(
self, obj_name: str, return_by_value: Optional[bool] = True
) -> Union[
Dict,
Tuple[cdp.runtime.RemoteObject, cdp.runtime.ExceptionDetails],
]:
"""
Dump Given js object with its properties and values as a dict.
Note: Complex objects might not be serializable,
therefore this method is not a "source of truth"
:param obj_name: the js object to dump
:type obj_name: str
:param return_by_value: If you want an tuple of cdp objects
(returnvalue, errors), then set this to False.
:type return_by_value: bool
Example
-------
x = await self.js_dumps('window')
print(x)
'...{
'pageYOffset': 0,
'visualViewport': {},
'screenX': 10,
'screenY': 10,
'outerWidth': 1050,
'outerHeight': 832,
'devicePixelRatio': 1,
'screenLeft': 10,
'screenTop': 10,
'styleMedia': {},
'onsearch': None,
'isSecureContext': True,
'trustedTypes': {},
'performance': {'timeOrigin': 1707823094767.9,
'timing': {'connectStart': 0,
'navigationStart': 1707823094768,
]...
"""
js_code_a = (
"""
function ___dump(obj, _d = 0) {
let _typesA = ['object', 'function'];
let _typesB = ['number', 'string', 'boolean'];
if (_d == 2) {
console.log('maxdepth reached for ', obj);
return
}
let tmp = {}
for (let k in obj) {
if (obj[k] == window) continue;
let v;
try {
if (obj[k] === null
|| obj[k] === undefined
|| obj[k] === NaN) {
console.log('obj[k] is null or undefined or Nan',
k, '=>', obj[k])
tmp[k] = obj[k];
continue
}
} catch (e) {
tmp[k] = null;
continue
}
if (_typesB.includes(typeof obj[k])) {
tmp[k] = obj[k]
continue
}
try {
if (typeof obj[k] === 'function') {
tmp[k] = obj[k].toString()
continue
}
if (typeof obj[k] === 'object') {
tmp[k] = ___dump(obj[k], _d + 1);
continue
}
} catch (e) {}
try {
tmp[k] = JSON.stringify(obj[k])
continue
} catch (e) {
}
try {
tmp[k] = obj[k].toString();
continue
} catch (e) {}
}
return tmp
}
function ___dumpY(obj) {
var objKeys = (obj) => {
var [target, result] = [obj, []];
while (target !== null) {
result = result.concat(
Object.getOwnPropertyNames(target)
);
target = Object.getPrototypeOf(target);
}
return result;
}
return Object.fromEntries(
objKeys(obj).map(_ => [_, ___dump(obj[_])]))
}
___dumpY( %s )
"""
% obj_name
)
js_code_b = (
"""
((obj, visited = new WeakSet()) => {
if (visited.has(obj)) {
return {}
}
visited.add(obj)
var result = {}, _tmp;
for (var i in obj) {
try {
if (i === 'enabledPlugin'
|| typeof obj[i] === 'function') {
continue;
} else if (typeof obj[i] === 'object') {
_tmp = recurse(obj[i], visited);
if (Object.keys(_tmp).length) {
result[i] = _tmp;
}
} else {
result[i] = obj[i];
}
} catch (error) {
// console.error('Error:', error);
}
}
return result;
})(%s)
"""
% obj_name
)
# No self.evaluate here to prevent infinite loop on certain expressions
remote_object, exception_details = await self.send(
cdp.runtime.evaluate(
js_code_a,
await_promise=True,
return_by_value=return_by_value,
allow_unsafe_eval_blocked_by_csp=True,
)
)
if exception_details:
# Try second variant
remote_object, exception_details = await self.send(
cdp.runtime.evaluate(
js_code_b,
await_promise=True,
return_by_value=return_by_value,
allow_unsafe_eval_blocked_by_csp=True,
)
)
if exception_details:
raise ProtocolException(exception_details)
if return_by_value:
if remote_object.value:
return remote_object.value
else:
return remote_object, exception_details
async def close(self):
"""Close the current target (ie: tab,window,page)"""
if self.target and self.target.target_id:
await self.send(
cdp.target.close_target(target_id=self.target.target_id)
)
await asyncio.sleep(0.1)
async def get_window(self) -> Tuple[
cdp.browser.WindowID, cdp.browser.Bounds
]:
"""Get the window Bounds"""
window_id, bounds = await self.send(
cdp.browser.get_window_for_target(self.target_id)
)
return window_id, bounds
async def get_content(self):
"""Gets the current page source content (html)"""
doc: cdp.dom.Node = await self.send(cdp.dom.get_document(-1, True))
return await self.send(
cdp.dom.get_outer_html(backend_node_id=doc.backend_node_id)
)
async def maximize(self):
"""Maximize page/tab/window"""
return await self.set_window_state(state="maximize")
async def minimize(self):
"""Minimize page/tab/window"""
return await self.set_window_state(state="minimize")
async def fullscreen(self):
"""Minimize page/tab/window"""
return await self.set_window_state(state="fullscreen")
async def medimize(self):
return await self.set_window_state(state="normal")
async def set_window_size(self, left=0, top=0, width=1280, height=1024):
"""
Set window size and position.
:param left:
Pixels from the left of the screen to the window top-left corner.
:param top:
Pixels from the top of the screen to the window top-left corner.
:param width: width of the window in pixels
:param height: height of the window in pixels
"""
return await self.set_window_state(left, top, width, height)
async def set_window_rect(self, left=0, top=0, width=1280, height=1024):
"""Same as set_window_size(). Uses a different naming convention."""
return await self.set_window_state(left, top, width, height)
async def activate(self):
"""Active this target (Eg: tab, window, page)"""
await self.send(cdp.target.activate_target(self.target.target_id))
async def bring_to_front(self):
"""Alias to self.activate"""
await self.activate()
async def set_window_state(
self, left=0, top=0, width=1280, height=720, state="normal"
):
"""
Sets the window size or state.
For state you can provide the full name like minimized, maximized,
normal, fullscreen, or something which leads to either of those,
like min, mini, mi, max, ma, maxi, full, fu, no, nor.
In case state is set other than "normal",
the left, top, width, and height are ignored.
:param left:
desired offset from left, in pixels
:type left: int
:param top:
desired offset from the top, in pixels
:type top: int
:param width:
desired width in pixels
:type width: int
:param height:
desired height in pixels
:type height: int
:param state:
can be one of the following strings:
- normal
- fullscreen
- maximized
- minimized
:type state: str
"""
available_states = ["minimized", "maximized", "fullscreen", "normal"]
window_id: cdp.browser.WindowID
bounds: cdp.browser.Bounds
(window_id, bounds) = await self.get_window()
for state_name in available_states:
if all(x in state_name for x in state.lower()):
break
else:
raise NameError(
"could not determine any of %s from input '%s'"
% (",".join(available_states), state)
)
window_state = getattr(
cdp.browser.WindowState,
state_name.upper(),
cdp.browser.WindowState.NORMAL,
)
if window_state == cdp.browser.WindowState.NORMAL:
bounds = cdp.browser.Bounds(
left, top, width, height, window_state
)
else:
# min, max, full can only be used when current state == NORMAL,
# therefore, first switch to NORMAL
await self.set_window_state(state="normal")
bounds = cdp.browser.Bounds(window_state=window_state)
await self.send(
cdp.browser.set_window_bounds(window_id, bounds=bounds)
)
async def scroll_down(self, amount=25):
"""
Scrolls the page down.
:param amount: Number in percentage.
25 is a quarter of page, 50 half, and 1000 is 10x the page.
:type amount: int
"""
window_id: cdp.browser.WindowID
bounds: cdp.browser.Bounds
(window_id, bounds) = await self.get_window()
await self.send(
cdp.input_.synthesize_scroll_gesture(
x=0,
y=0,
y_distance=-(bounds.height * (amount / 100)),
y_overscroll=0,
x_overscroll=0,
prevent_fling=True,
repeat_delay_ms=0,
speed=7777,
)
)
async def scroll_up(self, amount=25):
"""
Scrolls the page up.
:param amount: Number in percentage.
25 is a quarter of page, 50 half, and 1000 is 10x the page.
:type amount: int
"""
window_id: cdp.browser.WindowID
bounds: cdp.browser.Bounds
(window_id, bounds) = await self.get_window()
await self.send(
cdp.input_.synthesize_scroll_gesture(
x=0,
y=0,
y_distance=(bounds.height * (amount / 100)),
x_overscroll=0,
prevent_fling=True,
repeat_delay_ms=0,
speed=7777,
)
)
async def wait_for(
self,
selector: Optional[str] = "",
text: Optional[str] = "",
timeout: Optional[Union[int, float]] = 10,
) -> element.Element:
"""
Variant on query_selector_all and find_elements_by_text.
This variant takes either selector or text,
and will block until the requested element(s) are found.
It will block for a maximum of <timeout> seconds,
after which a TimeoutError will be raised.
:param selector: css selector
:param text: text
:param timeout:
:return: Element
:raises: asyncio.TimeoutError
"""
loop = asyncio.get_running_loop()
now = loop.time()
if selector:
item = await self.query_selector(selector)
while not item:
item = await self.query_selector(selector)
if loop.time() - now > timeout:
raise asyncio.TimeoutError(
"Time ran out while waiting for: {%s}" % selector
)
await self.sleep(0.5)
return item
if text:
item = await self.find_element_by_text(text)
while not item:
item = await self.find_element_by_text(text)
if loop.time() - now > timeout:
raise asyncio.TimeoutError(
"Time ran out while waiting for: {%s}" % text
)
await self.sleep(0.5)
return item
async def download_file(
self, url: str, filename: Optional[PathLike] = None
):
"""
Downloads the file by the given url.
:param url: The URL of the file.
:param filename: The name for the file.
If not specified, the name is composed from the url file name
"""
if not self._download_behavior:
directory_path = pathlib.Path.cwd() / "downloads"
directory_path.mkdir(exist_ok=True)
await self.set_download_path(directory_path)
warnings.warn(
f"No download path set, so creating and using a default of "
f"{directory_path}"
)
if not filename:
filename = url.rsplit("/")[-1]
filename = filename.split("?")[0]
code = """
(elem) => {
async function _downloadFile(
imageSrc,
nameOfDownload,
) {
const response = await fetch(imageSrc);
const blobImage = await response.blob();
const href = URL.createObjectURL(blobImage);
const anchorElement = document.createElement('a');
anchorElement.href = href;
anchorElement.download = nameOfDownload;
document.body.appendChild(anchorElement);
anchorElement.click();
setTimeout(() => {
document.body.removeChild(anchorElement);
window.URL.revokeObjectURL(href);
}, 500);
}
_downloadFile('%s', '%s')
}
""" % (
url,
filename,
)
body = (await self.query_selector_all("body"))[0]
await body.update()
await self.send(
cdp.runtime.call_function_on(
code,
object_id=body.object_id,
arguments=[cdp.runtime.CallArgument(object_id=body.object_id)],
)
)
async def save_screenshot(
self,
filename: Optional[PathLike] = "auto",
format: Optional[str] = "png",
full_page: Optional[bool] = False,
) -> str:
"""
Saves a screenshot of the page.
This is not the same as :py:obj:`Element.save_screenshot`,
which saves a screenshot of a single element only.
:param filename: uses this as the save path
:type filename: PathLike
:param format: jpeg or png (defaults to jpeg)
:type format: str
:param full_page:
When False (default), it captures the current viewport.
When True, it captures the entire page.
:type full_page: bool
:return: The path/filename of the saved screenshot.
:rtype: str
"""
await self.sleep() # Update the target's URL
path = None
if format.lower() in ["jpg", "jpeg"]:
ext = ".jpg"
format = "jpeg"
elif format.lower() in ["png"]:
ext = ".png"
format = "png"
if not filename or filename == "auto":
parsed = urllib.parse.urlparse(self.target.url)
parts = parsed.path.split("/")
last_part = parts[-1]
last_part = last_part.rsplit("?", 1)[0]
dt_str = datetime.datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
candidate = f"{parsed.hostname}__{last_part}_{dt_str}"
path = pathlib.Path(candidate + ext) # noqa
else:
path = pathlib.Path(filename)
path.parent.mkdir(parents=True, exist_ok=True)
data = await self.send(
cdp.page.capture_screenshot(
format_=format, capture_beyond_viewport=full_page
)
)
if not data:
raise ProtocolException(
"Could not take screenshot. "
"Most possible cause is the page "
"has not finished loading yet."
)
data_bytes = base64.b64decode(data)
if not path:
raise RuntimeError("Invalid filename or path: '%s'" % filename)
path.write_bytes(data_bytes)
return str(path)
async def print_to_pdf(
self,
filename: Optional[PathLike] = "auto",
) -> str:
"""
Saves a webpage as a PDF.
:param filename: uses this as the save path
:type filename: PathLike
:return: The path/filename of the saved screenshot.
:rtype: str
"""
await self.sleep() # Update the target's URL
path = None
ext = ".pdf"
if not filename or filename == "auto":
parsed = urllib.parse.urlparse(self.target.url)
parts = parsed.path.split("/")
last_part = parts[-1]
last_part = last_part.rsplit("?", 1)[0]
dt_str = datetime.datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
candidate = f"{parsed.hostname}__{last_part}_{dt_str}"
path = pathlib.Path(candidate + ext) # noqa
else:
path = pathlib.Path(filename)
path.parent.mkdir(parents=True, exist_ok=True)
data, _ = await self.send(cdp.page.print_to_pdf())
if not data:
raise ProtocolException("Could not save PDF.")
data_bytes = base64.b64decode(data)
if not path:
raise RuntimeError("Invalid filename or path: '%s'" % filename)
path.write_bytes(data_bytes)
return str(path)
async def set_download_path(self, path: PathLike):
"""
Sets the download path.
When not set, a default folder is used.
:param path:
"""
await self.send(
cdp.browser.set_download_behavior(
behavior="allow", download_path=str(path.resolve())
)
)
self._download_behavior = ["allow", str(path.resolve())]
async def get_all_linked_sources(self) -> List["element.Element"]:
"""Get all elements of tag: link, a, img, scripts meta, video, audio"""
all_assets = await self.query_selector_all(
selector="a,link,img,script,meta"
)
return [element.create(asset, self) for asset in all_assets]
async def get_all_urls(self, absolute=True) -> List[str]:
"""
Convenience function, which returns all links (a,link,img,script,meta).
:param absolute:
Try to build all the links in absolute form
instead of "as is", often relative.
:return: List of URLs.
"""
import urllib.parse
res = []
all_assets = await self.query_selector_all(
selector="a,link,img,script,meta"
)
for asset in all_assets:
if not absolute:
res.append(asset.src or asset.href)
else:
for k, v in asset.attrs.items():
if k in ("src", "href"):
if "#" in v:
continue
if not any([_ in v for _ in ("http", "//", "/")]):
continue
abs_url = urllib.parse.urljoin(
"/".join(self.url.rsplit("/")[:3]), v
)
if not abs_url.startswith(("http", "//", "ws")):
continue
res.append(abs_url)
return res
async def verify_cf(self):
"""(An attempt)"""
checkbox = None
checkbox_sibling = await self.wait_for(text="verify you are human")
if checkbox_sibling:
parent = checkbox_sibling.parent
while parent:
checkbox = await parent.query_selector("input[type=checkbox]")
if checkbox:
break
parent = parent.parent
await checkbox.mouse_move()
await checkbox.mouse_click()
async def get_document(self):
return await self.send(cdp.dom.get_document())
async def get_flattened_document(self):
return await self.send(cdp.dom.get_flattened_document())
async def get_local_storage(self):
"""
Get local storage items as dict of strings.
Proper deserialization may need to be done.
"""
if not self.target.url:
await self
origin = "/".join(self.url.split("/", 3)[:-1])
items = await self.send(
cdp.dom_storage.get_dom_storage_items(
cdp.dom_storage.StorageId(
is_local_storage=True, security_origin=origin
)
)
)
retval = {}
for item in items:
retval[item[0]] = item[1]
return retval
async def set_local_storage(self, items: dict):
"""
Set local storage.
Dict items must be strings.
Simple types will be converted to strings automatically.
:param items: dict containing {key:str, value:str}
:type items: dict[str,str]
"""
if not self.target.url:
await self
origin = "/".join(self.url.split("/", 3)[:-1])
await asyncio.gather(
*[
self.send(
cdp.dom_storage.set_dom_storage_item(
storage_id=cdp.dom_storage.StorageId(
is_local_storage=True, security_origin=origin
),
key=str(key),
value=str(val),
)
)
for key, val in items.items()
]
)
def __call__(
self,
text: Optional[str] = "",
selector: Optional[str] = "",
timeout: Optional[Union[int, float]] = 10,
):
"""
Alias to query_selector_all or find_elements_by_text,
depending on whether text= is set or selector= is set.
:param selector: css selector string
:type selector: str
"""
return self.wait_for(text, selector, timeout)
def __eq__(self, other: Tab):
try:
return other.target == self.target
except (AttributeError, TypeError):
return False
def __getattr__(self, item):
try:
return getattr(self._target, item)
except AttributeError:
raise AttributeError(
f'"{self.__class__.__name__}" has no attribute "%s"' % item
)
def __repr__(self):
extra = ""
if self.target.url:
extra = f"[url: {self.target.url}]"
s = f"<{type(self).__name__} [{self.target_id}] [{self.type_}] {extra}>" # noqa
return s