ele()和s_ele()增加index参数,未完成;优化查找元素速度

This commit is contained in:
g1879 2024-01-09 23:35:36 +08:00
parent 29de18c023
commit 86ff9098b2
19 changed files with 551 additions and 434 deletions

View File

@ -14,4 +14,4 @@ from ._configs.chromium_options import ChromiumOptions
from ._configs.session_options import SessionOptions from ._configs.session_options import SessionOptions
__all__ = ['ChromiumPage', 'ChromiumOptions', 'SessionOptions', 'SessionPage', 'WebPage', '__version__'] __all__ = ['ChromiumPage', 'ChromiumOptions', 'SessionOptions', 'SessionPage', 'WebPage', '__version__']
__version__ = '4.0.1' __version__ = '4.0.0b37'

View File

@ -23,11 +23,11 @@ class BaseParser(object):
def __call__(self, loc_or_str): def __call__(self, loc_or_str):
return self.ele(loc_or_str) return self.ele(loc_or_str)
def ele(self, loc_or_ele, timeout=None): def ele(self, loc_or_ele, index=0, timeout=None):
return self._ele(loc_or_ele, timeout, True, method='ele()') return self._ele(loc_or_ele, timeout, index=index, method='ele()')
def eles(self, loc_or_str, timeout=None): def eles(self, loc_or_str, timeout=None):
return self._ele(loc_or_str, timeout, False) return self._ele(loc_or_str, timeout, index=None)
# ----------------以下属性或方法待后代实现---------------- # ----------------以下属性或方法待后代实现----------------
@property @property
@ -40,11 +40,11 @@ class BaseParser(object):
def s_eles(self, loc_or_str): def s_eles(self, loc_or_str):
pass pass
def _ele(self, loc_or_ele, timeout=None, single=True, raise_err=None, method=None): def _ele(self, loc_or_ele, timeout=None, index=0, raise_err=None, method=None):
pass pass
@abstractmethod @abstractmethod
def _find_elements(self, loc_or_ele, timeout=None, single=True, raise_err=None): def _find_elements(self, loc_or_ele, timeout=None, index=0, raise_err=None):
pass pass
@ -68,8 +68,8 @@ class BaseElement(BaseParser):
def nexts(self): def nexts(self):
pass pass
def _ele(self, loc_or_str, timeout=None, single=True, relative=False, raise_err=None, method=None): def _ele(self, loc_or_str, timeout=None, index=0, relative=False, raise_err=None, method=None):
r = self._find_elements(loc_or_str, timeout=timeout, single=single, relative=relative, raise_err=raise_err) r = self._find_elements(loc_or_str, timeout=timeout, index=index, relative=relative, raise_err=raise_err)
if r or isinstance(r, list): if r or isinstance(r, list):
return r return r
if Settings.raise_when_ele_not_found or raise_err is True: if Settings.raise_when_ele_not_found or raise_err is True:
@ -80,7 +80,7 @@ class BaseElement(BaseParser):
return r return r
@abstractmethod @abstractmethod
def _find_elements(self, loc_or_str, timeout=None, single=True, relative=False, raise_err=None): def _find_elements(self, loc_or_str, timeout=None, index=0, relative=False, raise_err=None):
pass pass
@ -122,8 +122,8 @@ class DrissionElement(BaseElement):
def parent(self, level_or_loc=1, index=1): def parent(self, level_or_loc=1, index=1):
"""返回上面某一级父元素,可指定层数或用查询语法定位 """返回上面某一级父元素,可指定层数或用查询语法定位
:param level_or_loc: 第几级父元素或定位符 :param level_or_loc: 第几级父元素1开始或定位符
:param index: 当level_or_loc传入定位符使用此参数选择第几个结果 :param index: 当level_or_loc传入定位符使用此参数选择第几个结果1开始
:return: 上级元素对象 :return: 上级元素对象
""" """
if isinstance(level_or_loc, int): if isinstance(level_or_loc, int):
@ -153,24 +153,23 @@ class DrissionElement(BaseElement):
if isinstance(filter_loc, int): if isinstance(filter_loc, int):
index = filter_loc index = filter_loc
filter_loc = '' filter_loc = ''
nodes = self.children(filter_loc=filter_loc, timeout=timeout, ele_only=ele_only) if not filter_loc:
if not nodes: loc = '*' if ele_only else 'node()'
if Settings.raise_when_ele_not_found:
raise ElementNotFoundError(None, 'child()', {'filter_loc': filter_loc,
'index': index, 'ele_only': ele_only})
else: else:
return NoneElement(self.page, 'child()', {'filter_loc': filter_loc, loc = get_loc(filter_loc, True) # 把定位符转换为xpath
'index': index, 'ele_only': ele_only}) if loc[0] == 'css selector':
raise ValueError('此css selector语法不受支持请换成xpath。')
loc = loc[1].lstrip('./')
node = self._ele(f'xpath:./{loc}', timeout=timeout, index=index, relative=True, raise_err=False)
if node:
return node
try:
return nodes[index - 1]
except IndexError:
if Settings.raise_when_ele_not_found: if Settings.raise_when_ele_not_found:
raise ElementNotFoundError(None, 'child()', {'filter_loc': filter_loc, raise ElementNotFoundError(None, 'child()', {'filter_loc': filter_loc, 'index': index,
'index': index, 'ele_only': ele_only}) 'ele_only': ele_only})
else: else:
return NoneElement(self.page, 'child()', {'filter_loc': filter_loc, return NoneElement(self.page, 'child()', {'filter_loc': filter_loc, 'index': index, 'ele_only': ele_only})
'index': index, 'ele_only': ele_only})
def prev(self, filter_loc='', index=1, timeout=None, ele_only=True): def prev(self, filter_loc='', index=1, timeout=None, ele_only=True):
"""返回前面的一个兄弟元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回前面的一个兄弟元素,可用查询语法筛选,可指定返回筛选结果的第几个
@ -180,17 +179,7 @@ class DrissionElement(BaseElement):
:param ele_only: 是否只获取元素为False时把文本注释节点也纳入 :param ele_only: 是否只获取元素为False时把文本注释节点也纳入
:return: 兄弟元素 :return: 兄弟元素
""" """
if isinstance(filter_loc, int): return self._do_relative_find('prev()', 'preceding', filter_loc, index, timeout, ele_only)
index = filter_loc
filter_loc = ''
nodes = self._get_brothers(index, filter_loc, 'preceding', timeout=timeout, ele_only=ele_only)
if nodes:
return nodes[-1]
if Settings.raise_when_ele_not_found:
raise ElementNotFoundError(None, 'prev()', {'filter_loc': filter_loc,
'index': index, 'ele_only': ele_only})
else:
return NoneElement(self.page, 'prev()', {'filter_loc': filter_loc, 'index': index, 'ele_only': ele_only})
def next(self, filter_loc='', index=1, timeout=None, ele_only=True): def next(self, filter_loc='', index=1, timeout=None, ele_only=True):
"""返回后面的一个兄弟元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回后面的一个兄弟元素,可用查询语法筛选,可指定返回筛选结果的第几个
@ -200,17 +189,7 @@ class DrissionElement(BaseElement):
:param ele_only: 是否只获取元素为False时把文本注释节点也纳入 :param ele_only: 是否只获取元素为False时把文本注释节点也纳入
:return: 兄弟元素 :return: 兄弟元素
""" """
if isinstance(filter_loc, int): return self._do_relative_find('next()', 'following', filter_loc, index, timeout, ele_only)
index = filter_loc
filter_loc = ''
nodes = self._get_brothers(index, filter_loc, 'following', timeout=timeout, ele_only=ele_only)
if nodes:
return nodes[0]
if Settings.raise_when_ele_not_found:
raise ElementNotFoundError(None, 'next()', {'filter_loc': filter_loc,
'index': index, 'ele_only': ele_only})
else:
return NoneElement(self.page, 'next()', {'filter_loc': filter_loc, 'index': index, 'ele_only': ele_only})
def before(self, filter_loc='', index=1, timeout=None, ele_only=True): def before(self, filter_loc='', index=1, timeout=None, ele_only=True):
"""返回前面的一个兄弟元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回前面的一个兄弟元素,可用查询语法筛选,可指定返回筛选结果的第几个
@ -220,17 +199,7 @@ class DrissionElement(BaseElement):
:param ele_only: 是否只获取元素为False时把文本注释节点也纳入 :param ele_only: 是否只获取元素为False时把文本注释节点也纳入
:return: 本元素前面的某个元素或节点 :return: 本元素前面的某个元素或节点
""" """
if isinstance(filter_loc, int): return self._do_relative_find('before()', 'preceding', filter_loc, index, timeout, ele_only)
index = filter_loc
filter_loc = ''
nodes = self._get_brothers(index, filter_loc, 'preceding', False, timeout=timeout, ele_only=ele_only)
if nodes:
return nodes[-1]
if Settings.raise_when_ele_not_found:
raise ElementNotFoundError(None, 'before()', {'filter_loc': filter_loc,
'index': index, 'ele_only': ele_only})
else:
return NoneElement(self.page, 'before()', {'filter_loc': filter_loc, 'index': index, 'ele_only': ele_only})
def after(self, filter_loc='', index=1, timeout=None, ele_only=True): def after(self, filter_loc='', index=1, timeout=None, ele_only=True):
"""返回后面的一个兄弟元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回后面的一个兄弟元素,可用查询语法筛选,可指定返回筛选结果的第几个
@ -240,17 +209,7 @@ class DrissionElement(BaseElement):
:param ele_only: 是否只获取元素为False时把文本注释节点也纳入 :param ele_only: 是否只获取元素为False时把文本注释节点也纳入
:return: 本元素后面的某个元素或节点 :return: 本元素后面的某个元素或节点
""" """
if isinstance(filter_loc, int): return self._do_relative_find('after()', 'following', filter_loc, index, timeout, ele_only)
index = filter_loc
filter_loc = ''
nodes = self._get_brothers(index, filter_loc, 'following', False, timeout, ele_only=ele_only)
if nodes:
return nodes[0]
if Settings.raise_when_ele_not_found:
raise ElementNotFoundError(None, 'after()', {'filter_loc': filter_loc,
'index': index, 'ele_only': ele_only})
else:
return NoneElement(self.page, 'after()', {'filter_loc': filter_loc, 'index': index, 'ele_only': ele_only})
def children(self, filter_loc='', timeout=None, ele_only=True): def children(self, filter_loc='', timeout=None, ele_only=True):
"""返回直接子元素元素或节点组成的列表,可用查询语法筛选 """返回直接子元素元素或节点组成的列表,可用查询语法筛选
@ -268,7 +227,7 @@ class DrissionElement(BaseElement):
loc = loc[1].lstrip('./') loc = loc[1].lstrip('./')
loc = f'xpath:./{loc}' loc = f'xpath:./{loc}'
nodes = self._ele(loc, timeout=timeout, single=False, relative=True) nodes = self._ele(loc, timeout=timeout, index=None, relative=True)
return [e for e in nodes if not (isinstance(e, str) and sub('[ \n\t\r]', '', e) == '')] return [e for e in nodes if not (isinstance(e, str) and sub('[ \n\t\r]', '', e) == '')]
def prevs(self, filter_loc='', timeout=None, ele_only=True): def prevs(self, filter_loc='', timeout=None, ele_only=True):
@ -278,7 +237,7 @@ class DrissionElement(BaseElement):
:param ele_only: 是否只获取元素为False时把文本注释节点也纳入 :param ele_only: 是否只获取元素为False时把文本注释节点也纳入
:return: 兄弟元素或节点文本组成的列表 :return: 兄弟元素或节点文本组成的列表
""" """
return self._get_brothers(filter_loc=filter_loc, direction='preceding', timeout=timeout, ele_only=ele_only) return self._get_relatives(filter_loc=filter_loc, direction='preceding', timeout=timeout, ele_only=ele_only)
def nexts(self, filter_loc='', timeout=None, ele_only=True): def nexts(self, filter_loc='', timeout=None, ele_only=True):
"""返回后面全部兄弟元素或节点组成的列表,可用查询语法筛选 """返回后面全部兄弟元素或节点组成的列表,可用查询语法筛选
@ -287,7 +246,7 @@ class DrissionElement(BaseElement):
:param ele_only: 是否只获取元素为False时把文本注释节点也纳入 :param ele_only: 是否只获取元素为False时把文本注释节点也纳入
:return: 兄弟元素或节点文本组成的列表 :return: 兄弟元素或节点文本组成的列表
""" """
return self._get_brothers(filter_loc=filter_loc, direction='following', timeout=timeout, ele_only=ele_only) return self._get_relatives(filter_loc=filter_loc, direction='following', timeout=timeout, ele_only=ele_only)
def befores(self, filter_loc='', timeout=None, ele_only=True): def befores(self, filter_loc='', timeout=None, ele_only=True):
"""返回后面全部兄弟元素或节点组成的列表,可用查询语法筛选 """返回后面全部兄弟元素或节点组成的列表,可用查询语法筛选
@ -296,7 +255,7 @@ class DrissionElement(BaseElement):
:param ele_only: 是否只获取元素为False时把文本注释节点也纳入 :param ele_only: 是否只获取元素为False时把文本注释节点也纳入
:return: 本元素前面的元素或节点组成的列表 :return: 本元素前面的元素或节点组成的列表
""" """
return self._get_brothers(filter_loc=filter_loc, direction='preceding', return self._get_relatives(filter_loc=filter_loc, direction='preceding',
brother=False, timeout=timeout, ele_only=ele_only) brother=False, timeout=timeout, ele_only=ele_only)
def afters(self, filter_loc='', timeout=None, ele_only=True): def afters(self, filter_loc='', timeout=None, ele_only=True):
@ -306,11 +265,31 @@ class DrissionElement(BaseElement):
:param ele_only: 是否只获取元素为False时把文本注释节点也纳入 :param ele_only: 是否只获取元素为False时把文本注释节点也纳入
:return: 本元素后面的元素或节点组成的列表 :return: 本元素后面的元素或节点组成的列表
""" """
return self._get_brothers(filter_loc=filter_loc, direction='following', return self._get_relatives(filter_loc=filter_loc, direction='following',
brother=False, timeout=timeout, ele_only=ele_only) brother=False, timeout=timeout, ele_only=ele_only)
def _get_brothers(self, index=None, filter_loc='', direction='following', def _do_relative_find(self, func, direction, filter_loc='', index=1, timeout=None, ele_only=True):
brother=True, timeout=.5, ele_only=True): """返回前面的一个兄弟元素,可用查询语法筛选,可指定返回筛选结果的第几个
:param func: 方法名称
:param direction: 方向'following' 'preceding'
:param filter_loc: 用于筛选的查询语法
:param index: 前面第几个查询结果1开始
:param timeout: 查找节点的超时时间
:param ele_only: 是否只获取元素为False时把文本注释节点也纳入
:return: 本元素前面的某个元素或节点
"""
if isinstance(filter_loc, int):
index = filter_loc
filter_loc = ''
node = self._get_relatives(index, filter_loc, direction, False, timeout, ele_only)
if node:
return node
if Settings.raise_when_ele_not_found:
raise ElementNotFoundError(None, func, {'filter_loc': filter_loc, 'index': index, 'ele_only': ele_only})
else:
return NoneElement(self.page, func, {'filter_loc': filter_loc, 'index': index, 'ele_only': ele_only})
def _get_relatives(self, index=None, filter_loc='', direction='following', brother=True, timeout=.5, ele_only=True):
"""按要求返回兄弟元素或节点组成的列表 """按要求返回兄弟元素或节点组成的列表
:param index: 获取第几个该参数不为None时只获取该编号的元素 :param index: 获取第几个该参数不为None时只获取该编号的元素
:param filter_loc: 用于筛选的查询语法 :param filter_loc: 用于筛选的查询语法
@ -319,8 +298,8 @@ class DrissionElement(BaseElement):
:param timeout: 查找等待时间 :param timeout: 查找等待时间
:return: 元素对象或字符串 :return: 元素对象或字符串
""" """
if index is not None and index < 1: if index is not None and index < 0:
raise ValueError('index必须大于等于1') raise ValueError('index必须大于等于0')
brother = '-sibling' if brother else '' brother = '-sibling' if brother else ''
@ -335,16 +314,11 @@ class DrissionElement(BaseElement):
loc = f'xpath:./{direction}{brother}::{loc}' loc = f'xpath:./{direction}{brother}::{loc}'
nodes = self._ele(loc, timeout=timeout, single=False, relative=True) if index is not None:
nodes = [e for e in nodes if not (isinstance(e, str) and sub('[ \n\t\r]', '', e) == '')]
if nodes and index is not None:
index = index - 1 if direction == 'following' else -index index = index - 1 if direction == 'following' else -index
try: nodes = self._ele(loc, timeout=timeout, index=index, relative=True, raise_err=False)
return [nodes[index]] if isinstance(nodes, list):
except IndexError: nodes = [e for e in nodes if not (isinstance(e, str) and sub('[ \n\t\r]', '', e) == '')]
return []
else:
return nodes return nodes
# ----------------以下属性或方法由后代实现---------------- # ----------------以下属性或方法由后代实现----------------
@ -442,11 +416,11 @@ class BasePage(BaseParser):
def get(self, url, show_errmsg=False, retry=None, interval=None): def get(self, url, show_errmsg=False, retry=None, interval=None):
pass pass
def _ele(self, loc_or_ele, timeout=None, single=True, raise_err=None, method=None): def _ele(self, loc_or_ele, timeout=None, index=0, raise_err=None, method=None):
if not loc_or_ele: if not loc_or_ele:
raise ElementNotFoundError(None, method, {'loc_or_str': loc_or_ele}) raise ElementNotFoundError(None, method, {'loc_or_str': loc_or_ele})
r = self._find_elements(loc_or_ele, timeout=timeout, single=single, raise_err=raise_err) r = self._find_elements(loc_or_ele, timeout=timeout, index=index, raise_err=raise_err)
if r or isinstance(r, list): if r or isinstance(r, list):
return r return r
@ -458,5 +432,5 @@ class BasePage(BaseParser):
return r return r
@abstractmethod @abstractmethod
def _find_elements(self, loc_or_ele, timeout=None, single=True, raise_err=None): def _find_elements(self, loc_or_ele, timeout=None, index=0, raise_err=None):
pass pass

View File

@ -6,7 +6,7 @@
@License : BSD 3-Clause. @License : BSD 3-Clause.
""" """
from abc import abstractmethod from abc import abstractmethod
from typing import Union, Tuple, List, Any from typing import Union, Tuple, List, Any, Optional
from DownloadKit import DownloadKit from DownloadKit import DownloadKit
@ -15,9 +15,12 @@ from .._elements.none_element import NoneElement
class BaseParser(object): class BaseParser(object):
def __call__(self, loc_or_str: Union[Tuple[str, str], str]): ... def __call__(self, loc_or_str: Union[Tuple[str, str], str], index: int = 0): ...
def ele(self, loc_or_ele: Union[Tuple[str, str], str, BaseElement], timeout: float = None): ... def ele(self,
loc_or_ele: Union[Tuple[str, str], str, BaseElement],
index: int = 0,
timeout: float = None): ...
def eles(self, loc_or_str: Union[Tuple[str, str], str], timeout=None): ... def eles(self, loc_or_str: Union[Tuple[str, str], str], timeout=None): ...
@ -25,15 +28,23 @@ class BaseParser(object):
@property @property
def html(self) -> str: ... def html(self) -> str: ...
def s_ele(self, loc_or_ele: Union[Tuple[str, str], str, BaseElement]): ... def s_ele(self, loc_or_ele: Union[Tuple[str, str], str, BaseElement], index: int = 0): ...
def s_eles(self, loc_or_str: Union[Tuple[str, str], str]): ... def s_eles(self, loc_or_str: Union[Tuple[str, str], str]): ...
def _ele(self, loc_or_ele, timeout: float = None, single: bool = True, def _ele(self,
raise_err: bool = None, method: str = None): ... loc_or_ele,
timeout: float = None,
index: Optional[int] = 0,
raise_err: bool = None,
method: str = None): ...
@abstractmethod @abstractmethod
def _find_elements(self, loc_or_ele, timeout: float = None, single: bool = True, raise_err: bool = None): ... def _find_elements(self,
loc_or_ele,
timeout: float = None,
index: Optional[int] = 0,
raise_err: bool = None): ...
class BaseElement(BaseParser): class BaseElement(BaseParser):
@ -45,11 +56,19 @@ class BaseElement(BaseParser):
@property @property
def tag(self) -> str: ... def tag(self) -> str: ...
def _ele(self, loc_or_str: Union[Tuple[str, str], str], timeout: float = None, single: bool = True, def _ele(self,
relative: bool = False, raise_err: bool = None, method: str = None): ... loc_or_str: Union[Tuple[str, str], str],
timeout: float = None,
index: Optional[int] = 0,
relative: bool = False,
raise_err: bool = None,
method: str = None): ...
@abstractmethod @abstractmethod
def _find_elements(self, loc_or_str, timeout: float = None, single: bool = True, relative: bool = False, def _find_elements(self, loc_or_str,
timeout: float = None,
index: Optional[int] = 0,
relative: bool = False,
raise_err: bool = None): ... raise_err: bool = None): ...
def parent(self, level_or_loc: Union[tuple, str, int] = 1): ... def parent(self, level_or_loc: Union[tuple, str, int] = 1): ...
@ -83,41 +102,80 @@ class DrissionElement(BaseElement):
def texts(self, text_node_only: bool = False) -> list: ... def texts(self, text_node_only: bool = False) -> list: ...
def parent(self, level_or_loc: Union[tuple, str, int] = 1, index: int = 1) -> Union[DrissionElement, None]: ... def parent(self,
level_or_loc: Union[tuple, str, int] = 1,
index: int = 1) -> Union[DrissionElement, None]: ...
def child(self, filter_loc: Union[tuple, str, int] = '', index: int = 1, def child(self,
timeout: float = None, ele_only: bool = True) -> Union[DrissionElement, str, NoneElement]: ... filter_loc: Union[tuple, str, int] = '',
index: int = 1,
timeout: float = None,
ele_only: bool = True) -> Union[DrissionElement, str, NoneElement]: ...
def prev(self, filter_loc: Union[tuple, str, int] = '', index: int = 1, def prev(self,
timeout: float = None, ele_only: bool = True) -> Union[DrissionElement, str, NoneElement]: ... filter_loc: Union[tuple, str, int] = '',
index: int = 1,
timeout: float = None,
ele_only: bool = True) -> Union[DrissionElement, str, NoneElement]: ...
def next(self, filter_loc: Union[tuple, str, int] = '', index: int = 1, def next(self,
timeout: float = None, ele_only: bool = True) -> Union[DrissionElement, str, NoneElement]: ... filter_loc: Union[tuple, str, int] = '',
index: int = 1,
timeout: float = None,
ele_only: bool = True) -> Union[DrissionElement, str, NoneElement]: ...
def before(self, filter_loc: Union[tuple, str, int] = '', index: int = 1, def before(self,
timeout: float = None, ele_only: bool = True) -> Union[DrissionElement, str, NoneElement]: ... filter_loc: Union[tuple, str, int] = '',
index: int = 1,
timeout: float = None,
ele_only: bool = True) -> Union[DrissionElement, str, NoneElement]: ...
def after(self, filter_loc: Union[tuple, str, int] = '', index: int = 1, def after(self,
timeout: float = None, ele_only: bool = True) -> Union[DrissionElement, str, NoneElement]: ... filter_loc: Union[tuple, str, int] = '',
index: int = 1,
timeout: float = None,
ele_only: bool = True) -> Union[DrissionElement, str, NoneElement]: ...
def children(self, filter_loc: Union[tuple, str] = '', timeout: float = None, def children(self,
filter_loc: Union[tuple, str] = '',
timeout: float = None,
ele_only: bool = True) -> List[Union[DrissionElement, str]]: ... ele_only: bool = True) -> List[Union[DrissionElement, str]]: ...
def prevs(self, filter_loc: Union[tuple, str] = '', timeout: float = None, def prevs(self,
filter_loc: Union[tuple, str] = '',
timeout: float = None,
ele_only: bool = True) -> List[Union[DrissionElement, str]]: ... ele_only: bool = True) -> List[Union[DrissionElement, str]]: ...
def nexts(self, filter_loc: Union[tuple, str] = '', timeout: float = None, def nexts(self,
filter_loc: Union[tuple, str] = '',
timeout: float = None,
ele_only: bool = True) -> List[Union[DrissionElement, str]]: ... ele_only: bool = True) -> List[Union[DrissionElement, str]]: ...
def befores(self, filter_loc: Union[tuple, str] = '', timeout: float = None, def befores(self,
filter_loc: Union[tuple, str] = '',
timeout: float = None,
ele_only: bool = True) -> List[Union[DrissionElement, str]]: ... ele_only: bool = True) -> List[Union[DrissionElement, str]]: ...
def afters(self, filter_loc: Union[tuple, str] = '', timeout: float = None, def afters(self,
filter_loc: Union[tuple, str] = '',
timeout: float = None,
ele_only: bool = True) -> List[Union[DrissionElement, str]]: ... ele_only: bool = True) -> List[Union[DrissionElement, str]]: ...
def _get_brothers(self, index: int = None, filter_loc: Union[tuple, str] = '', def _do_relative_find(self,
direction: str = 'following', brother: bool = True, func: str,
timeout: float = 0.5, ele_only: bool = True) -> List[Union[DrissionElement, str]]: ... direction: str,
filter_loc: Union[tuple, str] ='',
index: int =1,
timeout: float =None,
ele_only: bool =True) -> DrissionElement: ...
def _get_relatives(self,
index: int = None,
filter_loc: Union[tuple, str] = '',
direction: str = 'following',
brother: bool = True,
timeout: float = 0.5,
ele_only: bool = True) -> List[Union[DrissionElement, str]]: ...
# ----------------以下属性或方法由后代实现---------------- # ----------------以下属性或方法由后代实现----------------
@property @property
@ -184,8 +242,16 @@ class BasePage(BaseParser):
@abstractmethod @abstractmethod
def get(self, url: str, show_errmsg: bool = False, retry: int = None, interval: float = None): ... def get(self, url: str, show_errmsg: bool = False, retry: int = None, interval: float = None): ...
def _ele(self, loc_or_ele, timeout: float = None, single: bool = True, def _ele(self,
raise_err: bool = None, method: str = None): ... loc_or_ele,
timeout: float = None,
index: Optional[int] = 0,
raise_err: bool = None,
method: str = None): ...
@abstractmethod @abstractmethod
def _find_elements(self, loc_or_ele, timeout: float = None, single: bool = True, raise_err: bool = None): ... def _find_elements(self,
loc_or_ele,
timeout: float = None,
index: Optional[int] = 0,
raise_err: bool = None): ...

View File

@ -80,13 +80,13 @@ class ChromiumElement(DrissionElement):
attrs = [f"{attr}='{attrs[attr]}'" for attr in attrs] attrs = [f"{attr}='{attrs[attr]}'" for attr in attrs]
return f'<ChromiumElement {self.tag} {" ".join(attrs)}>' return f'<ChromiumElement {self.tag} {" ".join(attrs)}>'
def __call__(self, loc_or_str, timeout=None): def __call__(self, loc_or_str, index=0, timeout=None):
"""在内部查找元素 """在内部查找元素
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param timeout: 超时时间 :param timeout: 超时时间
:return: ChromiumElement对象或属性文本 :return: ChromiumElement对象或属性文本
""" """
return self.ele(loc_or_str, timeout) return self.ele(loc_or_str, index=index, timeout=timeout)
def __eq__(self, other): def __eq__(self, other):
return self._backend_id == getattr(other, '_backend_id', None) return self._backend_id == getattr(other, '_backend_id', None)
@ -227,8 +227,8 @@ class ChromiumElement(DrissionElement):
def parent(self, level_or_loc=1, index=1): def parent(self, level_or_loc=1, index=1):
"""返回上面某一级父元素,可指定层数或用查询语法定位 """返回上面某一级父元素,可指定层数或用查询语法定位
:param level_or_loc: 第几级父元素或定位符 :param level_or_loc: 第几级父元素1开始或定位符
:param index: 当level_or_loc传入定位符使用此参数选择第几个结果 :param index: 当level_or_loc传入定位符使用此参数选择第几个结果1开始
:return: 上级元素对象 :return: 上级元素对象
""" """
return super().parent(level_or_loc, index) return super().parent(level_or_loc, index)
@ -264,7 +264,7 @@ class ChromiumElement(DrissionElement):
return super().next(filter_loc, index, timeout, ele_only=ele_only) return super().next(filter_loc, index, timeout, ele_only=ele_only)
def before(self, filter_loc='', index=1, timeout=None, ele_only=True): def before(self, filter_loc='', index=1, timeout=None, ele_only=True):
"""返回文档中当前元素前面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回文档中当前元素前面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个
查找范围不限同级元素而是整个DOM文档 查找范围不限同级元素而是整个DOM文档
:param filter_loc: 用于筛选的查询语法 :param filter_loc: 用于筛选的查询语法
:param index: 前面第几个查询结果1开始 :param index: 前面第几个查询结果1开始
@ -275,7 +275,7 @@ class ChromiumElement(DrissionElement):
return super().before(filter_loc, index, timeout, ele_only=ele_only) return super().before(filter_loc, index, timeout, ele_only=ele_only)
def after(self, filter_loc='', index=1, timeout=None, ele_only=True): def after(self, filter_loc='', index=1, timeout=None, ele_only=True):
"""返回文档中此当前元素后面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回文档中此当前元素后面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个
查找范围不限同级元素而是整个DOM文档 查找范围不限同级元素而是整个DOM文档
:param filter_loc: 用于筛选的查询语法 :param filter_loc: 用于筛选的查询语法
:param index: 第几个查询结果1开始 :param index: 第几个查询结果1开始
@ -400,13 +400,14 @@ class ChromiumElement(DrissionElement):
""" """
run_js(self, script, as_expr, 0, args) run_js(self, script, as_expr, 0, args)
def ele(self, loc_or_str, timeout=None): def ele(self, loc_or_str, index=0, timeout=None):
"""返回当前元素下级符合条件的一个元素、属性或节点文本 """返回当前元素下级符合条件的一个元素、属性或节点文本
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param index: 获取第几个元素0开始
:param timeout: 查找元素超时时间默认与元素所在页面等待时间一致 :param timeout: 查找元素超时时间默认与元素所在页面等待时间一致
:return: ChromiumElement对象或属性文本 :return: ChromiumElement对象或属性文本
""" """
return self._ele(loc_or_str, timeout, method='ele()') return self._ele(loc_or_str, timeout, index=index, method='ele()')
def eles(self, loc_or_str, timeout=None): def eles(self, loc_or_str, timeout=None):
"""返回当前元素下级所有符合条件的子元素、属性或节点文本 """返回当前元素下级所有符合条件的子元素、属性或节点文本
@ -414,17 +415,18 @@ class ChromiumElement(DrissionElement):
:param timeout: 查找元素超时时间默认与元素所在页面等待时间一致 :param timeout: 查找元素超时时间默认与元素所在页面等待时间一致
:return: ChromiumElement对象或属性文本组成的列表 :return: ChromiumElement对象或属性文本组成的列表
""" """
return self._ele(loc_or_str, timeout=timeout, single=False) return self._ele(loc_or_str, timeout=timeout, index=None)
def s_ele(self, loc_or_str=None): def s_ele(self, loc_or_str=None, index=0):
"""查找一个符合条件的元素以SessionElement形式返回 """查找一个符合条件的元素以SessionElement形式返回
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param index: 获取第几个0开始
:return: SessionElement对象或属性文本 :return: SessionElement对象或属性文本
""" """
if self.tag in __FRAME_ELEMENT__: if self.tag in __FRAME_ELEMENT__:
r = make_session_ele(self.inner_html, loc_or_str) r = make_session_ele(self.inner_html, loc_or_str, index=index)
else: else:
r = make_session_ele(self, loc_or_str) r = make_session_ele(self, loc_or_str, index=index)
if isinstance(r, NoneElement): if isinstance(r, NoneElement):
if Settings.raise_when_ele_not_found: if Settings.raise_when_ele_not_found:
raise ElementNotFoundError(None, 's_ele()', {'loc_or_str': loc_or_str}) raise ElementNotFoundError(None, 's_ele()', {'loc_or_str': loc_or_str})
@ -439,19 +441,19 @@ class ChromiumElement(DrissionElement):
:return: SessionElement或属性文本组成的列表 :return: SessionElement或属性文本组成的列表
""" """
if self.tag in __FRAME_ELEMENT__: if self.tag in __FRAME_ELEMENT__:
return make_session_ele(self.inner_html, loc_or_str, single=False) return make_session_ele(self.inner_html, loc_or_str, index=None)
return make_session_ele(self, loc_or_str, single=False) return make_session_ele(self, loc_or_str, index=None)
def _find_elements(self, loc_or_str, timeout=None, single=True, relative=False, raise_err=None): def _find_elements(self, loc_or_str, timeout=None, index=0, relative=False, raise_err=None):
"""返回当前元素下级符合条件的子元素、属性或节点文本,默认返回第一个 """返回当前元素下级符合条件的子元素、属性或节点文本,默认返回第一个
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param timeout: 查找元素超时时间 :param timeout: 查找元素超时时间
:param single: True则返回第一个False则返回全部 :param index: 第几个结果0开始为None返回所有
:param relative: WebPage用的表示是否相对定位的参数 :param relative: WebPage用的表示是否相对定位的参数
:param raise_err: 找不到元素是是否抛出异常为None时根据全局设置 :param raise_err: 找不到元素是是否抛出异常为None时根据全局设置
:return: ChromiumElement对象或文本属性或其组成的列表 :return: ChromiumElement对象或文本属性或其组成的列表
""" """
return find_in_chromium_ele(self, loc_or_str, single, timeout, relative=relative) return find_in_chromium_ele(self, loc_or_str, index, timeout, relative=relative)
def style(self, style, pseudo_ele=''): def style(self, style, pseudo_ele=''):
"""返回元素样式属性值,可获取伪元素属性值 """返回元素样式属性值,可获取伪元素属性值
@ -806,14 +808,15 @@ class ShadowRoot(BaseElement):
def __repr__(self): def __repr__(self):
return f'<ShadowRoot in {self.parent_ele}>' return f'<ShadowRoot in {self.parent_ele}>'
def __call__(self, loc_or_str, timeout=None): def __call__(self, loc_or_str, index=0, timeout=None):
"""在内部查找元素 """在内部查找元素
ele2 = ele1('@id=ele_id') ele2 = ele1('@id=ele_id')
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param index: 获取第几个0开始
:param timeout: 超时时间 :param timeout: 超时时间
:return: 元素对象或属性文本 :return: 元素对象或属性文本
""" """
return self.ele(loc_or_str, timeout) return self.ele(loc_or_str, index=index, timeout=timeout)
def __eq__(self, other): def __eq__(self, other):
return self._backend_id == getattr(other, '_backend_id', None) return self._backend_id == getattr(other, '_backend_id', None)
@ -920,7 +923,7 @@ class ShadowRoot(BaseElement):
return NoneElement(self.page, 'next()', {'filter_loc': filter_loc, 'index': index}) return NoneElement(self.page, 'next()', {'filter_loc': filter_loc, 'index': index})
def before(self, filter_loc='', index=1): def before(self, filter_loc='', index=1):
"""返回文档中当前元素前面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回文档中当前元素前面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个
查找范围不限同级元素而是整个DOM文档 查找范围不限同级元素而是整个DOM文档
:param filter_loc: 用于筛选的查询语法 :param filter_loc: 用于筛选的查询语法
:param index: 前面第几个查询结果1开始 :param index: 前面第几个查询结果1开始
@ -935,7 +938,7 @@ class ShadowRoot(BaseElement):
return NoneElement(self.page, 'before()', {'filter_loc': filter_loc, 'index': index}) return NoneElement(self.page, 'before()', {'filter_loc': filter_loc, 'index': index})
def after(self, filter_loc='', index=1): def after(self, filter_loc='', index=1):
"""返回文档中此当前元素后面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回文档中此当前元素后面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个
查找范围不限同级元素而是整个DOM文档 查找范围不限同级元素而是整个DOM文档
:param filter_loc: 用于筛选的查询语法 :param filter_loc: 用于筛选的查询语法
:param index: 后面第几个查询结果1开始 :param index: 后面第几个查询结果1开始
@ -963,7 +966,7 @@ class ShadowRoot(BaseElement):
loc = loc[1].lstrip('./') loc = loc[1].lstrip('./')
loc = f'xpath:./{loc}' loc = f'xpath:./{loc}'
return self._ele(loc, single=False, relative=True) return self._ele(loc, index=None, relative=True)
def nexts(self, filter_loc=''): def nexts(self, filter_loc=''):
"""返回当前元素后面符合条件的同级元素或节点组成的列表,可用查询语法筛选 """返回当前元素后面符合条件的同级元素或节点组成的列表,可用查询语法筛选
@ -976,7 +979,7 @@ class ShadowRoot(BaseElement):
loc = loc[1].lstrip('./') loc = loc[1].lstrip('./')
xpath = f'xpath:./{loc}' xpath = f'xpath:./{loc}'
return self.parent_ele._ele(xpath, single=False, relative=True) return self.parent_ele._ele(xpath, index=None, relative=True)
def befores(self, filter_loc=''): def befores(self, filter_loc=''):
"""返回文档中当前元素前面符合条件的元素或节点组成的列表,可用查询语法筛选 """返回文档中当前元素前面符合条件的元素或节点组成的列表,可用查询语法筛选
@ -990,7 +993,7 @@ class ShadowRoot(BaseElement):
loc = loc[1].lstrip('./') loc = loc[1].lstrip('./')
xpath = f'xpath:./preceding::{loc}' xpath = f'xpath:./preceding::{loc}'
return self.parent_ele._ele(xpath, single=False, relative=True) return self.parent_ele._ele(xpath, index=None, relative=True)
def afters(self, filter_loc=''): def afters(self, filter_loc=''):
"""返回文档中当前元素后面符合条件的元素或节点组成的列表,可用查询语法筛选 """返回文档中当前元素后面符合条件的元素或节点组成的列表,可用查询语法筛选
@ -1001,15 +1004,16 @@ class ShadowRoot(BaseElement):
eles1 = self.nexts(filter_loc) eles1 = self.nexts(filter_loc)
loc = get_loc(filter_loc, True)[1].lstrip('./') loc = get_loc(filter_loc, True)[1].lstrip('./')
xpath = f'xpath:./following::{loc}' xpath = f'xpath:./following::{loc}'
return eles1 + self.parent_ele._ele(xpath, single=False, relative=True) return eles1 + self.parent_ele._ele(xpath, index=None, relative=True)
def ele(self, loc_or_str, timeout=None): def ele(self, loc_or_str, index=0, timeout=None):
"""返回当前元素下级符合条件的一个元素 """返回当前元素下级符合条件的一个元素
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param index: 获取第几个元素0开始
:param timeout: 查找元素超时时间默认与元素所在页面等待时间一致 :param timeout: 查找元素超时时间默认与元素所在页面等待时间一致
:return: ChromiumElement对象 :return: ChromiumElement对象
""" """
return self._ele(loc_or_str, timeout, method='ele()') return self._ele(loc_or_str, timeout, index=index, method='ele()')
def eles(self, loc_or_str, timeout=None): def eles(self, loc_or_str, timeout=None):
"""返回当前元素下级所有符合条件的子元素 """返回当前元素下级所有符合条件的子元素
@ -1017,14 +1021,15 @@ class ShadowRoot(BaseElement):
:param timeout: 查找元素超时时间默认与元素所在页面等待时间一致 :param timeout: 查找元素超时时间默认与元素所在页面等待时间一致
:return: ChromiumElement对象组成的列表 :return: ChromiumElement对象组成的列表
""" """
return self._ele(loc_or_str, timeout=timeout, single=False) return self._ele(loc_or_str, timeout=timeout, index=None)
def s_ele(self, loc_or_str=None): def s_ele(self, loc_or_str=None, index=0):
"""查找一个符合条件的元素以SessionElement形式返回处理复杂页面时效率很高 """查找一个符合条件的元素以SessionElement形式返回处理复杂页面时效率很高
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param index: 获取第几个0开始
:return: SessionElement对象或属性文本 :return: SessionElement对象或属性文本
""" """
r = make_session_ele(self, loc_or_str) r = make_session_ele(self, loc_or_str, index=index)
if isinstance(r, NoneElement): if isinstance(r, NoneElement):
r.method = 's_ele()' r.method = 's_ele()'
r.args = {'loc_or_str': loc_or_str} r.args = {'loc_or_str': loc_or_str}
@ -1035,13 +1040,13 @@ class ShadowRoot(BaseElement):
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:return: SessionElement对象 :return: SessionElement对象
""" """
return make_session_ele(self, loc_or_str, single=False) return make_session_ele(self, loc_or_str, index=None)
def _find_elements(self, loc_or_str, timeout=None, single=True, relative=False, raise_err=None): def _find_elements(self, loc_or_str, timeout=None, index=0, relative=False, raise_err=None):
"""返回当前元素下级符合条件的子元素、属性或节点文本,默认返回第一个 """返回当前元素下级符合条件的子元素、属性或节点文本,默认返回第一个
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param timeout: 查找元素超时时间 :param timeout: 查找元素超时时间
:param single: True则返回第一个False则返回全部 :param index: 第几个结果0开始为None返回所有
:param relative: WebPage用的表示是否相对定位的参数 :param relative: WebPage用的表示是否相对定位的参数
:param raise_err: 找不到元素是是否抛出异常为None时根据全局设置 :param raise_err: 找不到元素是是否抛出异常为None时根据全局设置
:return: ChromiumElement对象或其组成的列表 :return: ChromiumElement对象或其组成的列表
@ -1052,15 +1057,15 @@ class ShadowRoot(BaseElement):
def do_find(): def do_find():
if loc[0] == 'css selector': if loc[0] == 'css selector':
if single: if index == 0:
nod_id = self.page.run_cdp('DOM.querySelector', nodeId=self._node_id, selector=loc[1])['nodeId'] nod_id = self.page.run_cdp('DOM.querySelector', nodeId=self._node_id, selector=loc[1])['nodeId']
if nod_id: if nod_id:
r = make_chromium_ele(self.page, node_id=nod_id) r = make_chromium_eles(self.page, _ids=nod_id, is_obj_id=False)
return None if r is False else r return None if r is False else r
else: else:
nod_ids = self.page.run_cdp('DOM.querySelectorAll', nodeId=self._node_id, selector=loc[1])['nodeId'] nod_ids = self.page.run_cdp('DOM.querySelectorAll', nodeId=self._node_id, selector=loc[1])['nodeId']
r = make_chromium_eles(self.page, node_ids=nod_ids, single=False) r = make_chromium_eles(self.page, _ids=nod_ids, index=index, is_obj_id=False)
return None if r is False else r return None if r is False else r
else: else:
@ -1069,16 +1074,20 @@ class ShadowRoot(BaseElement):
return None return None
css = [i.css_path[61:] for i in eles] css = [i.css_path[61:] for i in eles]
if single: if index is not None:
node_id = self.page.run_cdp('DOM.querySelector', nodeId=self._node_id, selector=css[0])['nodeId'] try:
r = make_chromium_ele(self.page, node_id=node_id) node_id = self.page.run_cdp('DOM.querySelector', nodeId=self._node_id,
selector=css[index])['nodeId']
except IndexError:
return None
r = make_chromium_eles(self.page, _ids=node_id, is_obj_id=False)
return None if r is False else r return None if r is False else r
else: else:
node_ids = [self.page.run_cdp('DOM.querySelector', nodeId=self._node_id, selector=i)['nodeId'] node_ids = [self.page.run_cdp('DOM.querySelector', nodeId=self._node_id, selector=i)['nodeId']
for i in css] for i in css]
if 0 in node_ids: if 0 in node_ids:
return None return None
r = make_chromium_eles(self.page, node_ids=node_ids, single=False) r = make_chromium_eles(self.page, _ids=node_ids, index=index, is_obj_id=False)
return None if r is False else r return None if r is False else r
timeout = timeout if timeout is not None else self.page.timeout timeout = timeout if timeout is not None else self.page.timeout
@ -1090,7 +1099,7 @@ class ShadowRoot(BaseElement):
if result: if result:
return result return result
return NoneElement(self.page) if single else [] return NoneElement(self.page) if index is not None else []
def _get_node_id(self, obj_id): def _get_node_id(self, obj_id):
"""返回元素node id""" """返回元素node id"""
@ -1107,11 +1116,11 @@ class ShadowRoot(BaseElement):
return r['backendNodeId'] return r['backendNodeId']
def find_in_chromium_ele(ele, loc, single=True, timeout=None, relative=True): def find_in_chromium_ele(ele, loc, index=0, timeout=None, relative=True):
"""在chromium元素中查找 """在chromium元素中查找
:param ele: ChromiumElement对象 :param ele: ChromiumElement对象
:param loc: 元素定位元组 :param loc: 元素定位元组
:param single: True则返回第一个False则返回全部 :param index: 第几个结果为None返回所有
:param timeout: 查找元素超时时间 :param timeout: 查找元素超时时间
:param relative: WebPage用于标记是否相对定位使用 :param relative: WebPage用于标记是否相对定位使用
:return: 返回ChromiumElement元素或它们组成的列表 :return: 返回ChromiumElement元素或它们组成的列表
@ -1133,22 +1142,22 @@ def find_in_chromium_ele(ele, loc, single=True, timeout=None, relative=True):
# ---------------执行查找----------------- # ---------------执行查找-----------------
if loc[0] == 'xpath': if loc[0] == 'xpath':
return find_by_xpath(ele, loc[1], single, timeout, relative=relative) return find_by_xpath(ele, loc[1], index, timeout, relative=relative)
else: else:
return find_by_css(ele, loc[1], single, timeout) return find_by_css(ele, loc[1], index, timeout)
def find_by_xpath(ele, xpath, single, timeout, relative=True): def find_by_xpath(ele, xpath, index, timeout, relative=True):
"""执行用xpath在元素中查找元素 """执行用xpath在元素中查找元素
:param ele: 在此元素中查找 :param ele: 在此元素中查找
:param xpath: 查找语句 :param xpath: 查找语句
:param single: 是否只返回第一个结果 :param index: 第几个结果为None返回所有
:param timeout: 超时时间 :param timeout: 超时时间
:param relative: 是否相对定位 :param relative: 是否相对定位
:return: ChromiumElement或其组成的列表 :return: ChromiumElement或其组成的列表
""" """
type_txt = '9' if single else '7' type_txt = '9' if index == 0 else '7'
node_txt = 'this.contentDocument' if ele.tag in __FRAME_ELEMENT__ and not relative else 'this' node_txt = 'this.contentDocument' if ele.tag in __FRAME_ELEMENT__ and not relative else 'this'
js = make_js_for_find_ele_by_xpath(xpath, type_txt, node_txt) js = make_js_for_find_ele_by_xpath(xpath, type_txt, node_txt)
ele.page.wait.load_complete() ele.page.wait.load_complete()
@ -1170,21 +1179,28 @@ def find_by_xpath(ele, xpath, single, timeout, relative=True):
if res['result']['subtype'] == 'null' or res['result']['description'] in ('NodeList(0)', 'Array(0)'): if res['result']['subtype'] == 'null' or res['result']['description'] in ('NodeList(0)', 'Array(0)'):
return None return None
if single: if index == 0:
r = make_chromium_ele(ele.page, obj_id=res['result']['objectId']) r = make_chromium_eles(ele.page, _ids=res['result']['objectId'], is_obj_id=True)
return None if r is False else r return None if r is False else r
else: else:
# from pprint import pprint res = ele.page.run_cdp('Runtime.getProperties', objectId=res['result']['objectId'],
# for i in ele.page.run_cdp('Runtime.getProperties', ownProperties=True)['result'][:-1]
# objectId=res['result']['objectId'], if index is None:
# ownProperties=True)['result'][:-1]: r = [make_chromium_eles(ele.page, _ids=i['value']['objectId'], is_obj_id=True)
# pprint(i) if i['value']['type'] == 'object' else i['value']['value'] for i in res]
r = [make_chromium_ele(ele.page, obj_id=i['value']['objectId']) if i['value']['type'] == 'object' else return None if False in r else r
i['value']['value'] for i in ele.page.run_cdp('Runtime.getProperties',
objectId=res['result']['objectId'], else:
ownProperties=True)['result'][:-1]] try:
return None if not r or r is False in r else r res = res[index]
except IndexError:
return None
if res['value']['type'] == 'object':
r = make_chromium_eles(ele.page, _ids=res['value']['objectId'], is_obj_id=True)
else:
r = res['value']['value']
return None if r is False else r
end_time = perf_counter() + timeout end_time = perf_counter() + timeout
result = do_find() result = do_find()
@ -1194,19 +1210,19 @@ def find_by_xpath(ele, xpath, single, timeout, relative=True):
if result: if result:
return result return result
return NoneElement(ele.page) if single else [] return NoneElement(ele.page) if index is not None else []
def find_by_css(ele, selector, single, timeout): def find_by_css(ele, selector, index, timeout):
"""执行用css selector在元素中查找元素 """执行用css selector在元素中查找元素
:param ele: 在此元素中查找 :param ele: 在此元素中查找
:param selector: 查找语句 :param selector: 查找语句
:param single: 是否只返回第一个结果 :param index: 第几个结果为None返回所有
:param timeout: 超时时间 :param timeout: 超时时间
:return: ChromiumElement或其组成的列表 :return: ChromiumElement或其组成的列表
""" """
selector = selector.replace('"', r'\"') selector = selector.replace('"', r'\"')
find_all = '' if single else 'All' find_all = '' if index == 0 else 'All'
node_txt = 'this.contentDocument' if ele.tag in ('iframe', 'frame', 'shadow-root') else 'this' node_txt = 'this.contentDocument' if ele.tag in ('iframe', 'frame', 'shadow-root') else 'this'
js = f'function(){{return {node_txt}.querySelector{find_all}("{selector}");}}' js = f'function(){{return {node_txt}.querySelector{find_all}("{selector}");}}'
@ -1221,15 +1237,15 @@ def find_by_css(ele, selector, single, timeout):
if res['result']['subtype'] == 'null' or res['result']['description'] in ('NodeList(0)', 'Array(0)'): if res['result']['subtype'] == 'null' or res['result']['description'] in ('NodeList(0)', 'Array(0)'):
return None return None
if single: if index == 0:
r = make_chromium_ele(ele.page, obj_id=res['result']['objectId']) r = make_chromium_eles(ele.page, _ids=res['result']['objectId'], is_obj_id=True)
return None if r is False else r return None if r is False else r
else: else:
node_ids = [i['value']['objectId'] for i in ele.page.run_cdp('Runtime.getProperties', obj_ids = [i['value']['objectId'] for i in ele.page.run_cdp('Runtime.getProperties',
objectId=res['result']['objectId'], objectId=res['result']['objectId'],
ownProperties=True)['result'][:-1]] ownProperties=True)['result'][:-1]]
r = make_chromium_eles(ele.page, obj_ids=node_ids, single=False, ele_only=False) r = make_chromium_eles(ele.page, _ids=obj_ids, index=index, is_obj_id=True)
return None if r is False else r return None if r is False else r
end_time = perf_counter() + timeout end_time = perf_counter() + timeout
@ -1240,113 +1256,115 @@ def find_by_css(ele, selector, single, timeout):
if result: if result:
return result return result
return NoneElement(ele.page) if single else [] return NoneElement(ele.page) if index is not None else []
def make_chromium_ele(page, node_id=None, obj_id=None): def make_chromium_eles(page, _ids, index=0, is_obj_id=True):
"""根据node id或object id生成相应元素对象 """根据node id或object id生成相应元素对象
:param page: ChromiumPage对象 :param page: ChromiumPage对象
:param node_id: 元素的node id :param _ids: 元素的id列表
:param obj_id: 元素的object id :param index: 获取第几个为None返回全部
:return: ChromiumElement对象或ChromiumFrame对象生成失败返回False :param is_obj_id: 传入的id是obj id还是node id
:return: 浏览器元素对象或它们组成的列表生成失败返回False
""" """
if node_id: if is_obj_id:
node = page.driver.run('DOM.describeNode', nodeId=node_id) get_node_func = _get_node_by_obj_id
if 'error' in node: # id_txt = 'objectId'
return False
if node['node']['nodeName'] in ('#text', '#comment'):
# todo: Node()
return node['node']['nodeValue']
backend_id = node['node']['backendNodeId']
obj_id = page.run_cdp('DOM.resolveNode', nodeId=node_id)['object']['objectId']
if 'error' in obj_id:
return False
elif obj_id:
node = page.driver.run('DOM.describeNode', objectId=obj_id)
if 'error' in node:
return False
if node['node']['nodeName'] in ('#text', '#comment'):
# todo: Node()
return node['node']['nodeValue']
backend_id = node['node']['backendNodeId']
node_id = node['node']['nodeId']
else: else:
return False get_node_func = _get_node_by_node_id
# id_txt = 'nodeId'
if not isinstance(_ids, (list, tuple)):
_ids = (_ids,)
ele = ChromiumElement(page, obj_id=obj_id, node_id=node_id, backend_id=backend_id) # if not ele_only:
if ele.tag in __FRAME_ELEMENT__: if index is not None: # 获取一个
from .._pages.chromium_frame import ChromiumFrame obj_id = _ids[index]
ele = ChromiumFrame(page, ele, node) return get_node_func(page, obj_id)
return ele else: # 获取全部
def make_chromium_eles(page, node_ids=None, obj_ids=None, single=True, ele_only=True):
"""根据node id或object id生成相应元素对象
:param page: ChromiumPage对象
:param node_ids: 元素的node id
:param obj_ids: 元素的object id
:param single: 是否获取但个元素
:param ele_only: 是否只要ele
:return: ChromiumElement对象或ChromiumFrame对象生成失败返回False
"""
nodes = [] nodes = []
if node_ids: for obj_id in _ids:
for node_id in node_ids: tmp = get_node_func(page, obj_id)
if not node_id: if tmp is False:
return False return False
node = page.driver.run('DOM.describeNode', nodeId=node_id) nodes.append(tmp)
return nodes
# if index is None:
# nodes = []
# for obj_id in _ids:
# tmp = get_node_func(page, obj_id)
# if tmp is False:
# return False
# if not isinstance(tmp, str):
# nodes.append(tmp)
# return nodes
#
# ids_count = len(_ids)
# if index < 0:
# index = ids_count + index
# if index > ids_count - 1:
# return False
#
# tmp = get_node_func(page, _ids[index])
# if not isinstance(tmp, str):
# return tmp
#
# num = -1
# for obj_id in _ids:
# node = _get_node_info(page, id_txt, obj_id)
# if node is False:
# return False
# if node['node']['nodeName'] in ('#text', '#comment'):
# continue
# num += 1
# if num == index:
# return _make_ele(page, obj_id, node)
# return NoneElement(page)
def _get_node_info(page, id_type, _id):
if not _id:
return False
arg = {id_type: _id}
node = page.driver.run('DOM.describeNode', **arg)
if 'error' in node: if 'error' in node:
return False return False
return node
def _get_node_by_obj_id(page, obj_id):
node = _get_node_info(page, 'objectId', obj_id)
if node is False:
return False
if node['node']['nodeName'] in ('#text', '#comment'): if node['node']['nodeName'] in ('#text', '#comment'):
if ele_only:
continue
else:
if single:
return node['node']['nodeValue'] return node['node']['nodeValue']
else: else:
nodes.append(node['node']['nodeValue']) return _make_ele(page, obj_id, node)
def _get_node_by_node_id(page, node_id):
node = _get_node_info(page, 'nodeId', node_id)
if node is False:
return False
if node['node']['nodeName'] in ('#text', '#comment'):
return node['node']['nodeValue']
else:
obj_id = page.driver.run('DOM.resolveNode', nodeId=node_id) obj_id = page.driver.run('DOM.resolveNode', nodeId=node_id)
if 'error' in obj_id: if 'error' in obj_id:
return False return False
obj_id = obj_id['object']['objectId'] obj_id = obj_id['object']['objectId']
ele = ChromiumElement(page, obj_id=obj_id, node_id=node_id, backend_id=node['node']['backendNodeId']) return _make_ele(page, obj_id, node)
if ele.tag in __FRAME_ELEMENT__:
from .._pages.chromium_frame import ChromiumFrame
ele = ChromiumFrame(page, ele, node)
if single:
return ele
nodes.append(ele)
if obj_ids:
for obj_id in obj_ids:
if not obj_id:
return False
node = page.driver.run('DOM.describeNode', objectId=obj_id)
if 'error' in node:
return False
if node['node']['nodeName'] in ('#text', '#comment'):
if ele_only:
continue
else:
if single:
return node['node']['nodeValue']
else:
nodes.append(node['node']['nodeValue'])
def _make_ele(page, obj_id, node):
ele = ChromiumElement(page, obj_id=obj_id, node_id=node['node']['nodeId'], ele = ChromiumElement(page, obj_id=obj_id, node_id=node['node']['nodeId'],
backend_id=node['node']['backendNodeId']) backend_id=node['node']['backendNodeId'])
if ele.tag in __FRAME_ELEMENT__: if ele.tag in __FRAME_ELEMENT__:
from .._pages.chromium_frame import ChromiumFrame from .._pages.chromium_frame import ChromiumFrame
ele = ChromiumFrame(page, ele, node) ele = ChromiumFrame(page, ele, node)
if single:
return ele return ele
nodes.append(ele)
return NoneElement(page) if single and not nodes else nodes
def make_js_for_find_ele_by_xpath(xpath, type_txt, node_txt): def make_js_for_find_ele_by_xpath(xpath, type_txt, node_txt):
@ -1470,7 +1488,7 @@ def parse_js_result(page, ele, result):
elif class_name == 'HTMLDocument': elif class_name == 'HTMLDocument':
return result return result
else: else:
r = make_chromium_ele(page, obj_id=result['objectId']) r = make_chromium_eles(page, _ids=result['objectId'])
if r is False: if r is False:
raise ElementLostError raise ElementLostError
return r return r

View File

@ -6,7 +6,7 @@
@License : BSD 3-Clause. @License : BSD 3-Clause.
""" """
from pathlib import Path from pathlib import Path
from typing import Union, Tuple, List, Any, Literal from typing import Union, Tuple, List, Any, Literal, Optional
from .none_element import NoneElement from .none_element import NoneElement
from .._base.base import DrissionElement, BaseElement from .._base.base import DrissionElement, BaseElement
@ -47,7 +47,9 @@ class ChromiumElement(DrissionElement):
def __repr__(self) -> str: ... def __repr__(self) -> str: ...
def __call__(self, loc_or_str: Union[Tuple[str, str], str], def __call__(self,
loc_or_str: Union[Tuple[str, str], str],
index: int = 0,
timeout: float = None) -> Union[ChromiumElement, NoneElement]: ... timeout: float = None) -> Union[ChromiumElement, NoneElement]: ...
def __eq__(self, other: ChromiumElement) -> bool: ... def __eq__(self, other: ChromiumElement) -> bool: ...
@ -175,20 +177,23 @@ class ChromiumElement(DrissionElement):
def ele(self, def ele(self,
loc_or_str: Union[Tuple[str, str], str], loc_or_str: Union[Tuple[str, str], str],
index: int = 0,
timeout: float = None) -> Union[ChromiumElement, NoneElement]: ... timeout: float = None) -> Union[ChromiumElement, NoneElement]: ...
def eles(self, def eles(self,
loc_or_str: Union[Tuple[str, str], str], loc_or_str: Union[Tuple[str, str], str],
timeout: float = None) -> List[ChromiumElement]: ... timeout: float = None) -> List[ChromiumElement]: ...
def s_ele(self, loc_or_str: Union[Tuple[str, str], str] = None) -> Union[SessionElement, NoneElement]: ... def s_ele(self,
loc_or_str: Union[Tuple[str, str], str] = None,
index: int = 0) -> Union[SessionElement, NoneElement]: ...
def s_eles(self, loc_or_str: Union[Tuple[str, str], str] = None) -> List[SessionElement]: ... def s_eles(self, loc_or_str: Union[Tuple[str, str], str] = None) -> List[SessionElement]: ...
def _find_elements(self, def _find_elements(self,
loc_or_str: Union[Tuple[str, str], str], loc_or_str: Union[Tuple[str, str], str],
timeout: float = None, timeout: float = None,
single: bool = True, index: Optional[int] = True,
relative: bool = False, relative: bool = False,
raise_err: bool = False) -> Union[ChromiumElement, ChromiumFrame, NoneElement, raise_err: bool = False) -> Union[ChromiumElement, ChromiumFrame, NoneElement,
List[Union[ChromiumElement, ChromiumFrame]]]: ... List[Union[ChromiumElement, ChromiumFrame]]]: ...
@ -286,20 +291,28 @@ class ShadowRoot(BaseElement):
def afters(self, filter_loc: Union[tuple, str] = '') -> List[ChromiumElement]: ... def afters(self, filter_loc: Union[tuple, str] = '') -> List[ChromiumElement]: ...
def ele(self, loc_or_str: Union[Tuple[str, str], str], def ele(self,
loc_or_str: Union[Tuple[str, str], str],
index: int = 0,
timeout: float = None) -> Union[ChromiumElement, NoneElement]: ... timeout: float = None) -> Union[ChromiumElement, NoneElement]: ...
def eles(self, loc_or_str: Union[Tuple[str, str], str], def eles(self,
loc_or_str: Union[Tuple[str, str], str],
timeout: float = None) -> List[ChromiumElement]: ... timeout: float = None) -> List[ChromiumElement]: ...
def s_ele(self, loc_or_str: Union[Tuple[str, str], str] = None) -> Union[SessionElement, NoneElement]: ... def s_ele(self,
loc_or_str: Union[Tuple[str, str], str] = None,
index: int = 0) -> Union[SessionElement, NoneElement]: ...
def s_eles(self, loc_or_str: Union[Tuple[str, str], str]) -> List[SessionElement]: ... def s_eles(self, loc_or_str: Union[Tuple[str, str], str]) -> List[SessionElement]: ...
def _find_elements(self, loc_or_str: Union[Tuple[str, str], str], timeout: float = None, def _find_elements(self,
single: bool = True, relative: bool = False, raise_err: bool = None) \ loc_or_str: Union[Tuple[str, str], str],
-> Union[ChromiumElement, ChromiumFrame, NoneElement, str, List[Union[ChromiumElement, timeout: float = None,
ChromiumFrame, str]]]: ... index: Optional[int] = 0,
relative: bool = False,
raise_err: bool = None) -> Union[ChromiumElement, ChromiumFrame, NoneElement, str,
List[Union[ChromiumElement, ChromiumFrame, str]]]: ...
def _get_node_id(self, obj_id: str) -> int: ... def _get_node_id(self, obj_id: str) -> int: ...
@ -308,37 +321,42 @@ class ShadowRoot(BaseElement):
def _get_backend_id(self, node_id: int) -> int: ... def _get_backend_id(self, node_id: int) -> int: ...
def find_in_chromium_ele(ele: ChromiumElement, loc: Union[str, Tuple[str, str]], def find_in_chromium_ele(ele: ChromiumElement,
single: bool = True, timeout: float = None, relative: bool = True) \ loc: Union[str, Tuple[str, str]],
-> Union[ChromiumElement, NoneElement, List[ChromiumElement]]: ... index: Optional[int] = 0,
timeout: float = None,
relative: bool = True) -> Union[ChromiumElement, NoneElement, List[ChromiumElement]]: ...
def find_by_xpath(ele: ChromiumElement, xpath: str, single: bool, timeout: float, def find_by_xpath(ele: ChromiumElement,
xpath: str,
index: Optional[int],
timeout: float,
relative: bool = True) -> Union[ChromiumElement, List[ChromiumElement], NoneElement]: ... relative: bool = True) -> Union[ChromiumElement, List[ChromiumElement], NoneElement]: ...
def find_by_css(ele: ChromiumElement, selector: str, single: bool, def find_by_css(ele: ChromiumElement,
selector: str,
index: Optional[int],
timeout: float) -> Union[ChromiumElement, List[ChromiumElement], NoneElement]: ... timeout: float) -> Union[ChromiumElement, List[ChromiumElement], NoneElement]: ...
def make_chromium_ele(page: Union[ChromiumBase, ChromiumPage, WebPage, ChromiumTab, ChromiumFrame],
node_id: int = ...,
obj_id: str = ...) -> Union[ChromiumElement, ChromiumFrame, str]: ...
def make_chromium_eles(page: Union[ChromiumBase, ChromiumPage, WebPage, ChromiumTab, ChromiumFrame], def make_chromium_eles(page: Union[ChromiumBase, ChromiumPage, WebPage, ChromiumTab, ChromiumFrame],
node_ids: Union[tuple, list] = None, _ids: Union[tuple, list, str, int],
obj_ids: Union[tuple, list] = None, index: Optional[int] = 0,
single: bool = True, is_obj_id: bool = True
ele_only: bool = True) -> Union[ChromiumElement, ChromiumFrame, NoneElement, ) -> Union[ChromiumElement, ChromiumFrame, NoneElement,
List[Union[ChromiumElement, ChromiumFrame]]]: ... List[Union[ChromiumElement, ChromiumFrame]]]: ...
def make_js_for_find_ele_by_xpath(xpath: str, type_txt: str, node_txt: str) -> str: ... def make_js_for_find_ele_by_xpath(xpath: str, type_txt: str, node_txt: str) -> str: ...
def run_js(page_or_ele: Union[ChromiumBase, ChromiumElement, ShadowRoot], script: str, def run_js(page_or_ele: Union[ChromiumBase, ChromiumElement, ShadowRoot],
as_expr: bool = False, timeout: float = None, args: tuple = ...) -> Any: ... script: str,
as_expr: bool = False,
timeout: float = None,
args: tuple = ...) -> Any: ...
def parse_js_result(page: ChromiumBase, ele: ChromiumElement, result: dict): ... def parse_js_result(page: ChromiumBase, ele: ChromiumElement, result: dict): ...

View File

@ -119,7 +119,7 @@ class SessionElement(DrissionElement):
return super().next(filter_loc, index, timeout, ele_only=ele_only) return super().next(filter_loc, index, timeout, ele_only=ele_only)
def before(self, filter_loc='', index=1, timeout=None, ele_only=True): def before(self, filter_loc='', index=1, timeout=None, ele_only=True):
"""返回文档中当前元素前面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回文档中当前元素前面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个
查找范围不限同级元素而是整个DOM文档 查找范围不限同级元素而是整个DOM文档
:param filter_loc: 用于筛选的查询语法 :param filter_loc: 用于筛选的查询语法
:param index: 前面第几个查询结果1开始 :param index: 前面第几个查询结果1开始
@ -130,7 +130,7 @@ class SessionElement(DrissionElement):
return super().before(filter_loc, index, timeout, ele_only=ele_only) return super().before(filter_loc, index, timeout, ele_only=ele_only)
def after(self, filter_loc='', index=1, timeout=None, ele_only=True): def after(self, filter_loc='', index=1, timeout=None, ele_only=True):
"""返回文档中此当前元素后面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回文档中此当前元素后面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个
查找范围不限同级元素而是整个DOM文档 查找范围不限同级元素而是整个DOM文档
:param filter_loc: 用于筛选的查询语法 :param filter_loc: 用于筛选的查询语法
:param index: 第几个查询结果1开始 :param index: 第几个查询结果1开始
@ -220,13 +220,14 @@ class SessionElement(DrissionElement):
else: else:
return self.inner_ele.get(attr) return self.inner_ele.get(attr)
def ele(self, loc_or_str, timeout=None): def ele(self, loc_or_str, index=0, timeout=None):
"""返回当前元素下级符合条件的一个元素、属性或节点文本 """返回当前元素下级符合条件的一个元素、属性或节点文本
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param index: 第几个元素0开始
:param timeout: 不起实际作用 :param timeout: 不起实际作用
:return: SessionElement对象或属性文本 :return: SessionElement对象或属性文本
""" """
return self._ele(loc_or_str, method='ele()') return self._ele(loc_or_str, index=index, method='ele()')
def eles(self, loc_or_str, timeout=None): def eles(self, loc_or_str, timeout=None):
"""返回当前元素下级所有符合条件的子元素、属性或节点文本 """返回当前元素下级所有符合条件的子元素、属性或节点文本
@ -234,32 +235,33 @@ class SessionElement(DrissionElement):
:param timeout: 不起实际作用 :param timeout: 不起实际作用
:return: SessionElement对象或属性文本组成的列表 :return: SessionElement对象或属性文本组成的列表
""" """
return self._ele(loc_or_str, single=False) return self._ele(loc_or_str, index=None)
def s_ele(self, loc_or_str=None): def s_ele(self, loc_or_str=None, index=0):
"""返回当前元素下级符合条件的一个元素、属性或节点文本 """返回当前元素下级符合条件的一个元素、属性或节点文本
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param index: 获取第几个0开始
:return: SessionElement对象或属性文本 :return: SessionElement对象或属性文本
""" """
return self._ele(loc_or_str, method='s_ele()') return self._ele(loc_or_str, index=index, method='s_ele()')
def s_eles(self, loc_or_str): def s_eles(self, loc_or_str):
"""返回当前元素下级所有符合条件的子元素、属性或节点文本 """返回当前元素下级所有符合条件的子元素、属性或节点文本
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:return: SessionElement对象或属性文本组成的列表 :return: SessionElement对象或属性文本组成的列表
""" """
return self._ele(loc_or_str, single=False) return self._ele(loc_or_str, index=None)
def _find_elements(self, loc_or_str, timeout=None, single=True, relative=False, raise_err=None): def _find_elements(self, loc_or_str, timeout=None, index=0, relative=False, raise_err=None):
"""返回当前元素下级符合条件的子元素、属性或节点文本,默认返回第一个 """返回当前元素下级符合条件的子元素、属性或节点文本
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param timeout: 不起实际作用用于和父类对应 :param timeout: 不起实际作用用于和父类对应
:param single: True则返回第一个False则返回全部 :param index: 第几个结果0开始为None返回所有
:param relative: WebPage用的表示是否相对定位的参数 :param relative: WebPage用的表示是否相对定位的参数
:param raise_err: 找不到元素是是否抛出异常为None时根据全局设置 :param raise_err: 找不到元素是是否抛出异常为None时根据全局设置
:return: SessionElement对象 :return: SessionElement对象
""" """
return make_session_ele(self, loc_or_str, single) return make_session_ele(self, loc_or_str, index=index)
def _get_ele_path(self, mode): def _get_ele_path(self, mode):
"""获取css路径或xpath路径 """获取css路径或xpath路径
@ -282,19 +284,18 @@ class SessionElement(DrissionElement):
return f'{path_str[1:]}' if mode == 'css' else path_str return f'{path_str[1:]}' if mode == 'css' else path_str
def make_session_ele(html_or_ele, loc=None, single=True): def make_session_ele(html_or_ele, loc=None, index=0):
"""从接收到的对象或html文本中查找元素返回SessionElement对象 """从接收到的对象或html文本中查找元素返回SessionElement对象
如要直接从html生成SessionElement而不在下级查找loc输入None即可 如要直接从html生成SessionElement而不在下级查找loc输入None即可
:param html_or_ele: html文本BaseParser对象 :param html_or_ele: html文本BaseParser对象
:param loc: 定位元组或字符串为None时不在下级查找返回根元素 :param loc: 定位元组或字符串为None时不在下级查找返回根元素
:param single: True则返回第一个False则返回全部 :param index: 获取第几个元素None获取所有
:return: 返回SessionElement元素或列表或属性文本 :return: 返回SessionElement元素或列表或属性文本
""" """
# ---------------处理定位符--------------- # ---------------处理定位符---------------
if not loc: if not loc:
if isinstance(html_or_ele, SessionElement): if isinstance(html_or_ele, SessionElement):
return html_or_ele if single else [html_or_ele] return html_or_ele
loc = ('xpath', '.') loc = ('xpath', '.')
elif isinstance(loc, (str, tuple)): elif isinstance(loc, (str, tuple)):
@ -368,16 +369,25 @@ def make_session_ele(html_or_ele, loc=None, single=True):
# ---------------执行查找----------------- # ---------------执行查找-----------------
try: try:
if loc[0] == 'xpath': # 用lxml内置方法获取lxml的元素对象列表 if loc[0] == 'xpath': # 用lxml内置方法获取lxml的元素对象列表
ele = html_or_ele.xpath(loc[1]) eles = html_or_ele.xpath(loc[1])
else: # 用css selector获取元素对象列表 else: # 用css selector获取元素对象列表
ele = html_or_ele.cssselect(loc[1]) eles = html_or_ele.cssselect(loc[1])
if not isinstance(ele, list): # 结果不是列表,如数字 if not isinstance(eles, list): # 结果不是列表,如数字
return ele return eles
# 把lxml元素对象包装成SessionElement对象并按需要返回第一个或全部 # 把lxml元素对象包装成SessionElement对象并按需要返回一个或全部
if single: if index is None:
ele = ele[0] if ele else None return [SessionElement(e, page) if isinstance(e, HtmlElement) else e for e in eles if e != '\n']
else:
eles_count = len(eles)
if index < 0:
index = eles_count + index
if index > eles_count - 1:
return NoneElement(page)
ele = eles[index]
if isinstance(ele, HtmlElement): if isinstance(ele, HtmlElement):
return SessionElement(ele, page) return SessionElement(ele, page)
elif isinstance(ele, str): elif isinstance(ele, str):
@ -385,9 +395,6 @@ def make_session_ele(html_or_ele, loc=None, single=True):
else: else:
return NoneElement(page) return NoneElement(page)
else: # 返回全部
return [SessionElement(e, page) if isinstance(e, HtmlElement) else e for e in ele if e != '\n']
except Exception as e: except Exception as e:
if 'Invalid expression' in str(e): if 'Invalid expression' in str(e):
raise SyntaxError(f'无效的xpath语句{loc}') raise SyntaxError(f'无效的xpath语句{loc}')

View File

@ -30,6 +30,7 @@ class SessionElement(DrissionElement):
def __call__(self, def __call__(self,
loc_or_str: Union[Tuple[str, str], str], loc_or_str: Union[Tuple[str, str], str],
index: int = 0,
timeout: float = None) -> Union[SessionElement, NoneElement]: ... timeout: float = None) -> Union[SessionElement, NoneElement]: ...
def __eq__(self, other: SessionElement) -> bool: ... def __eq__(self, other: SessionElement) -> bool: ...
@ -115,6 +116,7 @@ class SessionElement(DrissionElement):
def ele(self, def ele(self,
loc_or_str: Union[Tuple[str, str], str], loc_or_str: Union[Tuple[str, str], str],
index: int = 0,
timeout: float = None) -> Union[SessionElement, NoneElement]: ... timeout: float = None) -> Union[SessionElement, NoneElement]: ...
def eles(self, def eles(self,
@ -122,18 +124,17 @@ class SessionElement(DrissionElement):
timeout: float = None) -> List[SessionElement]: ... timeout: float = None) -> List[SessionElement]: ...
def s_ele(self, def s_ele(self,
loc_or_str: Union[Tuple[str, str], str] = None) -> Union[SessionElement, NoneElement]: ... loc_or_str: Union[Tuple[str, str], str] = None,
index: int = 0) -> Union[SessionElement, NoneElement]: ...
def s_eles(self, def s_eles(self, loc_or_str: Union[Tuple[str, str], str]) -> List[SessionElement]: ...
loc_or_str: Union[Tuple[str, str], str]) -> List[SessionElement]: ...
def _find_elements(self, def _find_elements(self,
loc_or_str: Union[Tuple[str, str], str], loc_or_str: Union[Tuple[str, str], str],
timeout: float = None, timeout: float = None,
single: bool = True, index: Optional[int] = 0,
relative: bool = False, relative: bool = False,
raise_err: bool = None) \ raise_err: bool = None) -> Union[SessionElement, NoneElement, List[SessionElement]]: ...
-> Union[SessionElement, NoneElement, List[SessionElement]]: ...
def _get_ele_path(self, mode: str) -> str: ... def _get_ele_path(self, mode: str) -> str: ...
@ -141,5 +142,4 @@ class SessionElement(DrissionElement):
def make_session_ele(html_or_ele: Union[str, SessionElement, SessionPage, ChromiumElement, BaseElement, ChromiumFrame, def make_session_ele(html_or_ele: Union[str, SessionElement, SessionPage, ChromiumElement, BaseElement, ChromiumFrame,
ChromiumBase], ChromiumBase],
loc: Union[str, Tuple[str, str]] = None, loc: Union[str, Tuple[str, str]] = None,
single: bool = True) -> Union[ index: Optional[int] = 0) -> Union[SessionElement, NoneElement, List[SessionElement]]: ...
SessionElement, NoneElement, List[SessionElement]]: ...

View File

@ -244,14 +244,15 @@ class ChromiumBase(BasePage):
self.run_cdp('Page.setInterceptFileChooserDialog', enabled=False) self.run_cdp('Page.setInterceptFileChooserDialog', enabled=False)
self._upload_list = None self._upload_list = None
def __call__(self, loc_or_str, timeout=None): def __call__(self, loc_or_str, index=0, timeout=None):
"""在内部查找元素 """在内部查找元素
ele = page('@id=ele_id') ele = page('@id=ele_id')
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param index: 获取第几个元素0开始
:param timeout: 超时时间 :param timeout: 超时时间
:return: ChromiumElement对象 :return: ChromiumElement对象
""" """
return self.ele(loc_or_str, timeout) return self.ele(loc_or_str, index, timeout)
def _wait_to_stop(self): def _wait_to_stop(self):
"""eager策略超时时使页面停止加载""" """eager策略超时时使页面停止加载"""
@ -490,13 +491,14 @@ class ChromiumBase(BasePage):
return [{'name': cookie['name'], 'value': cookie['value'], 'domain': cookie['domain']} return [{'name': cookie['name'], 'value': cookie['value'], 'domain': cookie['domain']}
for cookie in cookies] for cookie in cookies]
def ele(self, loc_or_ele, timeout=None): def ele(self, loc_or_ele, index=0, timeout=None):
"""获取一个符合条件的元素对象 """获取一个符合条件的元素对象
:param loc_or_ele: 定位符或元素对象 :param loc_or_ele: 定位符或元素对象
:param index: 获取第几个元素0开始
:param timeout: 查找超时时间 :param timeout: 查找超时时间
:return: ChromiumElement对象 :return: ChromiumElement对象
""" """
return self._ele(loc_or_ele, timeout=timeout, method='ele()') return self._ele(loc_or_ele, timeout=timeout, index=index, method='ele()')
def eles(self, loc_or_str, timeout=None): def eles(self, loc_or_str, timeout=None):
"""获取所有符合条件的元素对象 """获取所有符合条件的元素对象
@ -504,14 +506,15 @@ class ChromiumBase(BasePage):
:param timeout: 查找超时时间 :param timeout: 查找超时时间
:return: ChromiumElement对象组成的列表 :return: ChromiumElement对象组成的列表
""" """
return self._ele(loc_or_str, timeout=timeout, single=False) return self._ele(loc_or_str, timeout=timeout, index=None)
def s_ele(self, loc_or_ele=None): def s_ele(self, loc_or_ele=None, index=0):
"""查找一个符合条件的元素以SessionElement形式返回处理复杂页面时效率很高 """查找一个符合条件的元素以SessionElement形式返回处理复杂页面时效率很高
:param loc_or_ele: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_ele: 元素的定位信息可以是loc元组或查询字符串
:param index: 获取第几个0开始
:return: SessionElement对象或属性文本 :return: SessionElement对象或属性文本
""" """
r = make_session_ele(self, loc_or_ele) r = make_session_ele(self, loc_or_ele, index=index)
if isinstance(r, NoneElement): if isinstance(r, NoneElement):
if Settings.raise_when_ele_not_found: if Settings.raise_when_ele_not_found:
raise ElementNotFoundError(None, 's_ele()', {'loc_or_ele': loc_or_ele}) raise ElementNotFoundError(None, 's_ele()', {'loc_or_ele': loc_or_ele})
@ -525,13 +528,13 @@ class ChromiumBase(BasePage):
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:return: SessionElement对象组成的列表 :return: SessionElement对象组成的列表
""" """
return make_session_ele(self, loc_or_str, single=False) return make_session_ele(self, loc_or_str, index=None)
def _find_elements(self, loc_or_ele, timeout=None, single=True, relative=False, raise_err=None): def _find_elements(self, loc_or_ele, timeout=None, index=0, relative=False, raise_err=None):
"""执行元素查找 """执行元素查找
:param loc_or_ele: 定位符或元素对象 :param loc_or_ele: 定位符或元素对象
:param timeout: 查找超时时间 :param timeout: 查找超时时间
:param single: 是否只返回第一个 :param index: 第几个结果0开始为None返回所有
:param relative: WebPage用的表示是否相对定位的参数 :param relative: WebPage用的表示是否相对定位的参数
:param raise_err: 找不到元素是是否抛出异常为None时根据全局设置 :param raise_err: 找不到元素是是否抛出异常为None时根据全局设置
:return: ChromiumElement对象或元素对象组成的列表 :return: ChromiumElement对象或元素对象组成的列表
@ -558,16 +561,28 @@ class ChromiumBase(BasePage):
while True: while True:
if num > 0: if num > 0:
num = 1 if single else num from_index = index_arg = 0
nIds = self._driver.run('DOM.getSearchResults', searchId=result['searchId'], fromIndex=0, toIndex=num) if index is None:
end_index = num
index_arg = None
elif index < 0:
from_index = index + num
end_index = from_index + 1
else:
from_index = index
end_index = from_index + 1
if from_index <= num - 1:
nIds = self._driver.run('DOM.getSearchResults', searchId=result['searchId'],
fromIndex=from_index, toIndex=end_index)
if __ERROR__ not in nIds: if __ERROR__ not in nIds:
if nIds['nodeIds'][0] != 0: if nIds['nodeIds'][0] != 0:
r = make_chromium_eles(self, node_ids=nIds['nodeIds'], single=single) r = make_chromium_eles(self, _ids=nIds['nodeIds'], index=index_arg, is_obj_id=False)
if r is not False: if r is not False:
break break
if perf_counter() >= end_time: if perf_counter() >= end_time:
return NoneElement(self) if single else [] return NoneElement(self) if index is not None else []
sleep(.1) sleep(.1)
timeout = end_time - perf_counter() timeout = end_time - perf_counter()
@ -699,7 +714,7 @@ class ChromiumBase(BasePage):
:return: ChromiumFrame对象组成的列表 :return: ChromiumFrame对象组成的列表
""" """
loc = loc or 'xpath://*[name()="iframe" or name()="frame"]' loc = loc or 'xpath://*[name()="iframe" or name()="frame"]'
frames = self._ele(loc, timeout=timeout, single=False, raise_err=False) frames = self._ele(loc, timeout=timeout, index=None, raise_err=False)
return [i for i in frames if str(type(i)).endswith(".ChromiumFrame'>")] return [i for i in frames if str(type(i)).endswith(".ChromiumFrame'>")]
def get_session_storage(self, item=None): def get_session_storage(self, item=None):

View File

@ -93,7 +93,9 @@ class ChromiumBase(BasePage):
def _d_set_runtime_settings(self) -> None: ... def _d_set_runtime_settings(self) -> None: ...
def __call__(self, loc_or_str: Union[Tuple[str, str], str, ChromiumElement], def __call__(self,
loc_or_str: Union[Tuple[str, str], str, ChromiumElement],
index: int = 0,
timeout: float = None) -> Union[ChromiumElement, NoneElement]: ... timeout: float = None) -> Union[ChromiumElement, NoneElement]: ...
@property @property
@ -177,19 +179,27 @@ class ChromiumBase(BasePage):
def get_cookies(self, as_dict: bool = False, all_domains: bool = False, def get_cookies(self, as_dict: bool = False, all_domains: bool = False,
all_info: bool = False) -> Union[list, dict]: ... all_info: bool = False) -> Union[list, dict]: ...
def ele(self, loc_or_ele: Union[Tuple[str, str], str, ChromiumElement, ChromiumFrame], def ele(self,
loc_or_ele: Union[Tuple[str, str], str, ChromiumElement, ChromiumFrame],
index: int = 0,
timeout: float = None) -> Union[ChromiumElement, NoneElement]: ... timeout: float = None) -> Union[ChromiumElement, NoneElement]: ...
def eles(self, loc_or_str: Union[Tuple[str, str], str], def eles(self,
loc_or_str: Union[Tuple[str, str], str],
timeout: float = None) -> List[ChromiumElement]: ... timeout: float = None) -> List[ChromiumElement]: ...
def s_ele(self, loc_or_ele: Union[Tuple[str, str], str] = None) \ def s_ele(self,
-> Union[SessionElement, NoneElement]: ... loc_or_ele: Union[Tuple[str, str], str] = None,
index:int = 0) -> Union[SessionElement, NoneElement]: ...
def s_eles(self, loc_or_str: Union[Tuple[str, str], str]) -> List[SessionElement]: ... def s_eles(self, loc_or_str: Union[Tuple[str, str], str]) -> List[SessionElement]: ...
def _find_elements(self, loc_or_ele: Union[Tuple[str, str], str, ChromiumElement, ChromiumFrame], def _find_elements(self,
timeout: float = None, single: bool = True, relative: bool = False, raise_err: bool = None) \ loc_or_ele: Union[Tuple[str, str], str, ChromiumElement, ChromiumFrame],
timeout: float = None,
index: Optional[int] = 0,
relative: bool = False,
raise_err: bool = None) \
-> Union[ChromiumElement, ChromiumFrame, NoneElement, List[Union[ChromiumElement, ChromiumFrame]]]: ... -> Union[ChromiumElement, ChromiumFrame, NoneElement, List[Union[ChromiumElement, ChromiumFrame]]]: ...
def refresh(self, ignore_cache: bool = False) -> None: ... def refresh(self, ignore_cache: bool = False) -> None: ...
@ -279,4 +289,4 @@ def get_mhtml(page: Union[ChromiumPage, ChromiumTab],
def get_pdf(page: Union[ChromiumPage, ChromiumTab], def get_pdf(page: Union[ChromiumPage, ChromiumTab],
path: Union[str, Path] = None, path: Union[str, Path] = None,
name: str = None, kwargs: dict=None) -> bytes: ... name: str = None, kwargs: dict = None) -> bytes: ...

View File

@ -64,14 +64,15 @@ class ChromiumFrame(ChromiumBase):
break break
sleep(.1) sleep(.1)
def __call__(self, loc_or_str, timeout=None): def __call__(self, loc_or_str, index=0, timeout=None):
"""在内部查找元素 """在内部查找元素
ele2 = ele1('@id=ele_id') ele2 = ele1('@id=ele_id')
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param index: 获取第几个0开始
:param timeout: 超时时间 :param timeout: 超时时间
:return: ChromiumElement对象或属性文本 :return: ChromiumElement对象或属性文本
""" """
return self.ele(loc_or_str, timeout) return self.ele(loc_or_str, index=index, timeout=timeout)
def __eq__(self, other): def __eq__(self, other):
return self._frame_id == getattr(other, '_frame_id', None) return self._frame_id == getattr(other, '_frame_id', None)
@ -388,8 +389,8 @@ class ChromiumFrame(ChromiumBase):
def parent(self, level_or_loc=1, index=1): def parent(self, level_or_loc=1, index=1):
"""返回上面某一级父元素,可指定层数或用查询语法定位 """返回上面某一级父元素,可指定层数或用查询语法定位
:param level_or_loc: 第几级父元素或定位符 :param level_or_loc: 第几级父元素1开始或定位符
:param index: 当level_or_loc传入定位符使用此参数选择第几个结果 :param index: 当level_or_loc传入定位符使用此参数选择第几个结果1开始
:return: 上级元素对象 :return: 上级元素对象
""" """
return self.frame_ele.parent(level_or_loc, index) return self.frame_ele.parent(level_or_loc, index)
@ -415,7 +416,7 @@ class ChromiumFrame(ChromiumBase):
return self.frame_ele.next(filter_loc, index, timeout, ele_only=ele_only) return self.frame_ele.next(filter_loc, index, timeout, ele_only=ele_only)
def before(self, filter_loc='', index=1, timeout=None, ele_only=True): def before(self, filter_loc='', index=1, timeout=None, ele_only=True):
"""返回文档中当前元素前面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回文档中当前元素前面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个
查找范围不限同级元素而是整个DOM文档 查找范围不限同级元素而是整个DOM文档
:param filter_loc: 用于筛选的查询语法 :param filter_loc: 用于筛选的查询语法
:param index: 前面第几个查询结果1开始 :param index: 前面第几个查询结果1开始
@ -426,7 +427,7 @@ class ChromiumFrame(ChromiumBase):
return self.frame_ele.before(filter_loc, index, timeout, ele_only=ele_only) return self.frame_ele.before(filter_loc, index, timeout, ele_only=ele_only)
def after(self, filter_loc='', index=1, timeout=None, ele_only=True): def after(self, filter_loc='', index=1, timeout=None, ele_only=True):
"""返回文档中此当前元素后面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个 """返回文档中此当前元素后面符合条件的一个元素,可用查询语法筛选,可指定返回筛选结果的第几个
查找范围不限同级元素而是整个DOM文档 查找范围不限同级元素而是整个DOM文档
:param filter_loc: 用于筛选的查询语法 :param filter_loc: 用于筛选的查询语法
:param index: 后面第几个查询结果1开始 :param index: 后面第几个查询结果1开始
@ -561,11 +562,11 @@ class ChromiumFrame(ChromiumBase):
self.tab.remove_ele(new_ele) self.tab.remove_ele(new_ele)
return r return r
def _find_elements(self, loc_or_ele, timeout=None, single=True, relative=False, raise_err=None): def _find_elements(self, loc_or_ele, timeout=None, index=0, relative=False, raise_err=None):
"""在frame内查找单个元素 """在frame内查找单个元素
:param loc_or_ele: 定位符或元素对象 :param loc_or_ele: 定位符或元素对象
:param timeout: 查找超时时间 :param timeout: 查找超时时间
:param single: True则返回第一个False则返回全部 :param index: 第几个结果0开始为None返回所有
:param relative: WebPage用的表示是否相对定位的参数 :param relative: WebPage用的表示是否相对定位的参数
:param raise_err: 找不到元素是是否抛出异常为None时根据全局设置 :param raise_err: 找不到元素是是否抛出异常为None时根据全局设置
:return: ChromiumElement对象 :return: ChromiumElement对象
@ -574,7 +575,7 @@ class ChromiumFrame(ChromiumBase):
return loc_or_ele return loc_or_ele
self.wait.load_complete() self.wait.load_complete()
return self.doc_ele._ele(loc_or_ele, timeout, return self.doc_ele._ele(loc_or_ele, timeout,
raise_err=raise_err) if single else self.doc_ele.eles(loc_or_ele, timeout) raise_err=raise_err) if index is not None else self.doc_ele.eles(loc_or_ele, timeout)
def _is_inner_frame(self): def _is_inner_frame(self):
"""返回当前frame是否同域""" """返回当前frame是否同域"""

View File

@ -6,7 +6,7 @@
@License : BSD 3-Clause. @License : BSD 3-Clause.
""" """
from pathlib import Path from pathlib import Path
from typing import Union, Tuple, List, Any from typing import Union, Tuple, List, Any, Optional
from .chromium_base import ChromiumBase from .chromium_base import ChromiumBase
from .chromium_page import ChromiumPage from .chromium_page import ChromiumPage
@ -44,6 +44,7 @@ class ChromiumFrame(ChromiumBase):
def __call__(self, def __call__(self,
loc_or_str: Union[Tuple[str, str], str], loc_or_str: Union[Tuple[str, str], str],
index: int = 0,
timeout: float = None) -> Union[ChromiumElement, NoneElement]: ... timeout: float = None) -> Union[ChromiumElement, NoneElement]: ...
def __eq__(self, other: ChromiumFrame) -> bool: ... def __eq__(self, other: ChromiumFrame) -> bool: ...
@ -209,7 +210,7 @@ class ChromiumFrame(ChromiumBase):
def _find_elements(self, def _find_elements(self,
loc_or_ele: Union[Tuple[str, str], str, ChromiumElement, ChromiumFrame], loc_or_ele: Union[Tuple[str, str], str, ChromiumElement, ChromiumFrame],
timeout: float = None, timeout: float = None,
single: bool = True, index: Optional[int] = 0,
relative: bool = False, relative: bool = False,
raise_err: bool = None) \ raise_err: bool = None) \
-> Union[ChromiumElement, ChromiumFrame, None, List[Union[ChromiumElement, ChromiumFrame]]]: ... -> Union[ChromiumElement, ChromiumFrame, None, List[Union[ChromiumElement, ChromiumFrame]]]: ...

View File

@ -355,20 +355,19 @@ class WebPageTab(SessionPage, ChromiumTab, BasePage):
if self._response is not None: if self._response is not None:
self._response.close() self._response.close()
def _find_elements(self, loc_or_ele, timeout=None, single=True, relative=False, raise_err=None): def _find_elements(self, loc_or_ele, timeout=None, index=0, relative=False, raise_err=None):
"""返回页面中符合条件的元素、属性或节点文本,默认返回第一个 """返回页面中符合条件的元素、属性或节点文本,默认返回第一个
:param loc_or_ele: 元素的定位信息可以是元素对象loc元组或查询字符串 :param loc_or_ele: 元素的定位信息可以是元素对象loc元组或查询字符串
:param timeout: 查找元素超时时间d模式专用 :param timeout: 查找元素超时时间d模式专用
:param single: True则返回第一个False则返回全部 :param index: 第几个结果0开始为None返回所有
:param relative: WebPage用的表示是否相对定位的参数 :param relative: WebPage用的表示是否相对定位的参数
:param raise_err: 找不到元素是是否抛出异常为None时根据全局设置 :param raise_err: 找不到元素是是否抛出异常为None时根据全局设置
:return: 元素对象或属性文本节点文本 :return: 元素对象或属性文本节点文本
""" """
if self._mode == 's': if self._mode == 's':
return super()._find_elements(loc_or_ele, single=single) return super()._find_elements(loc_or_ele, index=index)
elif self._mode == 'd': elif self._mode == 'd':
return super(SessionPage, self)._find_elements(loc_or_ele, timeout=timeout, single=single, return super(SessionPage, self)._find_elements(loc_or_ele, timeout=timeout, index=index, relative=relative)
relative=relative)
def __repr__(self): def __repr__(self):
return f'<WebPageTab browser_id={self.browser.id} tab_id={self.tab_id}>' return f'<WebPageTab browser_id={self.browser.id} tab_id={self.tab_id}>'

View File

@ -191,7 +191,11 @@ class WebPageTab(SessionPage, ChromiumTab):
@property @property
def set(self) -> WebPageTabSetter: ... def set(self) -> WebPageTabSetter: ...
def _find_elements(self, loc_or_ele: Union[Tuple[str, str], str, ChromiumElement, SessionElement, ChromiumFrame], def _find_elements(self,
timeout: float = None, single: bool = True, relative: bool = False, raise_err: bool = None) \ loc_or_ele: Union[Tuple[str, str], str, ChromiumElement, SessionElement, ChromiumFrame],
timeout: float = None,
index: Optional[int] = 0,
relative: bool = False,
raise_err: bool = None) \
-> Union[ChromiumElement, SessionElement, ChromiumFrame, NoneElement, List[SessionElement], List[ -> Union[ChromiumElement, SessionElement, ChromiumFrame, NoneElement, List[SessionElement], List[
Union[ChromiumElement, ChromiumFrame]]]: ... Union[ChromiumElement, ChromiumFrame]]]: ...

View File

@ -174,13 +174,14 @@ class SessionPage(BasePage):
""" """
return self._s_connect(url, 'post', show_errmsg, retry, interval, **kwargs) return self._s_connect(url, 'post', show_errmsg, retry, interval, **kwargs)
def ele(self, loc_or_ele, timeout=None): def ele(self, loc_or_ele, index=0, timeout=None):
"""返回页面中符合条件的一个元素、属性或节点文本 """返回页面中符合条件的一个元素、属性或节点文本
:param loc_or_ele: 元素的定位信息可以是元素对象loc元组或查询字符串 :param loc_or_ele: 元素的定位信息可以是元素对象loc元组或查询字符串
:param index: 获取第几个0开始
:param timeout: 不起实际作用用于和ChromiumElement对应便于无差别调用 :param timeout: 不起实际作用用于和ChromiumElement对应便于无差别调用
:return: SessionElement对象或属性文本 :return: SessionElement对象或属性文本
""" """
return self._ele(loc_or_ele, method='ele()') return self._ele(loc_or_ele, index=index, method='ele()')
def eles(self, loc_or_str, timeout=None): def eles(self, loc_or_str, timeout=None):
"""返回页面中所有符合条件的元素、属性或节点文本 """返回页面中所有符合条件的元素、属性或节点文本
@ -188,31 +189,33 @@ class SessionPage(BasePage):
:param timeout: 不起实际作用用于和ChromiumElement对应便于无差别调用 :param timeout: 不起实际作用用于和ChromiumElement对应便于无差别调用
:return: SessionElement对象或属性文本组成的列表 :return: SessionElement对象或属性文本组成的列表
""" """
return self._ele(loc_or_str, single=False) return self._ele(loc_or_str, index=None)
def s_ele(self, loc_or_ele=None): def s_ele(self, loc_or_ele=None, index=0):
"""返回页面中符合条件的一个元素、属性或节点文本 """返回页面中符合条件的一个元素、属性或节点文本
:param loc_or_ele: 元素的定位信息可以是元素对象loc元组或查询字符串 :param loc_or_ele: 元素的定位信息可以是元素对象loc元组或查询字符串
:param index: 获取第几个0开始
:return: SessionElement对象或属性文本 :return: SessionElement对象或属性文本
""" """
return make_session_ele(self.html) if loc_or_ele is None else self._ele(loc_or_ele, method='s_ele()') return make_session_ele(self.html) if loc_or_ele is None else self._ele(loc_or_ele,
index=index, method='s_ele()')
def s_eles(self, loc_or_str): def s_eles(self, loc_or_str):
"""返回页面中符合条件的所有元素、属性或节点文本 """返回页面中符合条件的所有元素、属性或节点文本
:param loc_or_str: 元素的定位信息可以是元素对象loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是元素对象loc元组或查询字符串
:return: SessionElement对象或属性文本 :return: SessionElement对象或属性文本
""" """
return self._ele(loc_or_str, single=False) return self._ele(loc_or_str, index=None)
def _find_elements(self, loc_or_ele, timeout=None, single=True, raise_err=None): def _find_elements(self, loc_or_ele, timeout=None, index=0, raise_err=None):
"""返回页面中符合条件的元素、属性或节点文本,默认返回第一个 """返回页面中符合条件的元素、属性或节点文本,默认返回第一个
:param loc_or_ele: 元素的定位信息可以是元素对象loc元组或查询字符串 :param loc_or_ele: 元素的定位信息可以是元素对象loc元组或查询字符串
:param timeout: 不起实际作用用于和父类对应 :param timeout: 不起实际作用用于和父类对应
:param single: True则返回第一个False则返回全部 :param index: 第几个结果0开始为None返回所有
:param raise_err: 找不到元素是是否抛出异常为None时根据全局设置 :param raise_err: 找不到元素是是否抛出异常为None时根据全局设置
:return: SessionElement对象 :return: SessionElement对象
""" """
return loc_or_ele if isinstance(loc_or_ele, SessionElement) else make_session_ele(self, loc_or_ele, single) return loc_or_ele if isinstance(loc_or_ele, SessionElement) else make_session_ele(self, loc_or_ele, index=index)
def get_cookies(self, as_dict=False, all_domains=False, all_info=False): def get_cookies(self, as_dict=False, all_domains=False, all_info=False):
"""返回cookies """返回cookies

View File

@ -106,7 +106,7 @@ class SessionPage(BasePage):
def _find_elements(self, def _find_elements(self,
loc_or_ele: Union[Tuple[str, str], str, SessionElement], loc_or_ele: Union[Tuple[str, str], str, SessionElement],
timeout: float = None, timeout: float = None,
single: bool = True, index: Optional[int] = 0,
raise_err: bool = None) \ raise_err: bool = None) \
-> Union[SessionElement, NoneElement, List[SessionElement]]: ... -> Union[SessionElement, NoneElement, List[SessionElement]]: ...

View File

@ -38,17 +38,18 @@ class WebPage(SessionPage, ChromiumPage, BasePage):
super(SessionPage, self).__init__(addr_or_opts=chromium_options, timeout=timeout) super(SessionPage, self).__init__(addr_or_opts=chromium_options, timeout=timeout)
self.change_mode(self._mode, go=False, copy_cookies=False) self.change_mode(self._mode, go=False, copy_cookies=False)
def __call__(self, loc_or_str, timeout=None): def __call__(self, loc_or_str, index=0, timeout=None):
"""在内部查找元素 """在内部查找元素
ele = page('@id=ele_id') ele = page('@id=ele_id')
:param loc_or_str: 元素的定位信息可以是loc元组或查询字符串 :param loc_or_str: 元素的定位信息可以是loc元组或查询字符串
:param index: 获取第几个0开始
:param timeout: 超时时间 :param timeout: 超时时间
:return: 子元素对象 :return: 子元素对象
""" """
if self._mode == 'd': if self._mode == 'd':
return super(SessionPage, self).__call__(loc_or_str, timeout) return super(SessionPage, self).__call__(loc_or_str, index=index, timeout=timeout)
elif self._mode == 's': elif self._mode == 's':
return super().__call__(loc_or_str) return super().__call__(loc_or_str, index=index)
@property @property
def set(self): def set(self):
@ -360,20 +361,19 @@ class WebPage(SessionPage, ChromiumPage, BasePage):
if self._response is not None: if self._response is not None:
self._response.close() self._response.close()
def _find_elements(self, loc_or_ele, timeout=None, single=True, relative=False, raise_err=None): def _find_elements(self, loc_or_ele, timeout=None, index=0, relative=False, raise_err=None):
"""返回页面中符合条件的元素、属性或节点文本,默认返回第一个 """返回页面中符合条件的元素、属性或节点文本,默认返回第一个
:param loc_or_ele: 元素的定位信息可以是元素对象loc元组或查询字符串 :param loc_or_ele: 元素的定位信息可以是元素对象loc元组或查询字符串
:param timeout: 查找元素超时时间d模式专用 :param timeout: 查找元素超时时间d模式专用
:param single: True则返回第一个False则返回全部 :param index: 第几个结果0开始为None返回所有
:param relative: WebPage用的表示是否相对定位的参数 :param relative: WebPage用的表示是否相对定位的参数
:param raise_err: 找不到元素是是否抛出异常为None时根据全局设置 :param raise_err: 找不到元素是是否抛出异常为None时根据全局设置
:return: 元素对象或属性文本节点文本 :return: 元素对象或属性文本节点文本
""" """
if self._mode == 's': if self._mode == 's':
return super()._find_elements(loc_or_ele, single=single) return super()._find_elements(loc_or_ele, index=index)
elif self._mode == 'd': elif self._mode == 'd':
return super(SessionPage, self)._find_elements(loc_or_ele, timeout=timeout, single=single, return super(SessionPage, self)._find_elements(loc_or_ele, timeout=timeout, index=index, relative=relative)
relative=relative)
def quit(self, timeout=5, force=True): def quit(self, timeout=5, force=True):
"""关闭浏览器和Session """关闭浏览器和Session

View File

@ -5,7 +5,7 @@
@Copyright: (c) 2024 by g1879, Inc. All Rights Reserved. @Copyright: (c) 2024 by g1879, Inc. All Rights Reserved.
@License : BSD 3-Clause. @License : BSD 3-Clause.
""" """
from typing import Union, Tuple, List, Any from typing import Union, Tuple, List, Any, Optional
from requests import Session, Response from requests import Session, Response
@ -38,6 +38,7 @@ class WebPage(SessionPage, ChromiumPage, BasePage):
def __call__(self, def __call__(self,
loc_or_str: Union[Tuple[str, str], str, ChromiumElement, SessionElement], loc_or_str: Union[Tuple[str, str], str, ChromiumElement, SessionElement],
index: int = 0,
timeout: float = None) -> Union[ChromiumElement, SessionElement, NoneElement]: ... timeout: float = None) -> Union[ChromiumElement, SessionElement, NoneElement]: ...
# -----------------共有属性和方法------------------- # -----------------共有属性和方法-------------------
@ -167,7 +168,7 @@ class WebPage(SessionPage, ChromiumPage, BasePage):
def _find_elements(self, def _find_elements(self,
loc_or_ele: Union[Tuple[str, str], str, ChromiumElement, SessionElement, ChromiumFrame], loc_or_ele: Union[Tuple[str, str], str, ChromiumElement, SessionElement, ChromiumFrame],
timeout: float = None, timeout: float = None,
single: bool = True, index: Optional[int] = 0,
relative: bool = False, relative: bool = False,
raise_err: bool = None) \ raise_err: bool = None) \
-> Union[ChromiumElement, SessionElement, ChromiumFrame, NoneElement, List[SessionElement], -> Union[ChromiumElement, SessionElement, ChromiumFrame, NoneElement, List[SessionElement],

View File

@ -2,7 +2,7 @@ requests
lxml lxml
cssselect cssselect
DownloadKit>=2.0.0 DownloadKit>=2.0.0
websocket-client>=1.7.0 websocket-client
click click
tldextract tldextract
psutil psutil

View File

@ -6,7 +6,7 @@ with open("README.md", "r", encoding='utf-8') as fh:
setup( setup(
name="DrissionPage", name="DrissionPage",
version="4.0.1", version="4.0.0b37",
author="g1879", author="g1879",
author_email="g1879@qq.com", author_email="g1879@qq.com",
description="Python based web automation tool. It can control the browser and send and receive data packets.", description="Python based web automation tool. It can control the browser and send and receive data packets.",
@ -23,18 +23,18 @@ setup(
'requests', 'requests',
'cssselect', 'cssselect',
'DownloadKit>=2.0.0', 'DownloadKit>=2.0.0',
'websocket-client>=1.7.0', 'websocket-client',
'click', 'click',
'tldextract', 'tldextract',
'psutil' 'psutil'
], ],
classifiers=[ classifiers=[
"Programming Language :: Python :: 3.8", "Programming Language :: Python :: 3.6",
"Development Status :: 4 - Beta", "Development Status :: 4 - Beta",
"Topic :: Utilities", "Topic :: Utilities",
"License :: OSI Approved :: BSD License", "License :: OSI Approved :: BSD License",
], ],
python_requires='>=3.8', python_requires='>=3.6',
entry_points={ entry_points={
'console_scripts': [ 'console_scripts': [
'dp = DrissionPage.commons.cli:main', 'dp = DrissionPage.commons.cli:main',