重构公用函数文件结构

2024-12-10 04:00:23 +08:00 · 2023-01-18 10:35:34 +08:00 · 2023-01-18 10:35:34 +08:00 · 1fd0d0c87f
commit 1fd0d0c87f
parent 3c1e3b9690
25 changed files with 903 additions and 873 deletions
--- a/DrissionPage/init.py
+++ b/DrissionPage/init.py
@ -3,16 +3,24 @@
@Author  :   g1879
@Contact :   g1879@qq.com
 """
 # 常用页面类
 from .chromium_page import ChromiumPage
 from .session_page import SessionPage
 from .web_page import WebPage
 # 启动配置类
 from .configs.chromium_options import ChromiumOptions
 from .configs.session_options import SessionOptions
 # 常用工具
 from .action_chains import ActionChains
 from .keys import Keys
 # 旧版页面类和启动配置类
 from .mix_page import MixPage
 from .drission import Drission
 from .configs.driver_options import DriverOptions
 from warnings import filterwarnings
 filterwarnings('ignore')
 from .mix_page import MixPage
 from .web_page import WebPage
 from .chromium_page import ChromiumPage
 from .session_page import SessionPage
 from .drission import Drission
 from .configs.driver_options import DriverOptions
 from .configs.chromium_options import ChromiumOptions
 from .configs.session_options import SessionOptions
 from .action_chains import ActionChains
--- a/DrissionPage/action_chains.py
+++ b/DrissionPage/action_chains.py
@ -5,7 +5,7 @@
 """
 from time import sleep
-from .common import location_in_viewport
+from .functions.web import location_in_viewport
 from .keys import _modifierBit, _keyDescriptionForString
--- a/DrissionPage/base.py
+++ b/DrissionPage/base.py
@ -7,7 +7,8 @@ from abc import abstractmethod
 from re import sub
 from urllib.parse import quote
-from .common import format_html, get_loc
+from .functions.web import format_html
 from .functions.locator import get_loc
 class BaseParser(object):
--- a/DrissionPage/chromium_base.py
+++ b/DrissionPage/chromium_base.py
@ -10,7 +10,8 @@ from requests import Session
 from .base import BasePage
 from .chromium_element import ChromiumElementWaiter, ChromiumScroll, ChromiumElement, run_js, make_chromium_ele
-from .common import get_loc, offset_scroll, cookies_to_tuple
+from .functions.locator import get_loc
 from .functions.web import offset_scroll, cookies_to_tuple
 from .session_element import make_session_ele
 from .chromium_driver import ChromiumDriver
--- a/DrissionPage/chromium_element.py
+++ b/DrissionPage/chromium_element.py
@ -9,8 +9,8 @@ from pathlib import Path
 from time import perf_counter, sleep
 from .base import DrissionElement, BaseElement
-from .common import make_absolute_link, get_loc, get_ele_txt, format_html, is_js_func, location_in_viewport, \
+from .functions.locator import get_loc
-    offset_scroll
+from .functions.web import make_absolute_link, get_ele_txt, format_html, is_js_func, location_in_viewport, offset_scroll
 from .keys import _keys_to_typing, _keyDescriptionForString, _keyDefinitions
 from .session_element import make_session_ele
--- a/DrissionPage/chromium_page.py
+++ b/DrissionPage/chromium_page.py
@ -13,7 +13,7 @@ from requests import Session
 from .chromium_base import Timeout, ChromiumBase
 from .chromium_driver import ChromiumDriver
 from .chromium_tab import ChromiumTab
-from .common import connect_browser
+from .functions.browser import connect_browser
 from .configs.driver_options import DriverOptions
 from .session_page import DownloadSetter
--- a/DrissionPage/common.py
+++ b/DrissionPage/common.py
@ -1,768 +0,0 @@
 # -*- coding:utf-8 -*-
 """
@Author  :   g1879
@Contact :   g1879@qq.com
 """
 from html import unescape
 from http.cookiejar import Cookie
 from pathlib import Path
 from platform import system
 from re import split, search, sub
 from shutil import rmtree
 from subprocess import Popen
 from time import perf_counter, sleep
 from urllib.parse import urlparse, urljoin, urlunparse
 from zipfile import ZipFile
 from requests import get as requests_get
 from requests.cookies import RequestsCookieJar
 # from .configs.chromium_options import ChromiumOptions
 from .configs.driver_options import DriverOptions
 def get_ele_txt(e):
    """Return all text contained in an element.

    Text nodes are gathered recursively. Outside ``<pre>`` whitespace is
    collapsed, ``<br>`` and selected tags produce line breaks, and adjacent
    table cells are separated by a tab.

    :param e: element object exposing ``tag``, ``raw_text`` and ``eles()``
    :return: text of the element, passed through ``format_html``
    """
    # Tags that do not force a line break in front of them.
    nowrap_list = ('br', 'sub', 'sup', 'em', 'strong', 'a', 'font', 'b', 'span', 's', 'i', 'del', 'ins', 'img', 'td',
                   'th', 'abbr', 'bdi', 'bdo', 'cite', 'code', 'data', 'dfn', 'kbd', 'mark', 'q', 'rp', 'rt', 'ruby',
                   'samp', 'small', 'time', 'u', 'var', 'wbr', 'button', 'slot', 'content')
    # Tags that get a line break appended after their content.
    # 'address' and 'article' must be separate entries: without the comma the
    # two literals concatenate into the meaningless tag name 'addressarticle'.
    wrap_after_list = ('p', 'div', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'ol', 'li', 'blockquote', 'header',
                       'footer', 'address', 'article', 'aside', 'main', 'nav', 'section', 'figcaption', 'summary')
    # Tags whose content is not collected as text.
    noText_list = ('script', 'style', 'video', 'audio', 'iframe', 'embed', 'noscript', 'canvas', 'template')
    # Tags separated from a preceding sibling of the same kind by a tab.
    tab_list = ('td', 'th')

    if e.tag in noText_list:
        return e.raw_text

    def get_node_txt(ele, pre: bool = False):
        """Collect the text fragments of ``ele``; ``True`` marks a ``<br>``."""
        tag = ele.tag
        if tag == 'br':
            return [True]
        if not pre and tag == 'pre':
            pre = True

        str_list = []
        if tag in noText_list and not pre:  # text inside these tags is skipped
            return str_list

        nodes = ele.eles('xpath:./text() | *')
        prev_ele = ''
        for el in nodes:
            if isinstance(el, str):  # text node
                if pre:
                    str_list.append(el)  # preformatted text is kept verbatim
                elif sub('[ \n\t\r]', '', el) != '':  # more than just whitespace
                    txt = el.replace('\n', ' ').strip(' ')
                    str_list.append(sub(r' {2,}', ' ', txt))

            else:  # element node
                if el.tag not in nowrap_list and str_list and str_list[-1] != '\n':  # break between elements
                    str_list.append('\n')
                if el.tag in tab_list and prev_ele in tab_list:  # cells of a table row
                    str_list.append('\t')

                str_list.extend(get_node_txt(el, pre))
                prev_ele = el.tag

        if tag in wrap_after_list and str_list and str_list[-1] not in ('\n', True):  # trailing break
            str_list.append('\n')

        return str_list

    re_str = get_node_txt(e)
    if re_str and re_str[-1] == '\n':
        re_str.pop()
    re_str = ''.join([i if i is not True else '\n' for i in re_str])
    return format_html(re_str)
 def get_loc(loc, translate_css=False):
    """Normalise a locator into a ``(by, value)`` tuple.

    Accepts either a selenium-style locator tuple or this library's locator
    string. When requested, a css selector is translated to xpath; if lxml
    cannot express the selector the css locator is returned unchanged.

    :param loc: selenium locator tuple or locator string
    :param translate_css: whether to translate a css selector into xpath
    :return: locator tuple
    """
    if isinstance(loc, tuple):
        result = translate_loc(loc)
    elif isinstance(loc, str):
        result = str_to_loc(loc)
    else:
        raise TypeError('loc参数只能是tuple或str。')

    if not (result[0] == 'css selector' and translate_css):
        return result

    from lxml.cssselect import CSSSelector, ExpressionError
    try:
        xpath = str(CSSSelector(result[1], translator='html').path)
    except ExpressionError:
        return result

    prefix = 'descendant-or-self::'
    if xpath.startswith(prefix):
        xpath = xpath[len(prefix):]
    return 'xpath', xpath
 def str_to_loc(loc):
    """Convert a locator string of this library into a ``(by, value)`` tuple.

    Supported lookups: attribute, tag name with attributes, text, xpath,
    css selector, id and class.
    ``@`` introduces an attribute, ``.`` a class, ``#`` an id, ``=`` means exact
    match and ``:`` means fuzzy match. A string without any control prefix is
    searched for as text.

    :param loc: locator string
    :return: tuple of locator type ('xpath' or 'css selector') and locator value
    """
    loc_by = 'xpath'
    # First pass: expand the shorthand prefixes into their long form.
    if loc.startswith('.'):
        if loc.startswith(('.=', '.:',)):
            loc = loc.replace('.', '@class', 1)
        else:
            loc = loc.replace('.', '@class=', 1)
    elif loc.startswith('#'):
        if loc.startswith(('#=', '#:',)):
            loc = loc.replace('#', '@id', 1)
        else:
            loc = loc.replace('#', '@id=', 1)
    elif loc.startswith(('t:', 't=')):
        loc = f'tag:{loc[2:]}'
    elif loc.startswith(('tx:', 'tx=')):
        loc = f'text{loc[2:]}'
    # ------------------------------------------------------------------
    # Second pass: build the locator value from the long form.
    # lookup by several attributes
    if loc.startswith('@@') and loc != '@@':
        loc_str = _make_multi_xpath_str('*', loc)
    # lookup by a single attribute
    elif loc.startswith('@') and loc != '@':
        loc_str = _make_single_xpath_str('*', loc)
    # lookup by tag name, optionally followed by attribute conditions
    elif loc.startswith(('tag:', 'tag=')) and loc not in ('tag:', 'tag='):
        at_ind = loc.find('@')
        if at_ind == -1:
            loc_str = f'//*[name()="{loc[4:]}"]'
        else:
            if loc[at_ind:].startswith('@@'):
                loc_str = _make_multi_xpath_str(loc[4:at_ind], loc[at_ind:])
            else:
                loc_str = _make_single_xpath_str(loc[4:at_ind], loc[at_ind:])
    # lookup by text: exact ('text=') or contained ('text:')
    elif loc.startswith('text='):
        loc_str = f'//*[text()={_make_search_str(loc[5:])}]'
    elif loc.startswith('text:') and loc != 'text:':
        loc_str = f'//*/text()[contains(., {_make_search_str(loc[5:])})]/..'
    # lookup by xpath, the rest of the string is used verbatim
    elif loc.startswith(('xpath:', 'xpath=')) and loc not in ('xpath:', 'xpath='):
        loc_str = loc[6:]
    elif loc.startswith(('x:', 'x=')) and loc not in ('x:', 'x='):
        loc_str = loc[2:]
    # lookup by css selector, the rest of the string is used verbatim
    elif loc.startswith(('css:', 'css=')) and loc not in ('css:', 'css='):
        loc_by = 'css selector'
        loc_str = loc[4:]
    elif loc.startswith(('c:', 'c=')) and loc not in ('c:', 'c='):
        loc_by = 'css selector'
        loc_str = loc[2:]
    # no recognised prefix: fuzzy text lookup with the whole string
    elif loc:
        loc_str = f'//*/text()[contains(., {_make_search_str(loc)})]/..'
    else:
        # empty string matches every element
        loc_str = '//*'
    return loc_by, loc_str
 def _make_single_xpath_str(tag: str, text: str) -> str:
    """Build an xpath expression for a lookup with a single attribute condition.

    :param tag: tag name, '*' for any tag
    :param text: condition string starting with '@', e.g. '@name=value'
    :return: xpath string
    """
    # A concrete tag name becomes the first predicate.
    arg_list = [] if tag == '*' else [f'name()="{tag}"']
    arg_str = txt_str = ''
    if text == '@':
        # a bare '@' selects elements that carry no attribute at all
        arg_str = 'not(@*)'
    else:
        # Split into [name, separator, value]; without a separator only
        # the name is present and the list has a single item.
        r = split(r'([:=])', text, maxsplit=1)
        len_r = len(r)
        len_r0 = len(r[0])
        if len_r != 3 and len_r0 > 1:
            # name only: test that the attribute (or non-blank text) exists
            arg_str = 'normalize-space(text())' if r[0] in ('@text()', '@tx()') else f'{r[0]}'
        elif len_r == 3 and len_r0 > 1:
            if r[1] == '=':  # exact match
                arg = '.' if r[0] in ('@text()', '@tx()') else r[0]
                arg_str = f'{arg}={_make_search_str(r[2])}'
            else:  # fuzzy match
                if r[0] in ('@text()', '@tx()'):
                    # text is matched on the text node, then stepped back up to its parent
                    txt_str = f'/text()[contains(., {_make_search_str(r[2])})]/..'
                    arg_str = ''
                else:
                    arg_str = f"contains({r[0]},{_make_search_str(r[2])})"
    if arg_str:
        arg_list.append(arg_str)
    arg_str = ' and '.join(arg_list)
    return f'//*[{arg_str}]{txt_str}' if arg_str else f'//*{txt_str}'
 def _make_multi_xpath_str(tag: str, text: str) -> str:
    """Build an xpath expression for a lookup with several attribute conditions.

    :param tag: tag name, '*' for any tag
    :param text: condition string made of '@@'-prefixed conditions
    :return: xpath string
    """
    # A concrete tag name becomes the first predicate.
    arg_list = [] if tag == '*' else [f'name()="{tag}"']
    # The text starts with '@@', so the first split item is skipped below.
    args = text.split('@@')
    for arg in args[1:]:
        # Split into [name, separator, value]; a single item means name only.
        r = split(r'([:=])', arg, maxsplit=1)
        arg_str = ''
        len_r = len(r)
        if not r[0]:  # empty name: match elements without any attribute
            arg_str = 'not(@*)'
        else:
            r[0], ignore = (r[0][1:], True) if r[0][0] == '-' else (r[0], None)  # a leading '-' negates the condition
            if len_r != 3:  # name without value: test that the attribute exists
                arg_str = 'normalize-space(text())' if r[0] in ('text()', 'tx()') else f'@{r[0]}'
            elif len_r == 3:  # both name and value are given
                arg = '.' if r[0] in ('text()', 'tx()') else f'@{r[0]}'
                if r[1] == '=':
                    arg_str = f'{arg}={_make_search_str(r[2])}'
                else:
                    arg_str = f'contains({arg},{_make_search_str(r[2])})'
            if arg_str and ignore:
                arg_str = f'not({arg_str})'
        if arg_str:
            arg_list.append(arg_str)
    # All conditions must hold at once.
    arg_str = ' and '.join(arg_list)
    return f'//*[{arg_str}]' if arg_str else f'//*'
 def _make_search_str(search_str: str) -> str:
    """将"转义，不知何故不能直接用 \ 来转义 \n
    :param search_str: 查询字符串
    :return: 把"转义后的字符串
    """
    parts = search_str.split('"')
    parts_num = len(parts)
    search_str = 'concat('
    for key, i in enumerate(parts):
        search_str += f'"{i}"'
        search_str += ',' + '\'"\',' if key < parts_num - 1 else ''
    search_str += ',"")'
    return search_str
 def translate_loc(loc):
    """Translate a selenium ``By`` style locator tuple into xpath or css selector form.

    :param loc: two-item locator tuple ``(by, value)``
    :return: locator tuple whose first item is 'xpath' or 'css selector'
    :raises ValueError: if the tuple does not have two items or ``by`` is unknown
    """
    if len(loc) != 2:
        raise ValueError('定位符长度必须为2。')

    by, value = loc[0].lower(), loc[1]

    # xpath and css selector values pass through untouched
    if by == 'css selector':
        return by, value
    if by == 'xpath':
        return 'xpath', value

    # every other locator type is rewritten as an xpath expression
    xpath_templates = {
        'id': '//*[@id="{}"]',
        'class name': '//*[@class="{}"]',
        'link text': '//a[text()="{}"]',
        'name': '//*[@name="{}"]',
        'tag name': '//{}',
        'partial link text': '//a[contains(text(),"{}")]',
    }
    if by not in xpath_templates:
        raise ValueError('无法识别的定位符。')
    return 'xpath', xpath_templates[by].format(value)
 def format_html(text):
    """Decode HTML entities and turn non-breaking spaces into plain spaces.

    :param text: html text; falsy values are returned unchanged
    :return: cleaned text
    """
    if not text:
        return text
    decoded = unescape(text)
    return decoded.replace('\xa0', ' ')
 def cookie_to_dict(cookie):
    """Convert a single cookie into a dict.

    A ``Cookie`` object yields a copy of its attributes without the
    ``rfc2109`` and ``_rest`` entries, a dict is returned as is, and a string
    such as ``'name=value; path=/'`` is parsed: the first pair fills the
    ``name`` and ``value`` keys, every following pair becomes its own key.

    :param cookie: Cookie object, str or dict
    :return: cookie dict
    :raises TypeError: if ``cookie`` is of any other type
    """
    if isinstance(cookie, Cookie):
        cookie_dict = cookie.__dict__.copy()
        cookie_dict.pop('rfc2109')
        cookie_dict.pop('_rest')
        return cookie_dict

    if isinstance(cookie, dict):
        return cookie

    if isinstance(cookie, str):
        attrs = cookie.split(',' if ',' in cookie else ';')
        cookie_dict = {}
        for index, attr in enumerate(attrs):
            # Split on the first '=' only, so values that themselves contain
            # '=' (e.g. base64 padding) are kept instead of being dropped.
            key, _, value = attr.lstrip().partition('=')
            if index == 0:
                cookie_dict['name'] = key
                cookie_dict['value'] = value
            else:
                cookie_dict[key] = value
        return cookie_dict

    raise TypeError('cookie参数必须为Cookie、str或dict类型。')
 def cookies_to_tuple(cookies):
    """Convert a collection of cookies into a tuple of cookie dicts.

    :param cookies: cookies as RequestsCookieJar, list, tuple, str or dict
    :return: tuple of cookie dicts
    :raises TypeError: if ``cookies`` is of any other type
    """
    if isinstance(cookies, (list, tuple, RequestsCookieJar)):
        return tuple(map(cookie_to_dict, cookies))

    if isinstance(cookies, str):
        # a cookie header string: one cookie per ';' separated piece
        return tuple(cookie_to_dict(piece.lstrip()) for piece in cookies.split(";"))

    if isinstance(cookies, dict):
        # a plain mapping of cookie name to cookie value
        return tuple({'name': name, 'value': value} for name, value in cookies.items())

    raise TypeError('cookies参数必须为RequestsCookieJar、list、tuple、str或dict类型。')
 def clean_folder(folder_path, ignore=None):
    """Delete everything directly inside a folder except the ignored names.

    :param folder_path: path of the folder to empty
    :param ignore: names of files and folders to keep
    :return: None
    """
    kept_names = ignore if ignore else []
    for entry in Path(folder_path).iterdir():
        if entry.name in kept_names:
            continue
        if entry.is_file():
            entry.unlink()
        elif entry.is_dir():
            rmtree(entry, True)  # True: errors while deleting are ignored
 def unzip(zip_path, to_path):
    """Extract the first member of a zip archive (used for chromedriver.zip).

    :param zip_path: path of the zip file; nothing is done when it is falsy
    :param to_path: folder to extract into
    :return: one-item list with the extracted path, or None without a zip path
    """
    if not zip_path:
        return None

    with ZipFile(zip_path, 'r') as archive:
        first_member = archive.namelist()[0]
        extracted = archive.extract(first_member, path=to_path)
        return [extracted]
 def get_exe_from_port(port):
    """Return the executable path of the first process found for a port.

    The pid comes from ``get_pid_from_port``; the path is read from the third
    line of the output of the ``wmic`` command.

    :param port: port number
    :return: executable path, or None if no pid or path could be determined
    """
    from os import popen

    pid = get_pid_from_port(port)
    if not pid:
        return None

    output = popen(f'wmic process where processid={pid} get executablepath').read()
    lines = output.split('\n')
    if len(lines) > 2:
        return lines[2].strip()
    return None
 def get_pid_from_port(port):
    """Return the pid of the first ``netstat`` entry matching a port.

    Only implemented for Windows; on any other system, or when ``port`` is
    None, the result is None. The lookup is repeated for up to 5 seconds
    while ``netstat`` reports nothing.

    :param port: port number
    :return: process id as a string, or None
    """
    from platform import system
    if port is None or system().lower() != 'windows':
        return None

    from os import popen
    from time import perf_counter

    command = f'netstat -ano |findstr {port}'

    def first_line():
        return popen(command).read().split('\n')[0]

    try:  # guards against an error that may occur under Anaconda
        line = first_line()
        started = perf_counter()
        while not line and perf_counter() - started < 5:
            line = first_line()
        # the pid is the last space-separated column of the line
        return line.split(' ')[-1] or None

    except AttributeError:
        return None
 def get_usable_path(path):
    """Return a path that does not exist yet, derived from the given one.

    The last path component is first cleaned with ``make_valid_name``. While
    the resulting path exists, a numeric suffix ``_1``, ``_2``, ... is added
    (before the extension if the path is a file).

    :param path: file or folder path
    :return: usable path as a Path object
    """
    target = Path(path)
    folder = target.parent
    target = folder / make_valid_name(target.name)

    if target.is_file():
        base, suffix = target.stem, target.suffix
    else:
        base, suffix = target.name, ''

    is_first_round = True
    while target.exists():
        numbered = search(r'(.*)_(\d+)$', base)
        if numbered and not is_first_round:
            # already numbered by a previous round: count up
            base = f'{numbered.group(1)}_{int(numbered.group(2)) + 1}'
        else:
            # a number in the original name is part of the name, so start at _1
            base = f'{base}_1'
        target = folder / f'{base}{suffix}'
        is_first_round = False

    return target
 def make_valid_name(full_name):
    """Turn a string into a usable file name.

    Surrounding whitespace is stripped, the name part is shortened until name
    plus extension fit into 255 units (as measured by ``get_long``, where a
    Chinese character counts as 2), and characters not allowed in file names
    are removed.

    :param full_name: file name
    :return: usable file name
    """
    # ---------------- strip surrounding whitespace ----------------
    full_name = full_name.strip()

    # ---------------- limit the total length to 255 ----------------
    r = search(r'(.*)(\.[^.]+$)', full_name)  # split into name and extension
    if r:
        name, ext = r.group(1), r.group(2)
        ext_long = len(ext)
    else:
        name, ext = full_name, ''
        ext_long = 0

    # Stop once the name is empty: if the extension alone exceeds the budget
    # the condition stays true and the loop would otherwise never end.
    while name and get_long(name) > 255 - ext_long:
        name = name[:-1]

    full_name = f'{name}{ext}'

    # ---------------- drop characters that are not allowed ----------------
    return sub(r'[<>/\\|:*?\n]', '', full_name)
 def get_long(txt):
    """Return the display length of a string, counting a Chinese character as 2.

    Computed from the UTF-8 size: half of the bytes beyond one per character
    are added to the character count.

    :param txt: string
    :return: length as an int
    """
    char_count = len(txt)
    extra_bytes = len(txt.encode('utf-8')) - char_count
    return extra_bytes // 2 + char_count
 def make_absolute_link(link, page=None):
    """Return the absolute form of a link, using the page url where needed.

    :param link: hyperlink
    :param page: page object exposing ``url``; without it the link is returned unchanged
    :return: absolute link
    """
    if not link:
        return link

    parts = urlparse(link)

    # relative path: join it with the page url
    if not parts.netloc:
        if page:
            return urljoin(page.url, link)
        return link

    # already complete, or nothing to take the scheme from
    if parts.scheme or not page:
        return link

    # has a host but no scheme: borrow the scheme of the page url
    page_scheme = urlparse(page.url).scheme
    return urlunparse(parts._replace(scheme=page_scheme))
 def is_js_func(func):
    """Tell whether a text looks like a javascript function.

    True when the stripped text starts with ``function`` or ``async ``, or
    contains an arrow ``=>`` anywhere.

    :param func: javascript text
    :return: bool
    """
    stripped = func.strip()
    return stripped.startswith(('function', 'async ')) or '=>' in stripped
 def port_is_using(ip, port):
    """Check whether something accepts TCP connections on the given address.

    :param ip: browser address
    :param port: browser port, int or numeric string
    :return: True if a connection could be established, otherwise False
    """
    from socket import socket, AF_INET, SOCK_STREAM
    # The context manager closes the socket even if int() or connect_ex() raises.
    with socket(AF_INET, SOCK_STREAM) as s:
        return s.connect_ex((ip, int(port))) == 0
 def connect_browser(option):
    """Connect to a running browser or launch a new one.

    Nothing is done for a non-local debugger address. If the port is already
    in use no process is started. Otherwise the browser is launched; when the
    configured path cannot be found, ``get_chrome_path`` is asked for one.

    :param option: DriverOptions object
    :return: tuple of chrome path and process object (either may be None)
    :raises FileNotFoundError: if no chrome path can be found
    """
    system_type = system().lower()
    address = option.debugger_address
    chrome_path = option.browser_path
    if address.startswith('http://'):
        address = address[7:]
    ip, port = address.split(':')

    if ip not in ('127.0.0.1', 'localhost'):
        return None, None

    # the placeholder path 'chrome' is replaced by the real executable on Windows
    resolve_exe = chrome_path == 'chrome' and system_type == 'windows'

    if port_is_using(ip, port):
        if resolve_exe:
            chrome_path = get_exe_from_port(port)
        return chrome_path, None

    args = get_launch_args(option)
    set_prefs(option)

    # ---------- create the browser process ----------
    try:
        debugger = _run_browser(port, chrome_path, args)
        if resolve_exe:
            chrome_path = get_exe_from_port(port)

    # the given path does not exist: let easy_set look for a chrome path
    except FileNotFoundError:
        from DrissionPage.easy_set import get_chrome_path
        chrome_path = get_chrome_path(show_msg=False)

        if not chrome_path:
            raise FileNotFoundError('无法找到chrome路径，请手动配置。')

        debugger = _run_browser(port, chrome_path, args)

    return chrome_path, debugger
 def get_launch_args(opt):
    """Build the command-line launch arguments from a browser options object.

    Values of ``key=value`` arguments are wrapped in double quotes unless they
    already are; extensions are merged into one ``--load-extension`` argument.

    :param opt: DriverOptions, or an object exposing ``arguments`` and ``extensions``
    :return: list of launch arguments
    """
    platform_name = system().lower()
    launch_args = []

    # ---------- arguments ----------
    for raw in opt.arguments:
        name, sep, value = raw.partition('=')
        if not sep:  # plain switch without a value
            launch_args.append(raw)
            continue

        value = value.strip()
        if value.startswith('"') and value.endswith('"'):
            launch_args.append(raw)
        else:
            launch_args.append(f'{name}="{value}"')

    # ---------- extensions ----------
    extensions = opt._extension_files if isinstance(opt, DriverOptions) else opt.extensions
    if extensions:
        unique = set(extensions)
        if platform_name == 'windows':
            joined = '"' + '","'.join(unique) + '"'
        else:
            joined = ','.join(unique)
        launch_args.append(f'--load-extension={joined}')

    return launch_args
 def set_prefs(opt):
    """Write the ``prefs`` of the launch options into the profile's Preferences file.

    Only done when prefs and a user data path are configured. The profile
    folder is taken from a ``--profile-directory`` argument and defaults to
    'Default'; a missing Preferences file is created as an empty JSON object.

    :param opt: DriverOptions, or an object exposing ``preferences``
    :return: None
    """
    # todo: support deleting pref entries
    if isinstance(opt, DriverOptions):
        prefs = opt.experimental_options.get('prefs', None)
    else:
        prefs = opt.preferences

    if not (prefs and opt.user_data_path):
        return

    profile = 'Default'
    for argument in opt.arguments:
        if argument.startswith('--profile-directory'):
            profile = argument.split('=')[-1].strip()
            break

    prefs_file = Path(opt.user_data_path) / profile / 'Preferences'
    if not prefs_file.exists():
        prefs_file.parent.mkdir(parents=True, exist_ok=True)
        with open(prefs_file, 'w') as f:
            f.write('{}')

    from json import load, dump
    with open(prefs_file, "r", encoding='utf-8') as f:
        settings = load(f)

    for dotted_key in prefs:
        value = prefs[dotted_key]
        key_path = dotted_key.split('.')
        # create the nested dicts for 'a.b.c', then assign the value
        _make_leave_in_dict(settings, key_path, 0, len(key_path))
        _set_value_to_dict(settings, key_path, value)

    with open(prefs_file, 'w', encoding='utf-8') as f:
        dump(settings, f)
 def _run_browser(port, path: str, args) -> Popen:
    """Start a chrome process and wait until it reports a page tab.

    The debugging endpoint on 127.0.0.1 is polled for up to 10 seconds.

    :param port: remote debugging port
    :param path: browser executable path
    :param args: launch arguments
    :return: process object
    :raises ConnectionError: if no page tab shows up in time
    """
    if system().lower() == 'windows':
        joined_args = ' '.join(args)
        process = Popen(f'"{path}" --remote-debugging-port={port} {joined_args}', shell=False)
    else:
        command = [path, f'--remote-debugging-port={port}'] + list(args)
        process = Popen(command, shell=False)

    started = perf_counter()
    while perf_counter() - started < 10:
        try:
            tabs = requests_get(f'http://127.0.0.1:{port}/json').json()
            if any(tab['type'] == 'page' for tab in tabs):
                return process
        except Exception:
            # not reachable yet: wait a little before the next attempt
            sleep(.2)

    raise ConnectionError('无法连接浏览器。')
 def _make_leave_in_dict(target_dict: dict, src: list, num: int, end: int) -> None:
    """把prefs中a.b.c形式的属性转为a['b']['c']形式
    :param target_dict: 要处理的dict
    :param src: 属性层级列表[a, b, c]
    :param num: 当前处理第几个
    :param end: src长度
    :return: None
    """
    if num == end:
        return
    if src[num] not in target_dict:
        target_dict[src[num]] = {}
    num += 1
    _make_leave_in_dict(target_dict[src[num - 1]], src, num, end)
 def _set_value_to_dict(target_dict: dict, src: list, value) -> None:
    """把a.b.c形式的属性的值赋值到a['b']['c']形式的字典中
    :param target_dict: 要处理的dict
    :param src: 属性层级列表[a, b, c]
    :param value: 属性值
    :return: None
    """
    src = "']['".join(src)
    src = f"target_dict['{src}']=value"
    exec(src)
 def location_in_viewport(page, loc_x, loc_y):
    """Tell whether a page coordinate currently lies inside the viewport.

    The check runs in the browser: the point is compared with the scroll
    offsets and client size of ``document.documentElement``.

    :param page: page object exposing ``run_js``
    :param loc_x: absolute x coordinate on the page
    :param loc_y: absolute y coordinate on the page
    :return: result of the script as returned by ``page.run_js``
    """
    script = f'''function(){{var x = {loc_x}; var y = {loc_y};
    const scrollLeft = document.documentElement.scrollLeft;
    const scrollTop = document.documentElement.scrollTop;
    const vWidth = document.documentElement.clientWidth;
    const vHeight = document.documentElement.clientHeight;
    if (x< scrollLeft || y < scrollTop || x > vWidth + scrollLeft || y > vHeight + scrollTop){{return false;}}
    return true;}}'''
    in_view = page.run_js(script)
    return in_view
    # alternative viewport size kept for reference:
    # const vWidth = window.innerWidth || document.documentElement.clientWidth;
    # const vHeight = window.innerHeight || document.documentElement.clientHeight;
 def offset_scroll(ele, offset_x, offset_y):
    """Scroll a point of an element into view and return its viewport coordinates.

    With an offset the point is measured from the element's top-left corner,
    without one the element's click point is used (per axis). If the point is
    outside the viewport the page is scrolled so that it ends up around the
    middle.

    :param ele: element object
    :param offset_x: offset on the x axis
    :param offset_y: offset on the y axis
    :return: tuple of the point's coordinates inside the viewport
    """
    def pick(corner, offset, click_point):
        # a falsy offset (None or 0) selects the click point
        return corner + offset if offset else click_point

    left, top = ele.location
    click_x, click_y = ele._click_point
    page_x = pick(left, offset_x, click_x)
    page_y = pick(top, offset_y, click_y)

    page = ele.page
    if not location_in_viewport(page, page_x, page_y):
        width = page.run_js('return document.body.clientWidth;')
        height = page.run_js('return document.body.clientHeight;')
        page.scroll.to_location(page_x - width // 2, page_y - height // 2)

    # read the viewport-relative positions only after a possible scroll
    view_left, view_top = ele.client_location
    view_click_x, view_click_y = ele._client_click_point
    return pick(view_left, offset_x, view_click_x), pick(view_top, offset_y, view_click_y)
--- a/DrissionPage/common.pyi
+++ b/DrissionPage/common.pyi
@ -1,81 +0,0 @@
 # -*- coding:utf-8 -*-
 """
@Author  :   g1879
@Contact :   g1879@qq.com
 """
 from http.cookiejar import Cookie
 from pathlib import Path
 from typing import Union
 from requests.cookies import RequestsCookieJar
 from .base import BasePage, DrissionElement
 from .chromium_element import ChromiumElement
 from .config import DriverOptions
 from .configs.chromium_options import ChromiumOptions
 # Type stubs for the functions of common.py.
 # -- element text and locator handling --
 def get_ele_txt(e: DrissionElement) -> str: ...
 def get_loc(loc: Union[tuple, str], translate_css: bool = False) -> tuple: ...
 def str_to_loc(loc: str) -> tuple: ...
 def translate_loc(loc: tuple) -> tuple: ...
 def format_html(text: str) -> str: ...
 # -- cookies --
 def cookie_to_dict(cookie: Union[Cookie, str, dict]) -> dict: ...
 def cookies_to_tuple(cookies: Union[RequestsCookieJar, list, tuple, str, dict]) -> tuple: ...
 # -- files, paths, ports and processes --
 def clean_folder(folder_path: str, ignore: list = None) -> None: ...
 def unzip(zip_path: str, to_path: str) -> Union[list, None]: ...
 def get_exe_from_port(port: Union[str, int]) -> Union[str, None]: ...
 def get_pid_from_port(port: Union[str, int]) -> Union[str, None]: ...
 def get_usable_path(path: Union[str, Path]) -> Path: ...
 def make_valid_name(full_name: str) -> str: ...
 def get_long(txt) -> int: ...
 # -- links and javascript --
 def make_absolute_link(link, page: BasePage = None) -> str: ...
 def is_js_func(func: str) -> bool: ...
 def port_is_using(ip: str, port: Union[str, int]) -> bool: ...
 # -- browser launch --
 def connect_browser(option: Union[ChromiumOptions, DriverOptions]) -> tuple: ...
 def get_launch_args(opt: Union[ChromiumOptions, DriverOptions]) -> list: ...
 def set_prefs(opt: Union[ChromiumOptions, DriverOptions]) -> None: ...
 # -- viewport and scrolling --
 def location_in_viewport(page, loc_x: int, loc_y: int) -> bool: ...
 def offset_scroll(ele: ChromiumElement, offset_x: int, offset_y: int) -> tuple: ...
--- a/DrissionPage/configs/chromium_options.py
+++ b/DrissionPage/configs/chromium_options.py
@ -2,7 +2,7 @@
 from pathlib import Path
 from shutil import rmtree
-from DrissionPage.common import port_is_using
+from DrissionPage.functions.tools import port_is_using
 from .options_manage import OptionsManager
--- a/DrissionPage/configs/session_options.py
+++ b/DrissionPage/configs/session_options.py
@ -2,7 +2,7 @@
 from pathlib import Path
-from DrissionPage.common import cookies_to_tuple
+from DrissionPage.functions.web import cookies_to_tuple
 from .options_manage import OptionsManager
--- a/DrissionPage/drission.py
+++ b/DrissionPage/drission.py
@ -14,7 +14,9 @@ from selenium.webdriver.chrome.options import Options
 from selenium.webdriver.remote.webdriver import WebDriver as RemoteWebDriver
 from tldextract import extract
-from .common import get_pid_from_port, connect_browser, cookies_to_tuple
+from .functions.tools import get_pid_from_port
 from .functions.browser import connect_browser
 from .functions.web import cookies_to_tuple
 from .configs.session_options import SessionOptions, session_options_to_dict
 from .configs.driver_options import DriverOptions
--- a/DrissionPage/driver_element.py
+++ b/DrissionPage/driver_element.py
@ -15,7 +15,9 @@ from selenium.webdriver.support import expected_conditions as ec
 from selenium.webdriver.support.wait import WebDriverWait
 from .base import DrissionElement, BaseElement
-from .common import str_to_loc, get_usable_path, format_html, get_ele_txt, get_loc
+from .functions.locator import str_to_loc, get_loc
 from .functions.tools import get_usable_path
 from .functions.web import format_html, get_ele_txt
 from .session_element import make_session_ele
--- a/DrissionPage/driver_page.py
+++ b/DrissionPage/driver_page.py
@ -13,7 +13,7 @@ from selenium.webdriver.remote.webelement import WebElement
 from selenium.webdriver.support.wait import WebDriverWait
 from .base import BasePage
-from .common import get_usable_path
+from .functions.tools import get_usable_path
 from .driver_element import DriverElement, make_driver_ele, Scroll, ElementWaiter
 from .session_element import make_session_ele
--- a/DrissionPage/functions/browser.py
+++ b/DrissionPage/functions/browser.py
@ -0,0 +1,156 @@
 # -*- coding:utf-8 -*-
 from pathlib import Path
 from platform import system
 from subprocess import Popen
 from time import perf_counter, sleep
 from requests import get as requests_get
 from DrissionPage.configs.driver_options import DriverOptions
 from .tools import port_is_using, get_exe_from_port
 def connect_browser(option):
    """Attach to a browser that is already listening, or launch a new one.

    Only local debugger addresses ('127.0.0.1' / 'localhost') are handled; for
    any other host nothing is started and ``(None, None)`` is returned.

    :param option: DriverOptions or ChromiumOptions object
    :return: tuple of (browser executable path, process object); the process
             item is None when an already running browser is reused
    :raises FileNotFoundError: when no browser executable can be located
    """
    os_name = system().lower()
    address = option.debugger_address
    chrome_path = option.browser_path

    if address.startswith('http://'):
        address = address[7:]
    ip, port = address.split(':')

    if ip not in ('127.0.0.1', 'localhost'):
        return None, None

    # the placeholder name 'chrome' is resolved to a real path on Windows only
    resolve_from_port = chrome_path == 'chrome' and os_name == 'windows'

    # something already listens on the port: reuse it, no process is created
    if port_is_using(ip, port):
        if resolve_from_port:
            chrome_path = get_exe_from_port(port)
        return chrome_path, None

    launch_args = get_launch_args(option)
    set_prefs(option)

    # ---------- create the browser process ----------
    try:
        process = _run_browser(port, chrome_path, launch_args)
        if resolve_from_port:
            chrome_path = get_exe_from_port(port)

    except FileNotFoundError:
        # the given path does not exist: look it up in the ini file,
        # the registry and the environment variables instead
        from DrissionPage.easy_set import get_chrome_path
        chrome_path = get_chrome_path(show_msg=False)
        if not chrome_path:
            raise FileNotFoundError('无法找到chrome路径，请手动配置。')
        process = _run_browser(port, chrome_path, launch_args)

    return chrome_path, process
 def get_launch_args(opt):
    """Build the command-line arguments used to launch the browser.

    Duplicated arguments are removed while the order given by the user is
    kept, so the resulting command line is the same on every run (a plain
    ``set`` would shuffle it, which matters when two switches conflict).
    ``--load-extension=`` and ``--remote-debugging-port=`` arguments are
    dropped here because they are generated separately.

    :param opt: DriverOptions or ChromiumOptions object
    :return: list of launch arguments
    """
    # ---------- arguments ----------
    skipped = ('--load-extension=', '--remote-debugging-port=')
    # dict.fromkeys() de-duplicates and preserves insertion order
    result = list(dict.fromkeys(i for i in opt.arguments if not i.startswith(skipped)))

    # ---------- extensions ----------
    ext = opt._extension_files if isinstance(opt, DriverOptions) else opt.extensions
    if ext:
        ext = ','.join(dict.fromkeys(ext))
        result.append(f'--load-extension={ext}')

    return result
 def set_prefs(opt):
    """Write the prefs of the launch options into the profile's Preferences file.

    Nothing is done unless both prefs and a user data path are configured.
    The profile folder is taken from a ``--profile-directory`` argument and
    defaults to 'Default'; a missing Preferences file is created as ``{}``.

    :param opt: DriverOptions or ChromiumOptions object
    :return: None
    """
    # todo: support removing pref items
    if isinstance(opt, DriverOptions):
        prefs = opt.experimental_options.get('prefs', None)
    else:
        prefs = opt.preferences

    if not (prefs and opt.user_data_path):
        return

    profile = 'Default'
    for argument in opt.arguments:
        if argument.startswith('--profile-directory'):
            profile = argument.split('=')[-1].strip()
            break

    prefs_file = Path(opt.user_data_path) / profile / 'Preferences'
    if not prefs_file.exists():
        prefs_file.parent.mkdir(parents=True, exist_ok=True)
        with open(prefs_file, 'w') as f:
            f.write('{}')

    from json import load, dump
    with open(prefs_file, "r", encoding='utf-8') as f:
        settings = load(f)

    # every pref key has the dotted form a.b.c and is stored as settings['a']['b']['c']
    for dotted_key in prefs:
        value = prefs[dotted_key]
        keys = dotted_key.split('.')
        _make_leave_in_dict(settings, keys, 0, len(keys))
        _set_value_to_dict(settings, keys, value)

    with open(prefs_file, 'w', encoding='utf-8') as f:
        dump(settings, f)
 def _run_browser(port, path: str, args) -> Popen:
    """Start a browser process and wait until it exposes a page tab.

    The ``/json`` endpoint of the debugging port is polled for up to 10
    seconds. The loop pauses 0.2 s after every unsuccessful attempt, including
    the case where the endpoint answers but lists no page tab yet, so the
    starting browser is not flooded with requests.

    :param port: remote debugging port
    :param path: browser executable path
    :param args: list of launch arguments
    :return: the process object
    :raises ConnectionError: when no page tab shows up within the time limit
    """
    arguments = [path, f'--remote-debugging-port={port}']
    arguments.extend(args)
    debugger = Popen(arguments, shell=False)

    end_time = perf_counter() + 10
    while perf_counter() < end_time:
        try:
            tabs = requests_get(f'http://127.0.0.1:{port}/json').json()
            if any(tab['type'] == 'page' for tab in tabs):
                return debugger
        except Exception:
            # browser not ready yet (connection refused, incomplete answer...): retry
            pass
        sleep(.2)

    raise ConnectionError('无法连接浏览器。')
 def _make_leave_in_dict(target_dict: dict, src: list, num: int, end: int) -> None:
    """Make sure the nested path a['b']['c'] exists for a pref named a.b.c.

    Starting at index ``num``, every key of ``src`` up to (not including)
    ``end`` that is missing on its level is created as an empty dict.

    :param target_dict: dict to work on
    :param src: list of key levels, e.g. [a, b, c]
    :param num: index of the level to start with
    :param end: length of src
    :return: None
    """
    node = target_dict
    level = num
    while level != end:
        key = src[level]
        if key not in node:
            node[key] = {}
        node = node[key]
        level += 1
 def _set_value_to_dict(target_dict: dict, src: list, value) -> None:
    """Assign the value of a pref named a.b.c to target_dict['a']['b']['c'].

    The intermediate levels must already exist. The dict is walked directly
    instead of building and exec-ing source code, so keys containing quotes
    or backslashes are handled correctly and can never be run as code.

    :param target_dict: dict to work on
    :param src: list of key levels, e.g. [a, b, c]
    :param value: value to store
    :return: None
    :raises KeyError: when an intermediate level is missing
    """
    if not src:
        return

    node = target_dict
    for key in src[:-1]:
        node = node[key]
    node[src[-1]] = value
--- a/DrissionPage/functions/browser.pyi
+++ b/DrissionPage/functions/browser.pyi
@ -0,0 +1,14 @@
 # -*- coding:utf-8 -*-
 from typing import Union
 from DrissionPage.configs.chromium_options import ChromiumOptions
 from DrissionPage.configs.driver_options import DriverOptions
 # Connect to a running browser or launch one; returns a tuple of (browser path, process object).
 def connect_browser(option: Union[ChromiumOptions, DriverOptions]) -> tuple: ...
 # Build the list of command-line launch arguments from an options object.
 def get_launch_args(opt: Union[ChromiumOptions, DriverOptions]) -> list: ...
 # Write the prefs of an options object into the profile's Preferences file.
 def set_prefs(opt: Union[ChromiumOptions, DriverOptions]) -> None: ...
--- a/DrissionPage/functions/locator.py
+++ b/DrissionPage/functions/locator.py
@ -0,0 +1,243 @@
 # -*- coding:utf-8 -*-
 """
@Author  :   g1879
@Contact :   g1879@qq.com
 """
 from re import split
 def get_loc(loc, translate_css=False):
    """Convert a selenium locator tuple or a locator string of this library
    into a standard locator tuple, optionally translating css selectors to xpath.

    :param loc: selenium locator tuple or locator string in this library's syntax
    :param translate_css: whether a css selector should be translated to xpath
    :return: locator tuple of (type, expression)
    :raises TypeError: when loc is neither a tuple nor a str
    """
    if isinstance(loc, tuple):
        result = translate_loc(loc)
    elif isinstance(loc, str):
        result = str_to_loc(loc)
    else:
        raise TypeError('loc参数只能是tuple或str。')

    if result[0] != 'css selector' or not translate_css:
        return result

    from lxml.cssselect import CSSSelector, ExpressionError
    try:
        xpath = str(CSSSelector(result[1], translator='html').path)
    except ExpressionError:
        # selector cannot be translated: keep the css selector as it is
        return result

    prefix = 'descendant-or-self::'
    if xpath.startswith(prefix):
        xpath = xpath[len(prefix):]
    return 'xpath', xpath
 def str_to_loc(loc):
    """Translate a locator string in this library's syntax into a locator tuple.

    Supported lookups: attribute, tag name with attributes, text, xpath,
    css selector, id and class. ``@`` marks an attribute, ``.`` a class and
    ``#`` an id; ``=`` means exact match, ``:`` means fuzzy match. A string
    without any control prefix is searched as text.

    :param loc: locator string
    :return: tuple of (locator type, expression), type is 'xpath' or 'css selector'
    """
    # ---------- expand the shorthand prefixes ----------
    if loc.startswith('.'):
        expanded = '@class' if loc.startswith(('.=', '.:',)) else '@class='
        loc = loc.replace('.', expanded, 1)

    elif loc.startswith('#'):
        expanded = '@id' if loc.startswith(('#=', '#:',)) else '@id='
        loc = loc.replace('#', expanded, 1)

    elif loc.startswith(('t:', 't=')):
        loc = f'tag:{loc[2:]}'

    elif loc.startswith(('tx:', 'tx=')):
        loc = f'text{loc[2:]}'

    # ---------- build the expression ----------
    # several attributes
    if loc.startswith('@@') and loc != '@@':
        return 'xpath', _make_multi_xpath_str('*', loc)

    # a single attribute
    if loc.startswith('@') and loc != '@':
        return 'xpath', _make_single_xpath_str('*', loc)

    # tag name, optionally followed by attribute conditions
    if loc.startswith(('tag:', 'tag=')) and loc not in ('tag:', 'tag='):
        at_pos = loc.find('@')
        if at_pos == -1:
            return 'xpath', f'//*[name()="{loc[4:]}"]'
        tag_name, conditions = loc[4:at_pos], loc[at_pos:]
        if conditions.startswith('@@'):
            return 'xpath', _make_multi_xpath_str(tag_name, conditions)
        return 'xpath', _make_single_xpath_str(tag_name, conditions)

    # exact text
    if loc.startswith('text='):
        return 'xpath', f'//*[text()={_make_search_str(loc[5:])}]'

    # fuzzy text
    if loc.startswith('text:') and loc != 'text:':
        return 'xpath', f'//*/text()[contains(., {_make_search_str(loc[5:])})]/..'

    # raw xpath
    if loc.startswith(('xpath:', 'xpath=')) and loc not in ('xpath:', 'xpath='):
        return 'xpath', loc[6:]
    if loc.startswith(('x:', 'x=')) and loc not in ('x:', 'x='):
        return 'xpath', loc[2:]

    # css selector
    if loc.startswith(('css:', 'css=')) and loc not in ('css:', 'css='):
        return 'css selector', loc[4:]
    if loc.startswith(('c:', 'c=')) and loc not in ('c:', 'c='):
        return 'css selector', loc[2:]

    # anything else is a fuzzy text search; an empty string matches every element
    if loc:
        return 'xpath', f'//*/text()[contains(., {_make_search_str(loc)})]/..'
    return 'xpath', '//*'
 def _make_single_xpath_str(tag: str, text: str) -> str:
    """Build the xpath expression for a lookup by one attribute.

    :param tag: tag name, '*' for any tag
    :param text: condition string starting with '@', e.g. '@class=abc'
    :return: xpath string
    """
    text_names = ('@text()', '@tx()')
    conditions = [] if tag == '*' else [f'name()="{tag}"']
    condition = ''
    tail = ''

    if text == '@':
        # a lone '@' selects elements without any attribute
        condition = 'not(@*)'

    else:
        pieces = split(r'([:=])', text, maxsplit=1)
        attr = pieces[0]

        if len(attr) > 1:
            if len(pieces) != 3:
                # attribute name only: test that it exists
                condition = 'normalize-space(text())' if attr in text_names else f'{attr}'

            elif pieces[1] == '=':  # exact match
                target = '.' if attr in text_names else attr
                condition = f'{target}={_make_search_str(pieces[2])}'

            elif attr in text_names:  # fuzzy match on the text
                tail = f'/text()[contains(., {_make_search_str(pieces[2])})]/..'

            else:  # fuzzy match on an attribute
                condition = f"contains({attr},{_make_search_str(pieces[2])})"

    if condition:
        conditions.append(condition)

    joined = ' and '.join(conditions)
    if joined:
        return f'//*[{joined}]{tail}'
    return f'//*{tail}'
 def _make_multi_xpath_str(tag: str, text: str) -> str:
    """Build the xpath expression for a lookup by several attributes.

    :param tag: tag name, '*' for any tag
    :param text: condition string made of '@@'-separated items, e.g. '@@class=a@@-id'
    :return: xpath string
    """
    text_names = ('text()', 'tx()')
    conditions = [] if tag == '*' else [f'name()="{tag}"']

    for item in text.split('@@')[1:]:
        pieces = split(r'([:=])', item, maxsplit=1)
        name = pieces[0]

        if not name:  # empty item: elements without any attribute
            conditions.append('not(@*)')
            continue

        # a leading '-' negates the condition
        negate = name[0] == '-'
        if negate:
            name = name[1:]

        if len(pieces) != 3:
            # attribute name only: test that it exists
            condition = 'normalize-space(text())' if name in text_names else f'@{name}'
        else:
            target = '.' if name in text_names else f'@{name}'
            if pieces[1] == '=':
                condition = f'{target}={_make_search_str(pieces[2])}'
            else:
                condition = f'contains({target},{_make_search_str(pieces[2])})'

        if negate:
            condition = f'not({condition})'
        conditions.append(condition)

    joined = ' and '.join(conditions)
    if joined:
        return f'//*[{joined}]'
    return f'//*'
 def _make_search_str(search_str: str) -> str:
    """Wrap a search string into an xpath concat() call so that double quotes survive.

    The string is cut at every double quote; the pieces are emitted as
    double-quoted literals joined by a single-quoted '"' literal.

    :param search_str: string to search for
    :return: xpath concat() expression equal to the string
    """
    quoted_parts = (f'"{part}"' for part in search_str.split('"'))
    joined = ',\'"\','.join(quoted_parts)
    return 'concat(' + joined + ',"")'
 def translate_loc(loc):
    """Convert a selenium By-style locator tuple into a css selector or xpath tuple.

    :param loc: locator tuple of (by, value)
    :return: locator tuple whose type is 'css selector' or 'xpath'
    :raises ValueError: when the tuple length is not 2 or the type is unknown
    """
    if len(loc) != 2:
        raise ValueError('定位符长度必须为2。')

    by, value = loc[0].lower(), loc[1]

    # these two types are passed through untouched
    if by in ('xpath', 'css selector'):
        return by, value

    xpath_templates = {
        'id': '//*[@id="{}"]',
        'class name': '//*[@class="{}"]',
        'link text': '//a[text()="{}"]',
        'name': '//*[@name="{}"]',
        'tag name': '//{}',
        'partial link text': '//a[contains(text(),"{}")]',
    }
    if by not in xpath_templates:
        raise ValueError('无法识别的定位符。')

    return 'xpath', xpath_templates[by].format(value)
--- a/DrissionPage/functions/locator.pyi
+++ b/DrissionPage/functions/locator.pyi
@ -0,0 +1,15 @@
 # -*- coding:utf-8 -*-
 """
@Author  :   g1879
@Contact :   g1879@qq.com
 """
 from typing import Union
 # Convert a selenium locator tuple or a locator string into a standard locator tuple.
 def get_loc(loc: Union[tuple, str], translate_css: bool = False) -> tuple: ...
 # Translate a locator string in this library's syntax into a (type, expression) tuple.
 def str_to_loc(loc: str) -> tuple: ...
 # Convert a By-style locator tuple into a css selector or xpath locator tuple.
 def translate_loc(loc: tuple) -> tuple: ...
--- a/DrissionPage/functions/tools.py
+++ b/DrissionPage/functions/tools.py
@ -0,0 +1,151 @@
 # -*- coding:utf-8 -*-
 """
@Author  :   g1879
@Contact :   g1879@qq.com
 """
 from pathlib import Path
 from re import search, sub
 from shutil import rmtree
 from zipfile import ZipFile
 def get_exe_from_port(port):
    """Return the executable path of the first process found for a port.

    The pid is looked up with get_pid_from_port() and the path is queried
    with the ``wmic`` command.

    :param port: port number
    :return: path of the executable, None when it cannot be determined
    """
    from os import popen

    pid = get_pid_from_port(port)
    if not pid:
        return

    output = popen(f'wmic process where processid={pid} get executablepath').read()
    lines = output.split('\n')
    # the path is expected on the third line of the wmic output
    if len(lines) > 2:
        return lines[2].strip()
    return None
 def get_pid_from_port(port):
    """Return the pid of the first process that ``netstat`` lists for a port.

    Only implemented for Windows; on any other system, or when port is None,
    None is returned. The lookup is repeated for up to 5 seconds while
    netstat prints nothing.

    :param port: port number
    :return: pid as str, None when it cannot be determined
    """
    from platform import system
    if system().lower() != 'windows' or port is None:
        return None

    from os import popen
    from time import perf_counter

    command = f'netstat -ano |findstr {port}'

    def first_line():
        return popen(command).read().split('\n')[0]

    try:  # guards against an error that may occur in Anaconda
        line = first_line()
        deadline = perf_counter() + 5
        while not line and perf_counter() < deadline:
            line = first_line()

        # the pid is the last space-separated field of the line
        return line.split(' ')[-1] or None

    except AttributeError:
        return None
 def get_usable_path(path):
    """Return a path that does not collide with an existing file or folder.

    The last path component is first cleaned with make_valid_name(). While
    the path exists, a numeric suffix '_1', '_2', ... is appended to the
    name (before the extension for files).

    :param path: file or folder path
    :return: usable path as a Path object
    """
    target = Path(path)
    folder = target.parent
    target = folder / make_valid_name(target.name)

    if target.is_file():
        base, suffix = target.stem, target.suffix
    else:
        base, suffix = target.name, ''

    attempt = 0
    while target.exists():
        numbered = search(r'(.*)_(\d+)$', base)
        if attempt == 0 or not numbered:
            # on the first pass a trailing _N belongs to the original name
            base = f'{base}_1'
        else:
            base = f'{numbered.group(1)}_{int(numbered.group(2)) + 1}'

        target = folder / f'{base}{suffix}'
        attempt += 1

    return target
 def make_valid_name(full_name):
    """Turn a string into a usable file name.

    Surrounding whitespace is stripped, the name part is shortened until name
    plus extension fit into 255 characters (a Chinese character counts as 2,
    see get_long()) and the characters ``<>/\\|:*?`` and newlines are removed.

    A trailing ".xxx" part longer than 255 characters is not treated as an
    extension: it could never fit, and shortening the name part alone would
    loop forever.

    :param full_name: file name
    :return: usable file name
    """
    # ---------- strip surrounding whitespace ----------
    full_name = full_name.strip()

    # ---------- keep the total length within 255 characters ----------
    r = search(r'(.*)(\.[^.]+$)', full_name)  # split into name and extension
    if r and len(r.group(2)) <= 255:
        name, ext = r.group(1), r.group(2)
    else:
        name, ext = full_name, ''

    limit = 255 - len(ext)
    while get_long(name) > limit:
        name = name[:-1]

    full_name = f'{name}{ext}'

    # ---------- remove characters that are not allowed ----------
    return sub(r'[<>/\\|:*?\n]', '', full_name)
 def get_long(txt):
    """Return the length of a string, counting a Chinese character as 2.

    The value is derived from the difference between the UTF-8 byte length
    and the character count.

    :param txt: string
    :return: number of characters
    """
    char_count = len(txt)
    extra_bytes = len(txt.encode('utf-8')) - char_count
    return extra_bytes // 2 + char_count
 def port_is_using(ip, port):
    """Check whether something is listening on the given address.

    A TCP connection attempt is made; the port counts as in use when the
    connection succeeds. The socket is used as a context manager so it is
    closed even when the port is not a valid number or the attempt raises.

    :param ip: browser address
    :param port: browser port, int or numeric str
    :return: True when the port accepts connections, False otherwise
    """
    from socket import socket, AF_INET, SOCK_STREAM
    with socket(AF_INET, SOCK_STREAM) as s:
        return s.connect_ex((ip, int(port))) == 0
 def clean_folder(folder_path, ignore=None):
    """Delete everything directly inside a folder except the ignored names.

    Files are unlinked, sub-folders are removed recursively with errors ignored.

    :param folder_path: path of the folder to empty
    :param ignore: names of files and folders to keep
    :return: None
    """
    kept_names = ignore if ignore else []

    for entry in Path(folder_path).iterdir():
        if entry.name in kept_names:
            continue
        if entry.is_file():
            entry.unlink()
        elif entry.is_dir():
            rmtree(entry, True)
 def unzip(zip_path, to_path):
    """Extract the first member of a zip archive (used for the downloaded chromedriver.zip).

    :param zip_path: path of the zip file; nothing is done when it is empty
    :param to_path: folder to extract into
    :return: list holding the path of the extracted member, None when zip_path is empty
    """
    if not zip_path:
        return None

    with ZipFile(zip_path, 'r') as archive:
        first_member = archive.namelist()[0]
        extracted = archive.extract(first_member, path=to_path)
        return [extracted]
--- a/DrissionPage/functions/tools.pyi
+++ b/DrissionPage/functions/tools.pyi
@ -0,0 +1,31 @@
 # -*- coding:utf-8 -*-
 """
@Author  :   g1879
@Contact :   g1879@qq.com
 """
 from pathlib import Path
 from typing import Union
 # Executable path of the first process found for a port, None when unknown.
 def get_exe_from_port(port: Union[str, int]) -> Union[str, None]: ...
 # Pid of the first process listed for a port; None on non-Windows systems or when not found.
 def get_pid_from_port(port: Union[str, int]) -> Union[str, None]: ...
 # Path that does not collide with an existing file or folder.
 def get_usable_path(path: Union[str, Path]) -> Path: ...
 # File name stripped of forbidden characters and limited in length.
 def make_valid_name(full_name: str) -> str: ...
 # Length of a string where a Chinese character counts as 2.
 def get_long(txt) -> int: ...
 # Whether a TCP connection to ip:port succeeds.
 def port_is_using(ip: str, port: Union[str, int]) -> bool: ...
 # Delete the content of a folder except the names listed in ignore.
 def clean_folder(folder_path: str, ignore: list = None) -> None: ...
 # Extract the first member of a zip file; returns a one-item list with its path.
 def unzip(zip_path: str, to_path: str) -> Union[list, None]: ...
--- a/DrissionPage/functions/web.py
+++ b/DrissionPage/functions/web.py
@ -0,0 +1,218 @@
 # -*- coding:utf-8 -*-
 """
@Author  :   g1879
@Contact :   g1879@qq.com
 """
 from html import unescape
 from http.cookiejar import Cookie
 from re import sub
 from urllib.parse import urlparse, urljoin, urlunparse
 from requests.cookies import RequestsCookieJar
 def get_ele_txt(e):
    """Return all text inside an element, laid out roughly as it is displayed.

    Block-level elements are separated by line breaks, table cells by tabs,
    ``<br>`` becomes a line break and whitespace is collapsed except inside
    ``<pre>``. Elements such as script or style contribute no text when they
    are nested; when ``e`` itself is such an element its raw text is returned.

    :param e: element object
    :return: all text inside the element
    """
    # elements that need no line break in front of them
    nowrap_list = ('br', 'sub', 'sup', 'em', 'strong', 'a', 'font', 'b', 'span', 's', 'i', 'del', 'ins', 'img', 'td',
                   'th', 'abbr', 'bdi', 'bdo', 'cite', 'code', 'data', 'dfn', 'kbd', 'mark', 'q', 'rp', 'rt', 'ruby',
                   'samp', 'small', 'time', 'u', 'var', 'wbr', 'button', 'slot', 'content')
    # elements followed by a line break
    # ('address' and 'article' are two separate entries; without the comma
    # Python joins them into the single string 'addressarticle')
    wrap_after_list = ('p', 'div', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'ol', 'li', 'blockquote', 'header',
                       'footer', 'address', 'article', 'aside', 'main', 'nav', 'section', 'figcaption', 'summary')
    # elements whose text is not collected
    noText_list = ('script', 'style', 'video', 'audio', 'iframe', 'embed', 'noscript', 'canvas', 'template')
    # elements separated by \t
    tab_list = ('td', 'th')

    if e.tag in noText_list:
        return e.raw_text

    def get_node_txt(ele, pre: bool = False):
        """Collect the text pieces of one element; True stands for a <br> line break."""
        tag = ele.tag
        if tag == 'br':
            return [True]
        if not pre and tag == 'pre':
            pre = True

        str_list = []
        if tag in noText_list and not pre:  # text inside these tags is not returned
            return str_list

        nodes = ele.eles('xpath:./text() | *')
        prev_ele = ''
        for el in nodes:
            if isinstance(el, str):  # text node
                if pre:
                    str_list.append(el)

                elif sub('[ \n\t\r]', '', el) != '':  # contains more than whitespace
                    txt = el.replace('\n', ' ').strip(' ')
                    txt = sub(r' {2,}', ' ', txt)
                    str_list.append(txt)

            else:  # element node
                if el.tag not in nowrap_list and str_list and str_list[-1] != '\n':  # break between elements
                    str_list.append('\n')
                if el.tag in tab_list and prev_ele in tab_list:  # cells of a table row
                    str_list.append('\t')

                str_list.extend(get_node_txt(el, pre))
                prev_ele = el.tag

        if tag in wrap_after_list and str_list and str_list[-1] not in ('\n', True):  # break after some elements
            str_list.append('\n')

        return str_list

    re_str = get_node_txt(e)
    if re_str and re_str[-1] == '\n':
        re_str.pop()
    re_str = ''.join([i if i is not True else '\n' for i in re_str])
    return format_html(re_str)
 def format_html(text):
    """Decode html entities and turn non-breaking spaces into normal spaces.

    :param text: html text
    :return: formatted text; empty or None input is returned unchanged
    """
    if not text:
        return text
    decoded = unescape(text)
    return decoded.replace('\xa0', ' ')
 def location_in_viewport(page, loc_x, loc_y):
    """Check whether the given page coordinates lie inside the viewport.

    The test is done in the browser by comparing the point with the scroll
    offsets and the client size of ``document.documentElement``.

    :param page: page object providing run_js()
    :param loc_x: absolute x coordinate in the page
    :param loc_y: absolute y coordinate in the page
    :return: the result of the script, true when the point is visible
    """
    # variant not in use:
    #   const vWidth = window.innerWidth || document.documentElement.clientWidth;
    #   const vHeight = window.innerHeight || document.documentElement.clientHeight;
    script_lines = (
        f'function(){{var x = {loc_x}; var y = {loc_y};',
        '    const scrollLeft = document.documentElement.scrollLeft;',
        '    const scrollTop = document.documentElement.scrollTop;',
        '    const vWidth = document.documentElement.clientWidth;',
        '    const vHeight = document.documentElement.clientHeight;',
        '    if (x< scrollLeft || y < scrollTop || x > vWidth + scrollLeft || y > vHeight + scrollTop){return false;}',
        '    return true;}',
    )
    return page.run_js('\n'.join(script_lines))
 def offset_scroll(ele, offset_x, offset_y):
    """Scroll a point of an element into view and return its viewport coordinates.

    With an offset the point is measured from the top-left corner of the
    element, without one the click point of the element is used (per axis).
    When the point is outside the viewport the page is scrolled so that the
    point is placed around the middle.

    :param ele: element object
    :param offset_x: x offset
    :param offset_y: y offset
    :return: coordinates of the point in the viewport
    """
    def pick(origin, offset, fallback):
        return origin + offset if offset else fallback

    page_x, page_y = ele.location
    click_x, click_y = ele._click_point
    target_x = pick(page_x, offset_x, click_x)
    target_y = pick(page_y, offset_y, click_y)

    if not location_in_viewport(ele.page, target_x, target_y):
        width = ele.page.run_js('return document.body.clientWidth;')
        height = ele.page.run_js('return document.body.clientHeight;')
        ele.page.scroll.to_location(target_x - width // 2, target_y - height // 2)

    # positions are read again because scrolling may have changed them
    view_x, view_y = ele.client_location
    view_click_x, view_click_y = ele._client_click_point
    return pick(view_x, offset_x, view_click_x), pick(view_y, offset_y, view_click_y)
 def make_absolute_link(link, page=None):
    """Return the absolute form of a url.

    :param link: hyperlink
    :param page: page object whose ``url`` is used to complete the link
    :return: absolute link; the link itself when it cannot be completed
    """
    if not link:
        return link

    parts = urlparse(link)

    # relative path: join it with the url of the page
    if not parts.netloc:
        return urljoin(page.url, link) if page else link

    # host without scheme: borrow the scheme of the page url
    if not parts.scheme and page:
        page_scheme = urlparse(page.url).scheme
        return urlunparse(parts._replace(scheme=page_scheme))

    # already complete
    return link
 def is_js_func(func):
    """Tell whether a text looks like a js function.

    The stripped text counts as a function when it starts with 'function'
    or 'async ', or when it contains an arrow '=>'.

    :param func: js text
    :return: bool
    """
    stripped = func.strip()
    return stripped.startswith(('function', 'async ')) or '=>' in stripped
 def cookie_to_dict(cookie):
    """Convert a cookie into dict form.

    A Cookie object yields a copy of its attributes without 'rfc2109' and
    '_rest'; a dict is returned as it is; a string such as
    'name=value; path=/' is split into items (at ',' when the string contains
    one, otherwise at ';'), the first item providing 'name' and 'value'.
    Every item is split at its first '=' only, so values that contain '='
    themselves (e.g. base64 padding) are kept intact.

    :param cookie: Cookie object, str or dict
    :return: cookie dict
    :raises TypeError: when cookie has any other type
    """
    if isinstance(cookie, Cookie):
        cookie_dict = cookie.__dict__.copy()
        cookie_dict.pop('rfc2109')
        cookie_dict.pop('_rest')
        return cookie_dict

    if isinstance(cookie, dict):
        return cookie

    if isinstance(cookie, str):
        separator = ',' if ',' in cookie else ';'
        cookie_dict = {}
        for index, attr in enumerate(cookie.split(separator)):
            # partition() cuts at the first '=' only; without '=' the value is ''
            key, _, value = attr.lstrip().partition('=')
            if index == 0:
                cookie_dict['name'] = key
                cookie_dict['value'] = value
            else:
                cookie_dict[key] = value
        return cookie_dict

    raise TypeError('cookie参数必须为Cookie、str或dict类型。')
 def cookies_to_tuple(cookies):
    """Convert cookies of several possible forms into a tuple of cookie dicts.

    :param cookies: cookies as RequestsCookieJar, list, tuple, str or dict
    :return: tuple of cookie dicts
    :raises TypeError: when cookies has any other type
    """
    if isinstance(cookies, (list, tuple, RequestsCookieJar)):
        return tuple(cookie_to_dict(item) for item in cookies)

    if isinstance(cookies, str):
        # one cookie per ';'-separated item
        return tuple(cookie_to_dict(item.lstrip()) for item in cookies.split(";"))

    if isinstance(cookies, dict):
        # plain name -> value mapping
        return tuple({'name': key, 'value': cookies[key]} for key in cookies)

    raise TypeError('cookies参数必须为RequestsCookieJar、list、tuple、str或dict类型。')
--- a/DrissionPage/functions/web.pyi
+++ b/DrissionPage/functions/web.pyi
@ -0,0 +1,36 @@
 # -*- coding:utf-8 -*-
 """
@Author  :   g1879
@Contact :   g1879@qq.com
 """
 from http.cookiejar import Cookie
 from typing import Union
 from requests.cookies import RequestsCookieJar
 from DrissionPage.base import DrissionElement, BasePage
 from DrissionPage.chromium_element import ChromiumElement
 # All text inside an element.
 def get_ele_txt(e: DrissionElement) -> str: ...
 # Decode html entities and replace non-breaking spaces with normal spaces.
 def format_html(text: str) -> str: ...
 # Check with a script run on the page whether page coordinates are inside the viewport.
 def location_in_viewport(page, loc_x: int, loc_y: int) -> bool: ...
 # Scroll a point of an element into view if needed and return its viewport coordinates.
 def offset_scroll(ele: ChromiumElement, offset_x: int, offset_y: int) -> tuple: ...
 # Complete a link to an absolute url, using the url of the page when one is given.
 def make_absolute_link(link, page: BasePage = None) -> str: ...
 # Whether a text looks like a js function.
 def is_js_func(func: str) -> bool: ...
 # Convert a single cookie (Cookie object, str or dict) into a dict.
 def cookie_to_dict(cookie: Union[Cookie, str, dict]) -> dict: ...
 # Convert cookies of any supported form into a tuple of cookie dicts.
 def cookies_to_tuple(cookies: Union[RequestsCookieJar, list, tuple, str, dict]) -> tuple: ...
--- a/DrissionPage/session_element.py
+++ b/DrissionPage/session_element.py
@ -10,7 +10,8 @@ from lxml.etree import tostring
 from lxml.html import HtmlElement, fromstring
 from .base import DrissionElement, BasePage, BaseElement
-from .common import get_ele_txt, get_loc, make_absolute_link
+from .functions.web import get_ele_txt, make_absolute_link
 from .functions.locator import get_loc
 class SessionElement(DrissionElement):
--- a/DrissionPage/session_page.py
+++ b/DrissionPage/session_page.py
@ -14,7 +14,7 @@ from tldextract import extract
 from .base import BasePage
 from .configs.session_options import SessionOptions
-from .common import cookies_to_tuple, cookie_to_dict
+from .functions.web import cookies_to_tuple, cookie_to_dict
 from .session_element import SessionElement, make_session_ele
--- a/DrissionPage/shadow_root_element.py
+++ b/DrissionPage/shadow_root_element.py
@ -9,7 +9,7 @@ from typing import Union
 from selenium.webdriver.remote.webelement import WebElement
 from .base import BaseElement
-from .common import get_loc
+from .functions.locator import get_loc
 from .driver_element import make_driver_ele
 from .session_element import make_session_ele, SessionElement
--- a/DrissionPage/web_page.py
+++ b/DrissionPage/web_page.py
@ -15,7 +15,7 @@ from .chromium_driver import ChromiumDriver
 from .chromium_page import ChromiumPage, ChromiumDownloadSetter
 from .configs.session_options import SessionOptions
 from .configs.driver_options import DriverOptions
-from .common import cookies_to_tuple
+from .functions.web import cookies_to_tuple
 from .session_page import SessionPage