完善texts()方法

2024-12-10 04:00:23 +08:00 · 2021-01-04 17:42:45 +08:00 · 2021-01-04 17:42:45 +08:00 · e03a67c3a5
commit e03a67c3a5
parent 0f9f52b1f6
2 changed files with 13 additions and 5 deletions
--- a/DrissionPage/driver_element.py
+++ b/DrissionPage/driver_element.py
@@ -155,9 +155,11 @@ class DriverElement(DrissionElement):
        :return: 文本列表
        """
        if text_node_only:
-            return self.eles('xpath:/text()')
+            texts = self.eles('xpath:/text()')
        else:
-            return [x if isinstance(x, str) else x.text for x in self.eles('xpath:./text() | *')]
+            texts = [x if isinstance(x, str) else x.text for x in self.eles('xpath:./text() | *')]
+        return [x.strip(' ') for x in texts if x and x.replace('\n', '').replace('\t', '').replace(' ', '') != '']
    def parents(self, num: int = 1):
        """返回上面第num级父元素              \n
--- a/DrissionPage/session_element.py
+++ b/DrissionPage/session_element.py
@@ -54,7 +54,12 @@ class SessionElement(DrissionElement):
            str_list = []
            if ele.tag == 'pre':
                pre = True
+            current_tag = None
            for el in ele.eles('xpath:./text() | *'):
+                if current_tag in ('br', 'p') and str_list and str_list[-1] != '\n':
+                    str_list.append('\n')
                if isinstance(el, str):
                    if el.replace(' ', '').replace('\n', '') != '':
                        if pre:
@@ -66,10 +71,10 @@ class SessionElement(DrissionElement):
                        str_list.append('\n')
                    else:
                        str_list.append(' ')
+                    current_tag = None
                else:
                    str_list.extend(get_node(el, pre))
-                    if el.tag in ('br', 'p',) and str_list and str_list[-1] != '\n':
+                    current_tag = el.tag
-                        str_list.append('\n')
            return str_list
@@ -138,7 +143,8 @@ class SessionElement(DrissionElement):
        else:
            texts = [x if isinstance(x, str) else x.text for x in self.eles('xpath:./text() | *')]
-        return [format_html(x) for x in texts if x and x.replace('\n', '').replace('\t', '').replace(' ', '') != '']
+        return [format_html(x.strip(' ')) for x in texts if
+                x and x.replace('\n', '').replace('\t', '').replace(' ', '') != '']
    def parents(self, num: int = 1):
        """返回上面第num级父元素                                         \n