在response._content删除\x08(退格)字符,以避免页面上有这个字符时解析出错

This commit is contained in:
g1879 2020-06-09 14:32:11 +08:00
parent fe9b308562
commit 43b942e1ec

View File

@ -231,7 +231,7 @@ class SessionPage(object):
charset = 'utf-8'
else:
charset = headers['Content-Type'].split('=')[1]
r._content = r.content.replace(b'\x08', b'').replace(b'\x0d', b'') # TODO: 待测试
r._content = r.content.replace(b'\x08', b'\\b') # 避免存在退格符导致乱码或解析出错
r.encoding = charset
return_value = r
return return_value