fix: UTF-8 decode error (closes #156, #157, #158, #161)

This commit is contained in:
wangxiaowen 2024-11-13 18:36:46 +08:00
parent dae30ecce8
commit b70b6725f3
2 changed files with 6 additions and 2 deletions

View File

@@ -14,6 +14,7 @@ from tqdm import trange, tqdm
import requests
import time
import platform
import chardet
texts = list()
all_friends = list()
@@ -234,7 +235,9 @@ if __name__ == '__main__':
signal.signal(signal.SIGINT, signal_handler)
signal.signal(signal.SIGTERM, signal_handler)
for i in trange(int(count / 100) + 1, desc='Progress', unit='100条'):
message = Request.get_message(i * 100, 100).content.decode('utf-8')
content_bytes = Request.get_message(i * 100, 100).content
detected_encoding = chardet.detect(content_bytes)['encoding']
message = content_bytes.decode(detected_encoding if detected_encoding else "utf-8")
time.sleep(0.2)
html = Tools.process_old_html(message)
if "li" not in html:

View File

@@ -7,4 +7,5 @@ pyarrow==14.0.1
openpyxl==3.1.2
pyzbar~=0.1.9
qrcode~=7.4.2
fake-useragent
fake-useragent~=1.5.1
chardet~=5.2.0