必备条件
需要先手动编写一个文字列表(目前还不知道如何自动获取这个列表, 待解决)
word_list = [
"坏", "少", "远", "大", "九", "左", "近", "呢", "十...word in utf_word_map.items():
html = html.replace("%s;" % utf_code, word)
# 使用xpath 获取 主贴
xp_html...= etree.HTML(html)
subject_text = ''.join(xp_html.xpath('//div[@xname="content"]//div[@class="tz-paragraph...word_list = [
"坏", "少", "远", "大", "九", "左", "近", "呢", "十", "高", "着",...= etree.HTML(normal_html)
subject_text = ''.join(xp_html.xpath('//div[@xname="content"]//div