用 Python 爬取的网页内容是乱码,这是怎么回事?应该怎么修改?求告知。
import requests
from bs4 import BeautifulSoup
def get_novel_chapter():
    """Fetch the novel's index page and return its chapter list.

    Returns:
        A list of ``(url, title)`` tuples, one for every
        ``div.chapter-item`` element that contains a link with an ``href``.
        ``title`` is the link text exactly as it appears in the page.

    Raises:
        requests.RequestException: If the request fails, times out, or the
            server answers with an HTTP error status.
    """
    # Local import keeps this function self-contained.
    from urllib.parse import urljoin

    site_root = 'https://fanqienovel.com/'
    root_url = 'https://fanqienovel.com/page/7377020139255893054?enter_from=search'

    # Without a timeout, requests can wait forever on a stalled connection.
    response = requests.get(root_url, timeout=10)
    # Fail loudly on 4xx/5xx instead of silently parsing an error page.
    response.raise_for_status()
    response.encoding = 'utf-8'

    soup = BeautifulSoup(response.text, 'html.parser')
    data = []
    for chapter in soup.find_all('div', class_='chapter-item'):
        link = chapter.find('a')
        if link is None:
            continue
        # An <a> without href would raise KeyError on link['href'].
        href = link.get('href')
        if not href:
            continue
        # urljoin also handles hrefs that are absolute or lack a leading "/".
        data.append((urljoin(site_root, href), link.get_text()))
    return data
def get_chapter_content(url):
    """Download one chapter page and return the text of its reader container.

    Args:
        url: Absolute URL of the chapter page.

    Returns:
        The text of the first ``div`` carrying both the
        ``muye-reader-content`` and ``noselect`` classes, or an empty string
        when the page contains no such element.

    Raises:
        requests.RequestException: If the request fails, times out, or the
            server answers with an HTTP error status.
    """
    # Without a timeout, requests can wait forever on a stalled connection.
    response = requests.get(url, timeout=10)
    # Fail loudly on 4xx/5xx instead of silently parsing an error page.
    response.raise_for_status()
    response.encoding = 'utf-8'

    soup = BeautifulSoup(response.text, 'html.parser')
    # A CSS selector matches the two classes in any order and alongside extra
    # classes; class_='a b' only matches that exact attribute string.
    content = soup.select_one('div.muye-reader-content.noselect')
    if content is None:
        # Page layout differs (or the request was redirected): no reader div.
        return ''
    # NOTE(review): the response is already decoded as UTF-8, so if the text
    # still looks garbled the site may be obfuscating characters with a custom
    # web font (private-use code points) -- confirm by inspecting the page's
    # @font-face rules. Undoing that needs a code-point mapping, which this
    # function does not attempt.
    return content.get_text()
# Save chapters from the index page, one UTF-8 text file per chapter.
for url, title in get_novel_chapter():
    # Download before opening the file so a failed request does not leave an
    # empty file behind.
    content = get_chapter_content(url)
    # Titles come straight from the page: drop surrounding whitespace and
    # replace characters that are invalid (or unsafe) in file names.
    safe_title = "".join(
        "_" if ch in '\\/:*?"<>|' or ord(ch) < 32 else ch
        for ch in title.strip()
    ) or "untitled"
    with open("%s.txt" % safe_title, "w", encoding='utf-8') as fout:
        fout.write(content)
    # Only the first chapter is saved -- presumably a limit for testing;
    # remove this break to download every chapter.
    break
输出的结果是乱码。