下面是我用python写的小爬虫,报错错误出在eval()附近,但是我找了一下午都没有找到错误在那里!!跪求大神们帮助。
下面是我的代码
import requests
import time
import urllib3
import requests
from urllib.parse import urlencode
content=[]
relation=[]
eventlist=[]##所有event记录
texts=[]
texts.append('货币超发')##event会不断的加content到text里,当遍历了所有content没有新的content加进来了,程序就会自动停止
headers = {
'Host':'eeg.8wss.com',
'Referer':'http://eeg.8wss.com/main',
'User_Agent':'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/61.0.3163.79 Safari/537.36 Maxthon/5.2.7.5000',
'X-Requested-With':'XMLHttpRequest',
}
params = {
'text':texts,
'layers':1
}
base_url='http://eeg.8wss.com/api/query_abstract_event?'
def get_page(text):
url = base_url + urlencode(params)
try:
time.sleep(5)
#response=requests.get(url,headers=headers)
http=urllib3.PoolManager()
response=http.request('GET',url)
htmll=response.data.decode('UTF-8')
html=eval(htmll)
return html
except requests.ConnectionError as e:
print('Error', e.args)
time.sleep(300)
get_page(text)
def parse_page(html):
relations=html.get('relations')
event=html.get('events')
if relations:##当当前节点不能再展开时,返回的response为空
for i in relations:
if len(i)==9 and i['code'] not in content:
content.append(i)
if len(i)==4 and i['code'] not in relation:
relation.append(i)
else:
continue
if event:
for j in event:
if j['code'] not in eventlist:
eventlist.append(j)
if j['category']=='abstract':##abstract为蓝色的可衍生节点
texts.append(j['text'])
else:
continue
if __name__=='__main__':
#for text in texts:
haha = get_page(text)
results=parse_page(haha)
报错:
File "", line 36, in get_page
html=eval(htmll)
File "", line unknown
^
SyntaxError: unexpected EOF while parsing