因为他爬回来有的页数据是方块 但重新爬取一下就不是了 我想让他重新爬取这个方块数据的页 但是为什么except一直在爬这个页出不来了啊 应该怎么写 怎么办啊
import requests
import parsel
for page in range(1,168):
def get_html():
print("函数开始")
cars_data=parsel.Selector(response.text)
lis=cars_data.css('#__next > div.tw-flex > div.new-main.new > div > div > div.jsx-2898915557.wrap > ul > li')
# return lis
# def get_inf(lis_1):
for li in lis:
car_title=li.css(' li > a > dl > dt > p::text').get()
car_info_1=li.css('li > a > dl >dd:nth-child(2)::text').getall()
car_info_2=li.css('li > a > dl >dd:nth-child(3)>span::text').getall()
car_price_1 = li.css('li > a > dl >dd:nth-child(4)::text').get().replace('万','')
car_price_2=li.css('li > a > dl >dd:nth-child(4)>span::text').get().replace('新车指导价:','').replace('万','')
car_years=''.join(car_info_1).split('|')[0]
car_gonli=''.join(car_info_1).split('|')[1].replace('万公里','')
car_posotion = ''.join(car_info_1).split('|')[2]
if len(car_info_2)==2:
car_jianche=car_info_2[0]
car_guohu=car_info_2[0]
else:
car_jianche="无检测报告"
car_guohu=car_info_2[0]
for i in car_price_1:
try:
int(i)
print(car_title, car_years, car_gonli, car_posotion, car_jianche, car_guohu, car_price_1,
car_price_2)
break
except :
print(i)
print("错误开始",page)
print(car_title, car_years, car_gonli, car_posotion, car_jianche, car_guohu, car_price_1,
car_price_2)
get_html()
# get_inf(lis_5)
print("错误结束")
break
continue
print("跳出循环")
print("函数结束")
get_html()
get_inf(lis_0)
print('---------------------------------------第', page, '页---------------------------------------')