qq_38824178 2019-08-08 16:53 采纳率: 50%
浏览 846

Scrapy框架如何循环爬取列表中所有的url的信息

代码如下
import scrapy
import json
import re
from plane.items import PlaneItem

# Flight-list query URL; the two %s placeholders receive the origin and
# destination city codes, in that order.
_FLIGHT_LIST_URL = (
    'https://flight-api.tuniu.com/query/flight/v2/list'
    '?callback=jQuery17207759591352059797_1565148905476'
    '&{"withTransfer":true,"passengers":[{"count":1,"psgType":"ADT"}],'
    '"voyType":"ST","voys":[{"orgCity":"%s","dstCity":"%s",'
    '"deptDate":"2019-08-09"}],'
    '"tokenKey":"G92ZWFuZHBlYWNlMmxpZ2h0L3YyL2xpc","useToken":true}'
    '&_=1565148905672'
)


def _build_route_urls(cities):
    """Return one query URL for every ordered pair of distinct cities."""
    # Built in a function rather than a class-level comprehension: names bound
    # in a class body are not visible inside a comprehension's inner clauses.
    return [
        _FLIGHT_LIST_URL % (origin, destination)
        for origin in cities
        for destination in cities
        if origin != destination
    ]


class PlanespiderSpider(scrapy.Spider):
    """Spider that requests flight lists for several routes and yields items.

    Every URL in ``start_urls`` is requested and handed to :meth:`parse`.
    ``start_urls`` holds the original CAN -> BJS query followed by one query
    per ordered pair of distinct codes in ``cityname``.
    """

    name = 'planespider'
    allowed_domains = ['tuniu.com']

    # City codes to combine into origin/destination pairs.
    cityname = ('AQG', 'AKA', 'ABC')
    # Generated query URLs, one per ordered pair of distinct city codes.
    url1 = _build_route_urls(cityname)

    # The generated URLs must be part of start_urls, otherwise they are
    # built but never requested.
    start_urls = [_FLIGHT_LIST_URL % ('CAN', 'BJS')] + url1

    # Keys copied verbatim from each flight record into the item.
    _ITEM_FIELDS = (
        'airCom',
        'flightNo',
        'orgCity',
        'dstCity',
        'orgAirport',
        'dstAirport',
        'deptTime',
        'arrvTime',
        'rate',
    )

    def parse(self, response):
        """Extract the JSON object from the response and yield one item per flight.

        The response body is expected to contain a JSON object wrapped in
        other text (the URL passes a ``callback`` parameter); the outermost
        ``{...}`` span is extracted and decoded.

        Responses with no JSON object, invalid JSON, or no
        ``data.airBasic.flightMap`` mapping are logged and skipped instead of
        raising.

        Yields:
            PlaneItem: a fresh item for each value of ``flightMap``.
        """
        wrapped = re.match(r".*?({.*}).*", response.body.decode(), re.S)
        if wrapped is None:
            self.logger.warning("No JSON object found in %s", response.url)
            return

        try:
            plane_json = json.loads(wrapped.group(1))
        except ValueError:
            self.logger.warning("Invalid JSON in %s", response.url)
            return

        try:
            flight_map = plane_json['data']['airBasic']['flightMap']
        except (KeyError, TypeError):
            # TypeError covers an intermediate value that is null/non-dict.
            self.logger.warning("No flightMap in %s", response.url)
            return

        for each in flight_map.values():
            # A new item per flight: reusing one instance would make every
            # yielded item alias the same object and show only the last flight
            # to any consumer that keeps references.
            item = PlaneItem()
            for field in self._ITEM_FIELDS:
                item[field] = each[field]
            yield item
  • 写回答

1条回答 默认 最新

  • zqbnqsdsmd 2019-08-10 23:48
    关注
    评论

报告相同问题?

悬赏问题

  • ¥50 永磁型步进电机PID算法
  • ¥15 sqlite 附加(attach database)加密数据库时,返回26是什么原因呢?
  • ¥88 找成都本地经验丰富懂小程序开发的技术大咖
  • ¥15 如何处理复杂数据表格的除法运算
  • ¥15 如何用stc8h1k08的片子做485数据透传的功能?(关键词-串口)
  • ¥15 有兄弟姐妹会用word插图功能制作类似citespace的图片吗?
  • ¥200 uniapp长期运行卡死问题解决
  • ¥15 latex怎么处理论文引理引用参考文献
  • ¥15 请教:如何用postman调用本地虚拟机区块链接上的合约?
  • ¥15 为什么使用javacv转封装rtsp为rtmp时出现如下问题:[h264 @ 000000004faf7500]no frame?