"""
http://www.ccgp-hunan.gov.cn/page/notice/more.jsp
https://hunan.zcygov.cn/luban/announcement/list?utm=a0017.b0064.3.5.f7fcb4c03c7411ed84984b6678c33275
需求
1.招投标网站爬虫软件
2.需要有软件界面
3.可以选择下载保存公告文件
4.文件格式pdf
"""
import requests
from lxml import etree
# Fetch one page of the notice list and print the result of an XPath query
# run against the raw response text.

# Endpoint the form below is POSTed to.
url = 'http://www.ccgp-hunan.gov.cn/mvc/getNoticeList4Web.do'

# Headers imitate a browser XHR issued from the notice list page (see the
# Referer and X-Requested-With values). The session cookie is not sent here;
# it is passed separately through `cookies` below.
headers = {
    'Accept': 'application/json, text/javascript, */*; q=0.01',
    'Accept-Language': 'zh-CN,zh;q=0.9',
    'Connection': 'keep-alive',
    'Content-Type': 'application/x-www-form-urlencoded; charset=UTF-8',
    'Origin': 'http://www.ccgp-hunan.gov.cn',
    'Referer': 'http://www.ccgp-hunan.gov.cn/page/notice/more.jsp',
    'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/111.0.0.0 Safari/537.36',
    'X-Requested-With': 'XMLHttpRequest',
}

# Form payload: only the date range and paging fields carry values; every
# other field is sent as an empty string (presumably "no filter" -- confirm
# against the site's search form).
data = {
    'pType': '',
    'prcmPrjName': '',
    'prcmItemCode': '',
    'prcmOrgName': '',
    'startDate': '2023-01-01',
    'endDate': '2023-03-11',
    'prcmPlanNo': '',
    'page': '1',
    'pageSize': '18',
}

# NOTE(review): hard-coded session id; presumably copied from a browser
# session and likely to expire -- confirm whether the endpoint needs it.
cookies = {
    'JSESSIONID': 'BD97B12D61360D93BEC5912F62B0F8BC',
}

# requests applies no timeout by default, so without one a stalled server
# would block this script forever.
resp = requests.post(
    url,
    headers=headers,
    data=data,
    cookies=cookies,
    timeout=30,
)
# Fail with a clear HTTPError on 4xx/5xx instead of a confusing JSON decode
# error further down.
resp.raise_for_status()

# From here on `data` no longer holds the form payload: it is rebound to the
# value stored under the "rows" key of the JSON reply.
data = resp.json()["rows"]

# NOTE(review): the body that was just decoded as JSON is parsed as HTML
# here, so the XPath for rows of <table class="ejcggg"> probably matches
# nothing. Confirm whether this query was meant for a different (HTML) page.
tree = etree.HTML(resp.text)
lis = tree.xpath('//table[@class="ejcggg"]/tr')
print(lis)