

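# Scrape the Ruanke (软科) university ranking: fetch the page, collect the table rows into a list, save them to a file, and extract the relevant information.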
import requests
from bs4 import BeautifulSoup
# Scrape the ranking table from the page, store each row as a list of cell
# texts in `schools_list`, write the rows to schools.txt (tab-separated),
# and print them.

# Send the request and fetch the HTML page.
url = 'http://www.zuihaodaxue.cn/zuihaodaxuepaiming2019.html'
# A timeout keeps the script from hanging forever on an unresponsive server.
response = requests.get(url, timeout=10)
# Fail loudly on a 4xx/5xx answer instead of parsing an error page.
response.raise_for_status()
# When the Content-Type header carries no charset, requests falls back to
# ISO-8859-1, which would garble the Chinese text; in that case use the
# encoding detected from the body instead.
if response.encoding is None or response.encoding.lower() == 'iso-8859-1':
    response.encoding = response.apparent_encoding

# Parse the HTML page and extract the required information.
soup = BeautifulSoup(response.text, 'html.parser')
table = soup.find('table', attrs={'class': 'table table-hover'})
if table is None or table.tbody is None:
    # Without this guard the script would die with an opaque AttributeError
    # on `None.tbody` / `None.find_all` whenever the page layout changes.
    raise RuntimeError(
        "ranking table ('table table-hover') not found at " + url
    )

# One inner list per table row, holding the stripped text of every <td>.
# NOTE(review): the first <tr> of <tbody> is skipped, presumably because it
# is a header row -- confirm against the actual page markup.
schools_list = [
    [cell.text.strip() for cell in row.find_all('td')]
    for row in table.tbody.find_all('tr')[1:]
]

# Save the information to a file, one tab-separated line per school.
# NOTE(review): the header names/order below are kept as written; they have
# not been verified against the columns the page actually provides.
with open('schools.txt', 'w', encoding='utf-8') as f:
    f.write('学校名称\t排名\t城市\t学校类型\n')
    f.writelines(
        '\t'.join(school_info) + '\n' for school_info in schools_list
    )

# Print the list, one row per line.
for school_info in schools_list:
    print(school_info)