import requests
from bs4 import BeautifulSoup
# Listing pages to crawl: pages 1 through 5 inclusive.
# The page number has to be part of the path. The previous "#p{page}" form put
# it in the URL fragment, which is resolved client-side and never transmitted
# to the server, so every request fetched the same first page.
# NOTE(review): "/sitehome/p/{page}" is believed to be the site's paginated
# listing path -- confirm against the live site.
urls = [
    f"https://cnblogs.com/sitehome/p/{page}"
    for page in range(1, 5 + 1)
]
def parse(url, timeout=10):
    """Download *url* and return the post links found on the page.

    Args:
        url: Address of the page to fetch.
        timeout: Seconds to wait for the server before giving up; passed
            straight through to ``requests.get``. Without a timeout a
            stalled connection would block the script indefinitely.

    Returns:
        A list of ``(href, text)`` tuples, one for each ``<a>`` element
        with the ``post-item-title`` class, in document order. The list is
        empty when the page contains no such element.

    Raises:
        requests.RequestException: If the request fails, times out, or the
            server responds with a 4xx/5xx status.
    """
    print(url)
    response = requests.get(url, timeout=timeout)
    # Fail loudly on HTTP errors instead of silently parsing an error page
    # into an empty result list.
    response.raise_for_status()
    # Previously misspelled as 'uft-8', which is not a valid codec name.
    response.encoding = 'utf-8'
    soup = BeautifulSoup(response.text, 'lxml')
    links = soup.find_all('a', class_='post-item-title')
    return [(link.get('href'), link.text) for link in links]
def main() -> None:
    """Parse every URL in ``urls`` and print each result that ``parse`` returns."""
    for url in urls:
        for result in parse(url):
            print(result)
        # print('\n') writes the newline in the string plus print's own line
        # ending, leaving a visual gap in the output.
        # NOTE(review): the original indentation was lost; this separator is
        # assumed to run once per URL, after that URL's results -- confirm.
        print('\n')
# Run the crawl only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()