import requests
import csv,re
# Scrape one dangdang.com category listing page and dump every regex match
# to book.csv (one row per match, columns in the order of the named groups:
# name, chinapublisher, commentnum, foreignpublisher).
url1 = 'http://category.dangdang.com/'
url2 = 'cp01.58.03.00.00.00.html'
url3 = url1 + url2

# Compiled once up front; re.S lets `.` span newlines so a single match can
# stretch across several lines of the HTML.
obj = re.compile(
    r'</div>.*?单品标题" target="_blank" > (?P<name>.*?)</a>.*?target="_blank" title="(?P<chinapublisher>.*?)">.*?p">(?P<commentnum>.*?)</a></p>.*?单品出版社(?P<foreignpublisher>.*?)>',
    re.S)

# Fetch before touching the output file so a failed request does not
# truncate an existing book.csv. Without a timeout requests can block
# indefinitely on an unresponsive server.
resp = requests.get(url3, timeout=10)
# Fail loudly on 4xx/5xx instead of silently writing an empty CSV.
resp.raise_for_status()
# NOTE(review): resp.text is decoded with whatever charset requests infers
# from the response; if the page is not served with the encoding requests
# picks, the Chinese literals in the pattern will never match -- confirm,
# and set resp.encoding explicitly if needed.

# newline='' is what the csv module expects for files handed to csv.writer
# (prevents blank lines between rows on Windows); the `with` block
# guarantees the file is flushed and closed even if the loop raises.
with open('book.csv', mode='w', encoding='utf-8', newline='') as f:
    csvwriter = csv.writer(f)
    result = obj.finditer(resp.text)
    # Debug output kept from the original: prints the iterator's repr,
    # not the matches themselves.
    print(result)
    for it in result:
        print(it.group("name"))
        print(it.group("chinapublisher"))
        print(it.group("commentnum"))
        print(it.group("foreignpublisher"))
        dic = it.groupdict()
        csvwriter.writerow(dic.values())

print('over!')