import urllib
from bs4 import BeautifulSoup
from urllib import request
# Fetch a Douban book page and, for every element carrying the "intro" CSS
# class, print the ``href`` attribute of the first <q> element found inside it.

# Sent as the HTTP request headers for the page fetch below.
head = {'User-Agent': 'Mozilla/5.0 (X11; OpenBSD i386) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/36.0.1985.125 Safari/537.36'}
url = "https://book.douban.com/subject/26642302/"

# Named ``req`` so it does not rebind the ``request`` module imported at the
# top of the file.
req = urllib.request.Request(url, headers=head)

# The context manager closes the HTTP response even if reading or decoding
# raises.
with urllib.request.urlopen(req) as response:
    html = response.read().decode("utf-8")

bs = BeautifulSoup(html, 'html.parser')
web = bs.find_all(attrs={"class": "intro"})
for intro in web:
    quotes = intro.find_all('q')
    # An "intro" element without any <q> child would make ``quotes[0]`` raise
    # IndexError; skip it instead of aborting the whole run.
    if not quotes:
        continue
    # NOTE(review): <q> elements do not normally carry an ``href``; if a link
    # was intended here the tag name should presumably be 'a' -- confirm.
    print(quotes[0].get('href'))
简单说:除了User-Agent的header之外,还可能需要其他(更有效的,能防止被对方检测出来你是爬虫)的header。但是具体是哪个,则需要你自己调试找出来才行。
具体如何调试找出来,有哪些header?
答:详见我教程(此处不给贴地址,只能给你看图,你自己搜):