"""
Crawler
@author: Dazhuang
"""
import requests
from bs4 import BeautifulSoup
import re #正規表示式
# Module-level counter; its use is not visible in this section of the file.
s = 0

# Download the Douban Books front page. A timeout keeps the script from
# blocking forever if the server never responds.
r = requests.get('https://book.douban.com/', timeout=10)

# Parse the returned HTML with the lxml parser.
soup = BeautifulSoup(r.text, 'lxml')

# Collect every <a> tag on the page.
# (Previously the arguments here were 'p', 'comment-content'.)
pattern = soup.find_all('a')

# Print the text of each anchor. `.string` is None when a tag does not
# contain exactly one string child, so some lines may print "None".
for item in pattern:
    print(item.string)
pattern_s = re.compile('