# example10.py (405 B)
  1. import random
  2. import time
  3. import requests
  4. from bs4 import BeautifulSoup
  5. for page in range(10):
  6. resp = requests.get(
  7. url=f'https://movie.douban.com/top250?start={25 * page}',
  8. headers={'User-Agent': 'BaiduSpider'}
  9. )
  10. soup = BeautifulSoup(resp.text, "lxml")
  11. for elem in soup.select('a > span.title:nth-child(1)'):
  12. print(elem.text)
  13. time.sleep(random.random() * 5)