这几天在学习 Selenium，顺便用 Selenium + Python 写了一个比较简陋的爬虫，现附上源码，有时间再补充补充： from selenium import webdriver from selenium.webdriver.support.wait import WebDriverWait from selenium.webdriver.support import expected_conditions as EC from selenium.webdriver.common.by…
基础页面：https://movie.douban.com/top250 代码： from time import sleep from requests import get from bs4 import BeautifulSoup import re import pymysql db = pymysql.connect(host='localhost', user='root', password='123456', db='douban', charset='utf8mb4', cur…
# -*- coding:utf-8 -*- __author__ = "MuT6 Sch01aR" import requests from pyquery import PyQuery def GetDouBanMovie(): a = 1 for i in range(0,250,25): url = "https://movie.douban.com/top250?start=%s&filter=" %i r = requests.get(url)…
1 import json import requests from requests.exceptions import RequestException import re import time def get_one_page(url): try: headers = { 'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_3) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/…