最近在学习 Python 爬虫，写了一个小例子，主要用来爬取 Bing 壁纸。
源码如下：
```python
import requests
from bs4 import BeautifulSoup
import re
import os
from urllib.request import urlretrieve
import time
from email.header import Header
from email.mime.text import MIMEText
from email.utils import parseaddr, formataddr
import smtplibclass BingImgSave:def __init__(self):self.user_agent = 'Mozilla/4.0 (compatible; MSIE 5.5; Windows NT)'self.headers={'User-Agent':self.user_agent}self.baseurl='https://bing.ioliu.cn/'self.nextpage = 0def getHtml(self, urls):r = requests.get(urls, headers=self.headers)print(type(r))return rdef parseHtml(self, response):soup = BeautifulSoup(response.text, 'lxml', from_encoding='utf-8') items = soup.find_all('div&#