看完了 Python 基础语法教程,写了个下载网页图片的小程序练手。下载图片只要 3 行代码,慢慢理解了那句“人生苦短,我用 Python”的境界。
import re
import requests
from bs4 import BeautifulSoup
import xlwt
import os
def getpicurl(alist):
    """Collect the ``src`` attribute of every element in *alist*.

    Args:
        alist: Iterable of objects exposing ``.get('src')`` (for example the
            ``<img>`` tags returned by ``BeautifulSoup.find_all('img')``).

    Returns:
        List of the non-empty ``src`` values, in input order.
    """
    # A tag without a src attribute yields None from .get(); skip those (and
    # empty strings) so callers never try to download a missing URL.
    return [src for src in (tag.get('src') for tag in alist) if src]
def downPic(picUrlSet):
    """Download every URL in *picUrlSet* into ``d://downGirls/img/``.

    Each file is named after the last ``/``-separated segment of its URL, so
    two URLs ending in the same segment overwrite each other.

    Args:
        picUrlSet: Iterable of image URL strings.
    """
    save_dir = "d://downGirls/img/"
    # Create the target directory once, up front. exist_ok=True keeps this
    # from raising FileExistsError when the directory is already there
    # (from an earlier image or an earlier run of the script).
    os.makedirs(save_dir, exist_ok=True)
    for image_url in picUrlSet:
        reply = requests.get(image_url)
        file_name = image_url.split('/')[-1]
        # Binary mode: the response body is raw image bytes.
        with open(save_dir + file_name, 'wb') as out:
            out.write(reply.content)
def mainMethod(url):
    """Download every image referenced by the page at *url*.

    Fetches the page, parses it with BeautifulSoup (``lxml`` parser), collects
    the ``src`` of each ``<img>`` tag via ``getpicurl`` and passes the
    resulting URLs to ``downPic``.

    Args:
        url: Address of the HTML page to scan.
    """
    # Local import so this function stays self-contained.
    from urllib.parse import urljoin

    response = requests.get(url)
    # Original author's note: the site is not served as UTF-8, so decode the
    # body with the encoding requests detects from the content instead of the
    # one taken from the response headers.
    response.encoding = response.apparent_encoding
    html = BeautifulSoup(response.text, 'lxml')
    imgList = html.find_all('img')
    # Resolve relative src values (e.g. "/img/a.jpg") against the page's final
    # URL so requests can fetch them; drop entries with no src at all.
    picUrlSet = [
        urljoin(response.url, src) for src in getpicurl(imgList) if src
    ]
    downPic(picUrlSet)
# Module-level call: scrapes this page whenever the file is executed (or imported).
mainMethod("http://www.webkfa.com/ageof18/picxjitem_web.jsp?id=255")