Python爬取必应壁纸

获取必应高清壁纸

import requests
import re
import os
from lxml import etree

# Directory (relative to the current working directory) that holds the
# downloaded wallpapers.
dirName = '必应壁纸'
# exist_ok=True creates the directory only when it is missing, without the
# race window of a separate "exists?" check followed by mkdir.
os.makedirs(dirName, exist_ok=True)
    
# Bing wallpaper gallery page URL; %d is replaced by the page number.
url = 'https://bing.ioliu.cn//?p=%d'
# Browser-like User-Agent sent with every request (built once, reused).
headers = {
    "User-Agent": 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/80.0.3987.116 Safari/537.36'
}
# Seconds to wait for a response; without a timeout a stalled connection
# would hang the script forever.
timeout = 30
# Extracts the wallpaper name from an image URL of the form ".../bing/<name>_...".
# Raw string so that \w is not treated as a (invalid) string escape.
name_pattern = re.compile(r'bing/(\w+?)_')
# Number of images downloaded so far.
number = 0
for page in range(1, 6):
    new_url = url % page  # URL of the current gallery page

    # Download the gallery page; skip the page on network/HTTP errors
    # instead of aborting the whole run.
    try:
        response = requests.get(new_url, headers=headers, timeout=timeout)
        response.raise_for_status()
    except requests.RequestException as err:
        print('第{}页获取失败,已跳过:{}'.format(page, err))
        continue

    etree_html = etree.HTML(response.text)          # build the XPath-capable tree
    img_src_list = etree_html.xpath('//img/@src')   # every <img> src on the page
    for img_src in img_src_list:
        # Ask for the 1920x1080 rendition instead of the 640x480 thumbnail.
        img_src = img_src.replace('640x480', '1920x1080')
        name_match = name_pattern.search(img_src)
        if name_match is None:
            # Not every <img> has a src matching the wallpaper pattern;
            # without this guard .group(1) would raise AttributeError.
            continue

        # Fetch the image; on failure skip it rather than saving an error
        # page under a .jpg name.
        try:
            img_response = requests.get(img_src, headers=headers, timeout=timeout)
            img_response.raise_for_status()
        except requests.RequestException as err:
            print('图片下载失败,已跳过:{} ({})'.format(img_src, err))
            continue

        number += 1
        print('正在下载第{}张图片,地址为:{}'.format(number, img_src))
        # Build the path from dirName with os.path.join so it is valid on
        # every OS (a hard-coded backslash only works on Windows).
        img_path = os.path.join(dirName, '{}.jpg'.format(name_match.group(1)))
        with open(img_path, 'wb') as save_img:
            save_img.write(img_response.content)

print('下载完毕!!!')
posted @ 2020-06-06 21:00  Free_thinker_py  阅读(103)  评论(0)  编辑  收藏  举报