#!/usr/bin/env python
# -*- coding:utf-8 -*-

import re
import requests

# Fetch the Xiaohuar home page and save every site-relative, lazy-loaded image
# it references into the current working directory.
BASE_URL = 'http://www.xiaohuar.com/'
# Seconds to wait on each request; without a timeout requests can block
# forever on an unresponsive server.
REQUEST_TIMEOUT = 10

# Download the home page HTML.
response = requests.get(BASE_URL, timeout=REQUEST_TIMEOUT)
# Fail loudly on an HTTP error status instead of scraping an error page.
response.raise_for_status()
data = response.text

# Collect the value of every lazysrc="..." attribute (the image links).
results = re.findall(r'lazysrc="(.*?)"', data)
for result in results:  # type: str

    # Links that already start with 'htt' (absolute URLs) are skipped, as in
    # the original script; only site-relative paths are downloaded.
    if result.startswith('htt'):
        continue

    # The file name is taken from the fourth '/'-separated part of the path.
    # Paths with fewer parts used to raise IndexError and abort the crawl.
    # NOTE(review): links sharing the same fourth part map to the same file
    # name and overwrite each other -- confirm this naming is intended.
    parts = result.split('/')
    if len(parts) <= 3:
        print('skipped (unexpected path): ' + result)
        continue
    img_name = parts[3]
    img_filename = img_name + '.jpg'

    # BASE_URL already ends with '/', so drop leading slashes from the path
    # to avoid a '//' in the request URL.
    img_result = BASE_URL + result.lstrip('/')

    # Fetch the image bytes; a failure on one image must not stop the rest.
    try:
        img_response = requests.get(img_result, timeout=REQUEST_TIMEOUT)
        # Do not store an HTTP error page under a .jpg name.
        img_response.raise_for_status()
    except requests.RequestException as exc:
        print('skipped (download failed): {0} ({1})'.format(img_result, exc))
        continue
    img_data = img_response.content
    print(img_filename)

    # Save the image; 'wb' writes the raw bytes without text encoding.
    with open(img_filename, 'wb') as f:
        f.write(img_data)
    print('爬取成功一张')

相关文章:

  • 2021-08-06
  • 2021-12-10
  • 2021-10-07
  • 2021-11-17
  • 2021-08-06
  • 2021-04-29
  • 2021-11-26
  • 2021-11-02
猜你喜欢
  • 2021-11-06
  • 2021-11-07
  • 2022-01-01
  • 2021-12-14
  • 2021-11-05
  • 2021-11-05
  • 2021-05-18
相关资源
相似解决方案