天天看點

牛刀小試

目标:http://qq.yh31.com/zjbq/2920180_2.html

#!/usr/bin/env python
# -*- coding:utf-8 -*-
import requests
import re


def get_urls(url, timeout=10):
    """
    Fetch a page and collect the ``src`` attribute of every ``<img>`` tag.

    :param url: address of the HTML page to scan
    :param timeout: seconds to wait for the server before giving up
    :return: list of ``src`` values in the order they appear, exactly as
        written in the page (they may be relative paths)
    :raises requests.RequestException: on connection failure, timeout or
        an HTTP error status
    """
    # Without a timeout, requests waits indefinitely on a stalled server.
    response = requests.get(url, timeout=timeout)
    # Fail loudly instead of scanning an error page as if it were content.
    response.raise_for_status()
    response.encoding = "utf-8"
    # Non-greedy groups: stop at the first closing quote after src=".
    pattern = r'<img .*?src="(.*?)"'
    return re.findall(pattern, response.text)


def get_gif(url, name, timeout=10):
    r"""
    Download one image and save it as ``D:\data\<name>.gif``.

    :param url: absolute URL of the image to download
    :param name: number used as the file name (formatted with ``%d``)
    :param timeout: seconds to wait for the server before giving up
    :return: None
    :raises requests.RequestException: on connection failure, timeout or
        an HTTP error status
    :raises OSError: if the target file cannot be opened for writing
    """
    # Without a timeout, requests waits indefinitely on a stalled server.
    response_img = requests.get(url, timeout=timeout)
    # Refuse to store an HTML error page under a .gif name.
    response_img.raise_for_status()
    # .content is the raw byte payload, so no text encoding is involved.
    with open(r"D:\data\%d.gif" % name, "wb") as ft:
        ft.write(response_img.content)

if __name__ == "__main__":
    from urllib.parse import urljoin

    # Gallery pages to scrape; each is scanned for <img> tags.
    page_urls = [
        "http://qq.yh31.com/zjbq/2920180.html",
        "http://qq.yh31.com/zjbq/2920180_2.html",
    ]
    counter = 1  # running number used as the saved file name
    for page_url in page_urls:
        try:
            srcs = get_urls(page_url)
        except requests.RequestException as exc:
            print("skipping page %s: %s" % (page_url, exc))
            continue

        for src in srcs:
            # urljoin resolves root-relative, page-relative and absolute
            # src values; plain concatenation only handled the first kind.
            img_url = urljoin(page_url, src)
            try:
                get_gif(img_url, counter)
            except requests.RequestException as exc:
                # One broken image should not abort the whole run.
                print("skipping image %s: %s" % (img_url, exc))
                continue
            counter += 1
# response.text      the response body decoded to a str
# response.json()    the response body parsed as JSON
# response.content   the response body as raw bytes
牛刀小試

轉載于:https://www.cnblogs.com/zqxqx/p/9313342.html