# Branch: master (1 branch)
# File: fun/爬ZOL美女图.py

import os
import re
import time
import urllib.error
import urllib.request
# proxy = urllib.request.ProxyHandler({"http" :"183.172.192.248:1080"})
# opener = urllib.request.build_opener(proxy ,urllib.request.HTTPHandler)
# urllib.request.install_opener(opener)
# Crawl the first ten "good" listing pages of the ZOL dcbbs board, open every
# thread linked from them, and save each "t_s" image found in a thread into
# SAVE_DIR.

LIST_URL_PREFIX = "http://bbs.zol.com.cn/dcbbs/d33975_good_p"
LIST_URL_SUFFIX = ".html#c"
THREAD_URL_PREFIX = "http://bbs.zol.com.cn/dcbbs/"
THREAD_URL_SUFFIX = ".html"
IMAGE_URL_PREFIX = "https://bbs-fd.zol-img.com.cn/t_s"
IMAGE_URL_SUFFIX = ".jpg"
SAVE_DIR = "d:/zol/"

# Compiled once instead of on every loop iteration.
THREAD_ID_RE = re.compile('data-url="/dcbbs/(.*?).html">')
IMAGE_KEY_RE = re.compile(
    'data-original="https://bbs-fd.zol-img.com.cn/t_s(.*?).jpg'
)


def report_url_error(err):
    """Print the HTTP status code and/or the failure reason of *err*.

    Args:
        err: The ``urllib.error.URLError`` (or subclass) that was raised.
    """
    if hasattr(err, "code"):
        print(err.code)
    if hasattr(err, "reason"):
        print(err.reason)


def fetch_text(url, encoding):
    """Download *url* and return its body decoded with *encoding*.

    Bytes that cannot be decoded are dropped (``errors="ignore"``).

    Args:
        url: Address of the page to download.
        encoding: Name of the codec used to decode the response body.

    Returns:
        The decoded page text.

    Raises:
        urllib.error.URLError: If the request fails.
    """
    # The context manager closes the connection even if read() raises.
    with urllib.request.urlopen(url) as response:
        return response.read().decode(encoding, "ignore")


def extract_thread_ids(listing_html):
    """Return the thread identifiers referenced by a listing page.

    Args:
        listing_html: Text of a listing page.

    Returns:
        A list with the part of every ``data-url="/dcbbs/<id>.html">``
        attribute that sits between ``/dcbbs/`` and ``.html``.
    """
    return THREAD_ID_RE.findall(listing_html)


def extract_image_keys(thread_html):
    """Return the image keys referenced by a thread page.

    Args:
        thread_html: Text of a thread page.

    Returns:
        A list with the part of every ``data-original`` image URL that sits
        between the ``t_s`` prefix and the ``.jpg`` suffix.
    """
    return IMAGE_KEY_RE.findall(thread_html)


def image_filename(image_key):
    """Return the local path under SAVE_DIR used to store *image_key*.

    Args:
        image_key: A key as returned by ``extract_image_keys``.

    Returns:
        ``SAVE_DIR`` + a 7-character slice of the key + ``.jpg``.
    """
    # NOTE(review): [-8:-1] keeps 7 characters and drops the key's final
    # character, so two keys that differ only there map to the same file and
    # the later download overwrites the earlier one. Kept unchanged so that
    # on-disk names stay the same; confirm whether [-8:] was intended.
    return SAVE_DIR + image_key[-8:-1] + ".jpg"


def main():
    """Crawl listing pages 0-9 and download every image found.

    A failed request is reported and skipped, so one unreachable page,
    thread or image does not abort the rest of the crawl.
    """
    # urlretrieve does not create missing directories.
    os.makedirs(SAVE_DIR, exist_ok=True)

    count = 0
    for page in range(0, 10):
        list_url = LIST_URL_PREFIX + str(page) + LIST_URL_SUFFIX
        try:
            # Listing pages are decoded as UTF-8, thread pages as GBK.
            listing_html = fetch_text(list_url, "utf-8")
        except urllib.error.URLError as err:
            report_url_error(err)
            continue

        for thread_id in extract_thread_ids(listing_html):
            thread_url = THREAD_URL_PREFIX + thread_id + THREAD_URL_SUFFIX
            try:
                thread_html = fetch_text(thread_url, "GBK")
            except urllib.error.URLError as err:
                report_url_error(err)
                continue

            for image_key in extract_image_keys(thread_html):
                image_url = IMAGE_URL_PREFIX + image_key + IMAGE_URL_SUFFIX
                count += 1
                # Short pause before every fifth download to throttle
                # requests.
                if count % 5 == 0:
                    time.sleep(0.65)
                print("正在保存第%s张图片" % count)
                try:
                    urllib.request.urlretrieve(
                        image_url, filename=image_filename(image_key)
                    )
                except urllib.error.URLError as err:
                    report_url_error(err)


if __name__ == "__main__":
    main()