當前位置：首頁 > 编程语言 > python > 内容正文

python

python爬取图片源码_python抓取百度图片源码

發布時間：2025/3/21 python 24 豆豆

生活随笔收集整理的這篇文章主要介紹了 python爬取图片源码_python抓取百度图片源码，小編覺得挺不錯的，現在分享給大家，幫大家做個參考。

#!/usr/bin/python

# -*- coding:utf-8 -*-

import httplib2

import urllib.request

import json

#import urllib2

import re

import os

import string

class BaiduImage(object):
    """Fetch Baidu image-search results and save the JPEG files locally.

    ``request`` pages through the search endpoint, ``PAGE_SIZE`` results at
    a time, and passes each page's ``imgs`` list to ``download``, which
    stores every ``.jpg`` it finds under ``IMAGE_DIR``.
    """

    # Directory (relative to the working directory) that receives the files.
    IMAGE_DIR = 'image'
    # Results requested per call (``rn``) and the step added to ``pn``.
    PAGE_SIZE = 60
    # Seconds to wait for a single image before giving up on it.
    DOWNLOAD_TIMEOUT = 30
    # Search endpoint; ``rn`` is the page size and ``pn`` the result offset.
    SEARCH_URL = ('http://image.baidu.com/search/avatarjson'
                  '?tn=resultjsonavatarnew&ie=utf-8&word=風景&cg=girl'
                  '&rn={rn}&pn={pn}')
    # Captures the file stem between the last '/' and '.jpg' in a URL.
    _JPG_NAME = re.compile(r'.*/(.*?)\.jpg', re.S)

    def __init__(self):
        """Print the start-up banner and make sure the output directory exists."""
        super(BaiduImage, self).__init__()
        # The original had this text as a bare expression statement, which
        # does nothing; it is a banner, so actually print it.
        print(u'圖片獲取中,CTRL+C 退出程序...')
        # Offset of the next result to request (sent as ``pn``).
        # NOTE(review): starting at PAGE_SIZE skips the first page of
        # results - confirm that this is intended.
        self.page = self.PAGE_SIZE
        os.makedirs(self.IMAGE_DIR, exist_ok=True)

    def request(self):
        """Page through the search results, downloading each page's images.

        Runs until the server returns a non-200 status or a page with no
        ``imgs`` entries, or until interrupted with CTRL+C
        (``KeyboardInterrupt`` is not caught and propagates to the caller).
        Any other error is printed together with the last decoded response
        and ends the crawl.
        """
        last_response = ""
        # Bound before the ``try`` so the ``finally`` can always print it.
        conn = None
        try:
            conn = httplib2.Http()
            # NOTE(review): 'test/html' looks like a typo for 'text/html';
            # left unchanged because it is sent to the server as-is.
            headers = {
                'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64; rv:40.0) Gecko/20100101 Firefox/40.0',
                'Content-type': 'test/html',
            }
            while True:
                request_url = self.SEARCH_URL.format(rn=self.PAGE_SIZE,
                                                     pn=self.page)
                resp, content = conn.request(request_url, 'GET', body=None,
                                             headers=headers)
                if resp.status != 200:
                    # Retrying the same page immediately would spin forever.
                    print("HTTP status {}; stopping".format(resp.status))
                    break
                decoded = json.loads(content.decode("UTF-8"))
                last_response = decoded
                images = decoded.get('imgs')
                if not images:
                    # An empty page means there is nothing left to fetch.
                    break
                self.download(images)
                self.page += self.PAGE_SIZE
                print(self.page)
        except Exception as e:
            # Print both values; ``e + last_response`` would itself raise.
            print(e, last_response)
        finally:
            # Debug output kept from the original implementation.
            print(conn)

    def download(self, data):
        """Save every ``.jpg`` referenced by *data* into ``IMAGE_DIR``.

        Args:
            data: iterable of result dicts; each is expected to carry the
                full-size image address under ``'objURL'``. Per the original
                author's notes, ``'thumbURL'`` (size 200) and ``'hoverURL'``
                (size 360) are smaller alternatives.

        Entries without a usable ``.jpg`` URL are skipped, files that already
        exist are not downloaded again, and a failure on one entry is printed
        without stopping the rest. A ``<index>:<url>`` progress line is
        printed for every entry.
        """
        # Also works when the instance was built without ``__init__``.
        os.makedirs(self.IMAGE_DIR, exist_ok=True)
        for count, entry in enumerate(data, 1):
            # Bound up front so the progress line never hits an unbound name.
            url = None
            try:
                url = entry['objURL']
                print(url)
                match = self._JPG_NAME.search(url)
                if match is None:
                    # Not a .jpg address: skip it without fetching anything.
                    continue
                file_name = '{}/{}.jpg'.format(self.IMAGE_DIR, match.group(1))
                if os.path.exists(file_name):
                    print(file_name + "存在!")
                    continue
                with urllib.request.urlopen(
                        url, timeout=self.DOWNLOAD_TIMEOUT) as response:
                    image_bytes = response.read()
                with open(file_name, 'wb') as f:
                    f.write(image_bytes)
            except Exception as e:
                # Best effort: report the failure and move on to the next one.
                print(e)
            finally:
                print("{}:{}".format(count, url))

if __name__ == '__main__':
    # Script entry point: build the crawler and start paging through results.
    BaiduImage().request()

總結

以上是生活随笔為你收集整理的python爬取图片源码_python抓取百度图片源码的全部內容，希望文章能夠幫你解決所遇到的問題。

如果覺得生活随笔網站內容還不錯，歡迎將生活随笔推薦給好友。

上一篇：奇安信为什么大量招人_券商招人鄙视链：9
下一篇： python做社会网络分析_社交网络分析

日韩av黄I国产麻豆传媒I国产91av视频在线观看I日韩一区二区三区在线看I美女国产在线I麻豆视频国产在线观看I成人黄色短片

python

python爬取图片源码_python抓取百度图片源码

總結