下载比较小的文件:
# 方法一:使用urllib库 # -*- coding:utf-8 -*- import urllib import time url = 'http://mvideo.spriteapp.cn/video/2017/0414' \ '/697de826-20b5-11e7-9c72-1866daeb0df1cut_wpcco.mp4' print "downloading with urllib" start = time.time() urllib.urlretrieve(url, "video.mp4") end = time.time() print 'Finish in :', end - start
# 方法二:使用urllib2库 # -*- coding:utf-8 -*- import urllib2 import time url = 'http://mvideo.spriteapp.cn/video/2017/0414/' \ '697de826-20b5-11e7-9c72-1866daeb0df1cut_wpcco.mp4' print "downloading with urllib2" start = time.time() data = urllib2.urlopen(url).read() with open('video.mp4', 'wb') as video: video.write(data) end = time.time() print 'Finish in :', end - start
# 方法三:使用requests库 # -*- coding:utf-8 -*- import requests import time url = 'http://mvideo.spriteapp.cn/video/2017/0414/' \ '697de826-20b5-11e7-9c72-1866daeb0df1cut_wpcco.mp4' print "downloading with requests" start = time.time() r = requests.get(url) with open('video.mp4', 'wb') as video: video.write(r.content) end = time.time() print 'Finish in :', end - start
下载比较大的文件:
# 方法一:使用urllib2库 # -*- coding:utf-8 -*- import urllib2 import time url = 'http://mvideo.spriteapp.cn/video/2017/0414/' \ '697de826-20b5-11e7-9c72-1866daeb0df1cut_wpcco.mp4' r = urllib2.Request(url) u = urllib2.urlopen(r) start = time.time() with open('video.mp4', 'w') as f: while True: tmp = u.read(1024) if not tmp: break f.write(tmp) end = time.time() print 'Finish in :', end - start
# 方法二:使用requests库 # -*- coding:utf-8 -*- import requests import time url = 'http://mvideo.spriteapp.cn/video/2017/0414/' \ '697de826-20b5-11e7-9c72-1866daeb0df1cut_wpcco.mp4' # 当把get函数的stream参数设置成False时, # 它会立即开始下载文件并放到内存中,如果文件过大,有可能导致内存不足。 # 当把get函数的stream参数设置成True时,它不会立即开始下载, # 使用iter_content或iter_lines遍历内容或访问内容属性时才开始下载 r = requests.get(url, stream=True) f = open("file_path", "wb") start = time.time() for chunk in r.iter_content(chunk_size=1024): if chunk: f.write(chunk) f.flush() # iter_content:一块一块的遍历要下载的内容 # iter_lines:一行一行的遍历要下载的内容 # 这两个函数下载大文件可以防止占用过多的内存,因为每次只下载小部分数据 end = time.time() print 'Finish in :', end - start