#爬视频
import os
import shutil
import urllib.request

# Download a video from a direct MP4 link and save it as ./zuoye/shiping.mp4.
# NOTE(review): the query string carries an auth_key, so the link presumably
# expires — confirm and refresh the URL before running.
url = 'https://vd4.bdstatic.com/mda-na52r5q2j82ygva2/sc/cae_h264_nowatermark/1641435544451331823/mda-na52r5q2j82ygva2.mp4?v_from_s=hkapp-haokan-hbe&auth_key=1641483831-0-0-b9a71064a13394ea1324fdb4480d1c5e&bcevod_channel=searchbox_feed&pd=1&pt=3&logid=0830919840&vid=12005734968040248575&abtest=3000203_4&klogid=0830919840'

# open() does not create missing parent directories, so make sure the
# output folder exists before writing into it.
os.makedirs('./zuoye', exist_ok=True)

# The context managers close both the HTTP response and the output file even
# if the transfer fails part-way through.
with urllib.request.urlopen(url) as res, open('./zuoye/shiping.mp4', 'wb') as f:
    # Copy in chunks so the whole video is never held in memory at once.
    shutil.copyfileobj(res, f)
f.close()
#爬歌曲
import os
import shutil
import urllib.request

# Download an MP3 from a direct link and save it as ./zuoye/歌曲.mp3.
url = 'https://cu-sycdn.kuwo.cn/ad47ca411673aeb42536c8d3e159814c/61d70a7f/resource/n2/89/83/1406545095.mp3'

# open() does not create missing parent directories, so make sure the
# output folder exists before writing into it.
os.makedirs('./zuoye', exist_ok=True)

# The context managers close both the HTTP response and the output file even
# if the transfer fails part-way through.
with urllib.request.urlopen(url) as res, open('./zuoye/歌曲.mp3', 'wb') as f:
    # Copy in chunks so the whole file is never held in memory at once.
    shutil.copyfileobj(res, f)
一、urllib模块向服务器发起请求的方法是?
urllib.request.urlopen(url)
二、翻页爬取这个网页上面的源代码,并且保存到本地,注意编码:https://www.1ppt.com/moban/
import os
import urllib.parse
import urllib.request

# Fetch listing pages 1-3 of https://www.1ppt.com/moban/ and save the HTML of
# each page to ./zuoye/第<n>页.html.

# Custom request headers; every request is sent with this browser User-Agent.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/94.0.4606.81 Safari/537.36'
}

# open() does not create missing parent directories, so make sure the
# output folder exists before writing into it.
os.makedirs('./zuoye', exist_ok=True)

for n in range(1, 4):
    url = f'https://www.1ppt.com/moban/ppt_moban_{n}.html'
    print(url)
    # Build the request object that carries the custom headers.
    request = urllib.request.Request(url=url, headers=headers)
    # Send the request; the context manager closes the connection once the
    # body has been read, even if reading or decoding raises.
    with urllib.request.urlopen(request) as response:
        # The response body is bytes; decode it to text.
        # NOTE(review): assumes the site serves GB2312 — a byte sequence
        # outside that charset raises UnicodeDecodeError; confirm against the
        # page's declared charset.
        html = response.read().decode('gb2312')
    # Save locally: mode 'w' creates/truncates the file, written as UTF-8.
    with open('./zuoye/第' + str(n) + '页.html', 'w', encoding='utf-8') as file:
        file.write(html)
    print(f'第{n}页.html写入成功')
三、自己去网上找一张喜欢的图片或者视频,爬取下来,保存到本地(图片视频没有要求)
# Download an image from a direct link and save it as ./zuoye/图片.jpg.
import os
import shutil
import urllib.request

url = 'https://gimg2.baidu.com/image_search/src=http%3A%2F%2Farticle-fd.zol-img.com.cn%2Ft_s998x562c5%2Fg5%2FM00%2F0A%2F02%2FChMkJltpVKGIQENcAAKaC93UFtUAAqi5QPdcOwAApoj403.jpg&refer=http%3A%2F%2Farticle-fd.zol-img.com.cn&app=2002&size=f9999,10000&q=a80&n=0&g=0n&fmt=jpeg?sec=1644072868&t=c9b5ba34baebe0d96a083b818e30cee4'

# open() does not create missing parent directories, so make sure the
# output folder exists before writing into it.
os.makedirs('./zuoye', exist_ok=True)

# The context managers close both the HTTP response and the output file even
# if the transfer fails part-way through.
with urllib.request.urlopen(url) as res, open('./zuoye/图片.jpg', 'wb') as f:
    # Copy in chunks so the whole image is never held in memory at once.
    shutil.copyfileobj(res, f)
