"""Download ten listing pages of a Baidu Tieba forum and save each as HTML.

The script requests ``base_url`` once per page with the forum keyword and a
paging offset, then writes every response body to its own file in ``dirname``.
"""
import os

import requests

base_url = 'https://tieba.baidu.com/f?'
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/77.0.3865.90 Safari/537.36',
}

# Directory the downloaded pages are written to.
dirname = './tieba/woman/'
# exist_ok=True replaces the exists()-then-makedirs() pair, which could fail
# if the directory appeared between the check and the creation.
os.makedirs(dirname, exist_ok=True)

# Forum keyword sent as the `kw` query parameter; change it to fetch another forum.
key = 'JavaScript'

# `pn` is sent as i * 50 for i = 0..9, i.e. it advances by 50 per page.
# NOTE(review): the original author derived this pattern by inspecting the
# site's own requests -- confirm it still matches the site's paging.
for i in range(0, 10):
    params = {
        'ie': 'utf-8',
        'kw': key,
        'pn': str(i * 50),
    }
    # Without a timeout a stalled connection would block the script forever.
    response = requests.get(base_url, headers=headers, params=params, timeout=10)
    # Stop on an HTTP error instead of saving an error page as if it were
    # a real listing page.
    response.raise_for_status()
    # Files are numbered from 1 although the loop index starts at 0.
    with open(dirname + '美女第%s页.html' % (i + 1), 'w', encoding='utf-8') as file:
        file.write(response.content.decode('utf-8'))