• https://fanyi.baidu.com/
    # ● 爬取要求:
    # ○ 1、输入要翻译的内容
    # ○ 2、通过post请求拿到json数据(可以用urllib模块,也可以用requests模块)
    # ○ 3、把翻译后的数据提取出来,直接打印到控制台就行
    #
    #
    # 作业二
    # ● 目标网站:https://haokan.baidu.com/
    # ● 爬取要求:
    # ○ 1、输入搜索内容
    # ○ 2、拿到对应内容的视频的名字和链接(不要求全部拿到)
    # ○ 3、把内容提取出来,直接打印到控制台即可">1. 作业1
    # ● 目标网站:https://fanyi.baidu.com/
    # ● 爬取要求:
    # ○ 1、输入要翻译的内容
    # ○ 2、通过post请求拿到json数据(可以用urllib模块,也可以用requests模块)
    # ○ 3、把翻译后的数据提取出来,直接打印到控制台就行
    #
    #
    # 作业二
    # ● 目标网站:https://haokan.baidu.com/
    # ● 爬取要求:
    # ○ 1、输入搜索内容
    # ○ 2、拿到对应内容的视频的名字和链接(不要求全部拿到)
    # ○ 3、把内容提取出来,直接打印到控制台即可
  • https://fanyi.baidu.com/v2transapi?from=zh&to=en
    # headers = {
    # ‘User-Agent’: ‘Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.82 Safari/537.36’
    # }
    # data = {
    # ‘from’: ‘zh’,
    # ‘to’: ‘en’,
    # ‘query’: ‘你好’,
    # ‘simple_means_flag’: ‘3’,
    # ‘sign’: ‘232427.85594’,
    # ‘token’: ‘5799cf84c7102344d4d4295fe404e58d’,
    # ‘domain’: ‘common’,
    #
    # }
    # response = requests.post(url, data=data, headers=headers)
    # res_json = response.text
    # print(res_json)
    # url = ‘https://fanyi.baidu.com/sug
    # headers = {
    # ‘User-Agent’: ‘Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.82 Safari/537.36’
    # }
    # data = {
    # ‘kw’: ‘你好吗’
    #
    # }
    # response = requests.post(url, data=data, headers=headers)
    # res_json = json.loads(response.text)
    # print(res_json)
    # print(res_json[‘data’][0][‘v’])">作业1(第一种完不成)
    # url = ‘https://fanyi.baidu.com/v2transapi?from=zh&to=en
    # headers = {
    # ‘User-Agent’: ‘Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.82 Safari/537.36’
    # }
    # data = {
    # ‘from’: ‘zh’,
    # ‘to’: ‘en’,
    # ‘query’: ‘你好’,
    # ‘simple_means_flag’: ‘3’,
    # ‘sign’: ‘232427.85594’,
    # ‘token’: ‘5799cf84c7102344d4d4295fe404e58d’,
    # ‘domain’: ‘common’,
    #
    # }
    # response = requests.post(url, data=data, headers=headers)
    # res_json = response.text
    # print(res_json)
    # url = ‘https://fanyi.baidu.com/sug
    # headers = {
    # ‘User-Agent’: ‘Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.82 Safari/537.36’
    # }
    # data = {
    # ‘kw’: ‘你好吗’
    #
    # }
    # response = requests.post(url, data=data, headers=headers)
    # res_json = json.loads(response.text)
    # print(res_json)
    # print(res_json[‘data’][0][‘v’])
  • https://haokan.baidu.com/web/search/api?pn=1&rn=10&type=video&query=python
    https://haokan.baidu.com/web/search/api?pn=3&rn=10&type=video&query=python
    https://haokan.baidu.com/web/search/api?pn=4&rn=10&type=video&query=python
    ‘’’
    url = ‘https://haokan.baidu.com/web/search/api?pn=1&rn=10&type=video&query=python
    headers = {
    ‘User-Agent’: ‘Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.82 Safari/537.36’
    }
    response = requests.get(url,headers=headers)
    res_text = json.loads(response.text)
    name_list = [data[‘title’]for data in res_text[‘data’][‘list’]]
    url_list = [data[‘url’]for data in res_text[‘data’][‘list’]]
    # print(name_list,url_list)
    for data in zip(name_list,url_list):
    print(data)">作业2
    ‘’’
    https://haokan.baidu.com/web/search/api?pn=1&rn=10&type=video&query=python
    https://haokan.baidu.com/web/search/api?pn=3&rn=10&type=video&query=python
    https://haokan.baidu.com/web/search/api?pn=4&rn=10&type=video&query=python
    ‘’’
    url = ‘https://haokan.baidu.com/web/search/api?pn=1&rn=10&type=video&query=python
    headers = {
    ‘User-Agent’: ‘Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.82 Safari/537.36’
    }
    response = requests.get(url,headers=headers)
    res_text = json.loads(response.text)
    name_list = [data[‘title’]for data in res_text[‘data’][‘list’]]
    url_list = [data[‘url’]for data in res_text[‘data’][‘list’]]
    # print(name_list,url_list)
    for data in zip(name_list,url_list):
    print(data)

    import requests
    import json

    1. 作业1
    # ● 目标网站:https://fanyi.baidu.com/
    # ● 爬取要求:
    # ○ 1、输入要翻译的内容
    # ○ 2、通过post请求拿到json数据(可以用urllib模块,也可以用requests模块)
    # ○ 3、把翻译后的数据提取出来,直接打印到控制台就行
    #
    #
    # 作业二
    # ● 目标网站:https://haokan.baidu.com/
    # ● 爬取要求:
    # ○ 1、输入搜索内容
    # ○ 2、拿到对应内容的视频的名字和链接(不要求全部拿到)
    # ○ 3、把内容提取出来,直接打印到控制台即可

    作业1(第一种完不成)
    # url = 'https://fanyi.baidu.com/v2transapi?from=zh&to=en'
    # headers = {
    #     'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.82 Safari/537.36'
    # }
    # data = {
    #     'from': 'zh',
    #     'to': 'en',
    #     'query': '你好',
    #     'simple_means_flag': '3',
    #     'sign': '232427.85594',
    #     'token': '5799cf84c7102344d4d4295fe404e58d',
    #     'domain': 'common',
    #
    # }
    # response = requests.post(url, data=data, headers=headers)
    # res_json = response.text
    # print(res_json)
    # url = 'https://fanyi.baidu.com/sug'
    # headers = {
    #     'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.82 Safari/537.36'
    # }
    # data = {
    #     'kw': '你好吗'
    #
    # }
    # response = requests.post(url, data=data, headers=headers)
    # res_json = json.loads(response.text)
    # print(res_json)
    # print(res_json['data'][0]['v'])

    作业2
    # Homework 2: query the haokan.baidu.com search API and print each
    # video's title together with its link.
    #
    # Example request URLs (they differ only in the `pn` query parameter):
    #   https://haokan.baidu.com/web/search/api?pn=1&rn=10&type=video&query=python
    #   https://haokan.baidu.com/web/search/api?pn=3&rn=10&type=video&query=python
    #   https://haokan.baidu.com/web/search/api?pn=4&rn=10&type=video&query=python
    url = 'https://haokan.baidu.com/web/search/api?pn=1&rn=10&type=video&query=python'
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.82 Safari/537.36'
    }
    response = requests.get(url, headers=headers)
    # The response body is parsed as JSON; the entries are read from
    # res_text['data']['list'], each providing a 'title' and a 'url' key.
    res_text = json.loads(response.text)
    name_list = [data['title'] for data in res_text['data']['list']]
    url_list = [data['url'] for data in res_text['data']['list']]
    # print(name_list,url_list)
    # Pair each title with its link and print one (title, url) tuple per line.
    for data in zip(name_list, url_list):
        print(data)