项目目录:
    image.png

    1. 第一步:创建项目
    2. scrapy startproject pearVideo
    3. 第二步:进入项目目录并生成爬虫文件
    4. cd pearVideo
    5. scrapy genspider pearVideos "www.pearvideo.com/category_6"
    1. pearVideos.py文件
    import scrapy

    from pearVideo.items import PearvideoItem


    class PearvideosSpider(scrapy.Spider):
        """Spider that scrapes the video list on the pearvideo.com category_6 page."""

        name = 'pearVideos'
        allowed_domains = ['www.pearvideo.com']
        start_urls = ['https://www.pearvideo.com/category_6']

        def parse(self, response):
            """Yield one ``PearvideoItem`` per ``<li>`` of the video list.

            Each field is filled with the first matching text node, or ``None``
            when the XPath matches nothing (the behavior of ``.get()``).
            """
            # Every <li> under the list container is one video entry.
            for li in response.xpath('//ul[@id="listvideoListUl"]/li'):
                item = PearvideoItem()
                item['title'] = li.xpath(
                    './div/a//div[@class="vervideo-title"]/text()'
                ).get()
                item['author'] = li.xpath('.//a[@class="column"]/text()').get()
                # Text of the "fav" span; presumably the like/favorite count.
                item['nums'] = li.xpath('.//span[@class="fav"]/text()').get()
                # No explicit print: Scrapy already logs each scraped item at
                # DEBUG level.
                yield item
    17. items.py文件
    import scrapy


    class PearvideoItem(scrapy.Item):
        """Container for one video entry scraped by the pearVideos spider."""

        # Video title text.
        title = scrapy.Field()
        # Text of the author/column link.
        author = scrapy.Field()
        # Text of the "fav" span (presumably the like/favorite count).
        nums = scrapy.Field()
    22. run.py 运行项目文件
    from scrapy import cmdline

    if __name__ == '__main__':
        # Run the project; equivalent to typing `scrapy crawl pearVideos` in
        # the project directory. To export the scraped items to a CSV file,
        # append '-o' and 'pearvideo.csv' to the argument list.
        cmdline.execute(['scrapy', 'crawl', 'pearVideos'])