Python 之 Scrapy 爬取某集团招聘信息
1、创建工程：scrapy startproject gosuncn
2、创建爬虫：cd gosuncn，然后执行 scrapy genspider gaoxinxing gosuncn.zhiye.com
3、运行项目：scrapy crawl gaoxinxing
4、gaoxinxing.py代码：
# -*- coding: utf-8 -*- import scrapy import logging logger = logging.getLogger(__name__) #引入日志 class GaoxinxingSpider(scrapy.Spider): name = 'gaoxinxing' allowed_domains = ['gosuncn.zhiye.com'] start_urls = ['http://gosuncn.zhiye.com/Social'] next_page_num = 1 def parse(self, response): tr_list = response.xpath("//table[@class='jobsTable']/tr")[1:] #print(tr_list) for tr in tr_list: item = {} item["position"]=tr.xpath(".//td[1]/a/text()").extract_first()