chinaunicombidding_spider.py 文件源码-python代码片段

chinaunicombidding_spider.py 文件源码

python

阅读 21 收藏 0 点赞 0 评论 0

项目：scrapy_site 作者: hl10502 项目源码文件源码

def parse_(self, response):
        """Parse one listing page: yield its items, then maybe the next page.

        Every row of the ``bordercolor="lightgray"`` table except the last
        one becomes a ``SiteItem`` with ``title``, ``pubtime`` and, when the
        row carries an ``onclick`` handler, ``link``.  After the rows, a
        request for the following page is yielded only when the last item
        on this page was published today (per ``date.get_curdate()``).

        Missing cells no longer abort the callback: an absent title or
        publication time is stored as an empty string, an unparsable
        ``onclick`` value just leaves ``link`` unset, and a page with no
        data rows or no readable page number ends pagination quietly.

        Args:
            response: the Scrapy response for a listing page.

        Yields:
            ``SiteItem`` objects, optionally followed by one
            ``scrapy.FormRequest`` for the next page.
        """
        rows = response.xpath('//table[@bordercolor="lightgray"]/tr')
        # Stays None when the page has no data rows, so the pagination
        # check below cannot hit an unbound name.
        item = None
        # The final row is skipped, as before; presumably it is the pager
        # footer rather than a listing entry -- TODO confirm.
        for row in rows[:-1]:
            item = SiteItem()
            item['title'] = (
                row.xpath('td/span/@title').extract_first() or '').strip()
            onclick = row.xpath('td/span/@onclick').extract_first()
            if onclick:
                # Takes the first argument of the handler call and drops
                # its first and last character (assumed to be the quotes
                # around a site-relative path -- TODO confirm).
                try:
                    path = onclick.split(',')[0].split('(')[1][1:-1].strip()
                except IndexError:
                    # No "(" in the handler: nothing to build a link from.
                    path = None
                if path is not None:
                    item['link'] = 'http://www.chinaunicombidding.cn' + path
            item['pubtime'] = (
                row.xpath('td[@width="15%"]/text()').extract_first()
                or '').strip()
            yield item

        current_page = response.xpath(
            '//span[@id="nowPage"]/text()').extract_first()
        try:
            nowPage = str(int(current_page) + 1)
        except (TypeError, ValueError):
            # Page indicator missing or not a number: cannot paginate.
            return
        print ('nowpage======================================' + str(nowPage))

        # Keep paging only while the last item seen is dated today.
        if item is None or item['pubtime'] != date.get_curdate():
            return
        yield scrapy.FormRequest(
            "http://www.chinaunicombidding.cn/jsp/cnceb/web/info1/infoList.jsp?page=" + nowPage,
            formdata={
                "type": "",
                "province": "",
                "city": "",
                "notice": "",
                "time1": "",
                "time2": ""
            }, callback=self.parse_)