AJK.py 文件源码-python代码片段

AJK.py 文件源码
python
阅读 28 收藏 0 点赞 0 评论 0
def parse_item(self, response):
        """Parse a listing page and follow each listing's detail link.

        Every element with class ``item-mod`` whose markup contains
        ``data-link`` is treated as a listing.  Its title, detail URL and
        price are stored on a fresh ``AjkItem`` and printed to stdout together
        with the address text, then a request for the detail page is yielded
        with ``self.parse_item2`` as its callback.

        Listings without an ``<h3><a href=...>`` link are skipped, and fields
        whose markup is missing are recorded as ``None``, so a single
        malformed listing does not abort the rest of the page.

        Args:
            response: Response whose ``body`` holds the listing page HTML.

        Yields:
            scrapy.Request: One request per listing that has a detail URL.
        """

        def span_text(node):
            """Return the text of ``node``'s first <span>, or None if absent."""
            span = node.span if node is not None else None
            return span.string if span is not None else None

        soup = BeautifulSoup(response.body, 'html.parser')
        for listing in soup.find_all(attrs={'class': 'item-mod'}):
            # Only process blocks whose markup contains 'data-link'.
            if 'data-link' not in str(listing):
                continue

            heading = listing.h3
            link = heading.a if heading is not None else None
            detail_url = link.get('href') if link is not None else None
            if not detail_url:
                # Without a detail URL there is nothing to follow.
                continue

            title = link.string

            address_node = listing.find(attrs={'class': 'address'})
            address_link = address_node.a if address_node is not None else None
            address = address_link.string if address_link is not None else None

            price_node = listing.find(attrs={'class': 'price'})
            if price_node is not None:
                price = span_text(price_node)
            else:
                # Fall back to the approximate price and tag it with the
                # 'around' suffix so it can be told apart from an exact price.
                approx = span_text(
                    listing.find(attrs={'class': 'favor-tag around-price'})
                )
                price = approx + 'around' if approx is not None else None

            # NOTE(review): the item is populated but never yielded or attached
            # to the request below -- confirm whether parse_item2 is expected
            # to receive it (e.g. via the request's meta) or rebuilds it.
            item = AjkItem()
            item['title'] = title
            print(title)
            item['detailUrl'] = detail_url
            print(detail_url)
            print(address)
            item['price'] = price
            print(price)
            # Telephone extraction (class 'tel') is currently disabled.

            yield scrapy.Request(url=detail_url, callback=self.parse_item2)