本文整理汇总了Python中scrapy.http.request.Request.meta['url']的典型用法代码示例。如果您正苦于以下问题：Python Request.meta['url']的具体用法？Python Request.meta['url']怎么用？Python Request.meta['url']使用的例子？那么恭喜您，这里精选的代码示例或许可以为您提供帮助。请注意，meta是Request实例上的字典属性，'url'只是其中一个自定义键，并不是方法。您也可以进一步了解其所在类scrapy.http.request.Request的用法示例。
在下文中一共展示了Request.meta['url']方法的2个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Python代码示例。
示例1: parse
# 需要导入模块: from scrapy.http.request import Request [as 别名]
# 说明: meta 是 Request 实例上的字典属性, 不能单独导入; 创建请求后通过 request.meta['url'] 读写
def parse(self, response):
    """Yield one follow-up request for every article listed on the page.

    Each ``div`` with class ``ARTICLE`` is expected to contain an
    ``a.ArticleTitle`` link. For every such link a ``Request`` to the
    article page is yielded, with the title and the full URL stored in
    ``request.meta`` so that ``self.parse_full_post`` can read them.

    Args:
        response: The listing-page response passed in by Scrapy.

    Yields:
        Request: One request per article, with ``meta['title']`` and
        ``meta['url']`` populated.
    """
    # The hrefs are prefixed with the site root below, so they are
    # presumably site-relative paths -- verify against the live markup.
    base_url = "http://www.thesaigontimes.vn"
    posts = Selector(response).xpath('//div[@class="ARTICLE"]')
    for post in posts:
        titles = post.xpath('a[@class="ArticleTitle"]/text()').extract()
        hrefs = post.xpath('a[@class="ArticleTitle"]/@href').extract()
        # Skip blocks that lack a title link instead of indexing an empty
        # list: an IndexError here would abort the generator and drop
        # every remaining article on the page.
        if not titles or not hrefs:
            continue
        itemFullURL = base_url + hrefs[0]
        request = Request(itemFullURL, callback=self.parse_full_post)
        request.meta['title'] = titles[0]
        request.meta['url'] = itemFullURL
        yield request
示例2: parse
# 需要导入模块: from scrapy.http.request import Request [as 别名]
# 说明: meta 是 Request 实例上的字典属性, 不能单独导入; 创建请求后通过 request.meta['url'] 读写
def parse(self, response):
    """Follow pagination and yield one request per post on the page.

    Increments ``self.counter`` on every call. While a "next page" link
    is present and the counter is below ``self.max_page``, a request for
    the next listing page is yielded with this method as its callback.
    Then, for every post anchor on the page, a request for the post is
    yielded with the title and full URL stored in ``request.meta`` for
    ``self.parse_full_post``.

    Args:
        response: The listing-page response passed in by Scrapy.

    Yields:
        Request: Optionally the next listing page, followed by one
        request per post with ``meta['title']`` and ``meta['url']`` set.
    """
    self.counter += 1
    base_url = "http://m.vnexpress.net"
    hxs = HtmlXPathSelector(response)
    next_page = hxs.select("//a[@class='right txt_1_1em']/@href").extract()
    # Keep paginating only while a next link exists and the page budget
    # has not been used up.
    if next_page and self.counter < self.max_page:
        yield Request(base_url + next_page[0], self.parse)
    posts = hxs.select("//a[@class='block_image_relative ui-link']")
    for post in posts:
        hrefs = post.select('.//@href').extract()
        # Skip anchors without any href instead of indexing an empty
        # list: an IndexError here would abort the generator and drop
        # every remaining post on the page.
        if not hrefs:
            continue
        itemFullURL = base_url + hrefs[0]
        request = Request(itemFullURL, callback=self.parse_full_post)
        # NOTE: the title is stored as the list returned by extract()
        # (possibly empty), not as a single string.
        request.meta['title'] = post.select('.//h2[@class="h2SdTopHome txt_1_5em"][1]/text()').extract()
        request.meta['url'] = itemFullURL
        yield request