本文整理汇总了Python中models.Product.update_history['combine_url']方法的典型用法代码示例。如果您正苦于以下问题:Python Product.update_history['combine_url']方法的具体用法?Python Product.update_history['combine_url']怎么用?Python Product.update_history['combine_url']使用的例子?那么恭喜您, 这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在类models.Product
的用法示例。
在下文中一共展示了Product.update_history['combine_url']方法的1个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Python代码示例。
示例1: crawl_listing
# 需要导入模块: from models import Product [as 别名]
# 或者: from models.Product import update_history['combine_url'] [as 别名]
def crawl_listing(self, url, ctx='', **kwargs):
res = requests.get(url, params={'Ns': 'P_sale_flag|1'})
res.raise_for_status()
tree = lxml.html.fromstring(res.content)
category = Category.objects(key=kwargs.get('key')).first()
if not category:
print 'Category does not exist'
common_failed.send(sender=ctx, url=url, reason='Category does not exist -> {0} .'.format(kwargs))
return
product_nodes = tree.cssselect('div#product-container div');
no_discount_num = 0 # sometimes no discount product occurs between the discount ones ordered by sale.
for product_node in product_nodes:
if not product_node.get('id') or 'product' not in product_node.get('id').lower():
continue
key = product_node.get('id')
info_node = product_node.cssselect('div.product-text a')[0]
price = None; listprice = None
listprice_node = info_node.cssselect('span.product-price')
price_node = info_node.cssselect('span.product-sale-price')
if listprice_node:
listprice = ''.join(listprice_node[0].xpath('.//text()')).strip()
if price_node:
price = ''.join(price_node[0].xpath('.//text()')).strip()
if price is None or listprice is None:
no_discount_num += 1
if no_discount_num < 3:
continue
return
no_discount_num = 0
brand = info_node.cssselect('p span.product-designer-name')[0].text
if brand:
brand = brand.strip()
title = info_node.cssselect('p.product-description')[0].text.strip()
combine_url = info_node.get('href')
is_new = False; is_updated = False
product = Product.objects(key=key).first()
if not product:
is_new = True
product = Product(key=key)
product.updated = False
product.event_type = False
if title and title != product.title:
product.title = title
is_updated = True
product.update_history['title'] = datetime.utcnow()
if brand and brand != product.brand:
product.brand = brand
is_updated = True
if combine_url and combine_url != product.combine_url:
product.combine_url = combine_url
is_updated = True
product.update_history['combine_url'] = datetime.utcnow()
if price and price != product.price:
product.price = price
is_updated = True
if listprice and listprice != product.listprice:
product.listprice = listprice
is_updated = True
if category.cats and set(category.cats).difference(product.dept):
product.dept = list(set(category.cats) | set(product.dept or []))
is_updated = True
if category.key not in product.category_key:
product.category_key.append(category.key)
is_updated = True
if is_updated:
product.list_update_time = datetime.utcnow()
# To pick the product which fit our needs, such as a certain discount, brand, dept etc.
selected = Picker(site='saksfifthavenue').pick(product)
if not selected:
continue
product.hit_time = datetime.utcnow()
product.save()
# print product.brand; print product.title; print product.combine_url; print product.listprice, ' / ', product.price; print is_new; print is_updated
# print
common_saved.send(sender=ctx, obj_type='Product', key=product.key, url=product.combine_url, \
is_new=is_new, is_updated=((not is_new) and is_updated) )
# Go to the next page to keep on crawling.
next_page = None
page_nodes = tree.cssselect('div.pagination-container ol.pa-page-number li a')
for page_node in page_nodes:
#.........这里部分代码省略.........