Changeset 1849:1d0ac164cf62 for scrapy/contrib/itemsampler.py
- Timestamp: 11/14/09 20:28:59 (10 months ago)
- Branch: default
- Files: 1 modified
scrapy/contrib/itemsampler.py (modified) (4 diffs)
Legend:
- Unmodified
- Added
- Removed
-
scrapy/contrib/itemsampler.py
r1828 r1849
   54    54
   55    55   def process_item(self, spider, item):
   56       - sampled = stats.get_value("items_sampled", 0, domain=spider.domain_name)
         56 + sampled = stats.get_value("items_sampled", 0, spider=spider)
   57    57   if sampled < items_per_spider:
   58    58   self.items[item.guid] = item
   59    59   sampled += 1
   60       - stats.set_value("items_sampled", sampled, domain=spider.domain_name)
         60 + stats.set_value("items_sampled", sampled, spider=spider)
   61    61   log.msg("Sampled %s" % item, spider=spider, level=log.INFO)
   62    62   if close_spider and sampled == items_per_spider:
    …     …
   72    72
   73    73   def spider_closed(self, spider, reason):
   74       - if reason == 'finished' and not stats.get_value("items_sampled", domain=spider.domain_name):
         74 + if reason == 'finished' and not stats.get_value("items_sampled", spider=spider):
   75    75   self.empty_domains.add(spider.domain_name)
   76    76   self.spiders_count += 1
    …     …
   88    88
   89    89   def process_spider_input(self, response, spider):
   90       - if stats.get_value("items_sampled", domain=spider.domain_name) >= items_per_spider:
         90 + if stats.get_value("items_sampled", spider=spider) >= items_per_spider:
   91    91   return []
   92    92   elif max_response_size and max_response_size > len(response_httprepr(response)):
    …     …
  101   101   items.append(r)
  102   102
  103       - if stats.get_value("items_sampled", domain=spider.domain_name) >= items_per_spider:
        103 + if stats.get_value("items_sampled", spider=spider) >= items_per_spider:
  104   104   return []
  105   105   else:
