/ Published in: Python
data:image/s3,"s3://crabby-images/90b0e/90b0e6a2677ca35d5348c94828b6331437fd25ab" alt=""
Expand |
Embed | Plain Text
Copy this code and paste it in your HTML
# This snippet was taken from the old wiki.
#
# You can do this by overriding the Scrapy HTTP Client Factory, with the
# following (undocumented) settings in the project's settings module:
#
#   DOWNLOADER_HTTPCLIENTFACTORY = 'myproject.downloader.LimitSizeHTTPClientFactory'
#   MAX_RESPONSE_SIZE = 1048576  # 1Mb

from scrapy.core.downloader.webclient import ScrapyHTTPClientFactory, ScrapyHTTPPageGetter
from scrapy.utils.project import get_project_settings

# Largest declared Content-Length (in bytes) that is still accepted.
# Loaded from the project settings because the limit is configured there and
# would otherwise be an undefined name in this module; falls back to the
# 1Mb value shown in the example above when the setting is absent.
MAX_RESPONSE_SIZE = get_project_settings().getint('MAX_RESPONSE_SIZE', 1048576)

# The header name is matched as text and as bytes so the check works
# whichever of the two the HTTP client passes to handleHeader().
_CONTENT_LENGTH_NAMES = ('content-length', b'content-length')


class LimitSizePageGetter(ScrapyHTTPPageGetter):
    """Page getter that gives up on responses declaring an oversized body.

    Only the ``Content-Length`` response header is inspected, so a response
    that does not send that header is not limited by this class.
    """

    def handleHeader(self, key, value):
        """Record the header, then abort if it declares too large a body.

        :param key: header name as received from the HTTP client.
        :param value: raw header value as received from the HTTP client.
        """
        ScrapyHTTPPageGetter.handleHeader(self, key, value)

        if key.lower() not in _CONTENT_LENGTH_NAMES:
            return

        try:
            declared_size = int(value)
        except (TypeError, ValueError):
            # A malformed Content-Length says nothing about the real size;
            # ignore it rather than crash the protocol with an exception.
            return

        if declared_size > MAX_RESPONSE_SIZE:
            # NOTE(review): this invokes the connection-lost handler directly
            # with a plain string as the reason; it presumably does not close
            # the underlying transport by itself -- confirm whether
            # self.transport.loseConnection() is also needed.
            self.connectionLost('oversized')


class LimitSizeHTTPClientFactory(ScrapyHTTPClientFactory):
    """HTTP client factory whose connections use LimitSizePageGetter."""

    protocol = LimitSizePageGetter


# Snippet imported from snippets.scrapy.org (which no longer works)
# author: pablo
# date  : Sep 16, 2011
Comments
RSS Feed for Comments