Germey 3 gadi atpakaļ
vecāks
revīzija
0ebac358a2
1 mainīts fails ar 3 papildinājumiem un 1 dzēšanu
  1. 3 1
      proxypool/crawlers/base.py

+ 3 - 1
proxypool/crawlers/base.py

@@ -20,7 +20,7 @@ class BaseCrawler(object):
             if response.status_code == 200:
             if response.status_code == 200:
                 response.encoding = 'utf-8'
                 response.encoding = 'utf-8'
                 return response.text
                 return response.text
-        except requests.ConnectionError:
+        except (requests.ConnectionError, requests.ReadTimeout):
             return
             return
 
 
     def process(self, html, url):
     def process(self, html, url):
@@ -39,6 +39,8 @@ class BaseCrawler(object):
             for url in self.urls:
             for url in self.urls:
                 logger.info(f'fetching {url}')
                 logger.info(f'fetching {url}')
                 html = self.fetch(url)
                 html = self.fetch(url)
+                if not html:
+                    continue
                 time.sleep(.5)
                 time.sleep(.5)
                 yield from self.process(html, url)
                 yield from self.process(html, url)
         except RetryError:
         except RetryError: