From 496811786b4e7e4fc1ad2059515af7bf96dc0265 Mon Sep 17 00:00:00 2001 From: Zhiyuan Chen Date: Thu, 5 Nov 2020 23:18:44 +0800 Subject: [PATCH] catch DecompressionBomb (warning/exception): some websites return abnormal images, which may cause the death of the download thread --- icrawler/downloader.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/icrawler/downloader.py b/icrawler/downloader.py index b895910..9ed4508 100644 --- a/icrawler/downloader.py +++ b/icrawler/downloader.py @@ -243,7 +243,7 @@ def keep_file(self, task, response, min_size=None, max_size=None): """ try: img = Image.open(BytesIO(response.content)) - except (IOError, OSError): + except (IOError, OSError, Image.DecompressionBombWarning, Image.DecompressionBombError, UserWarning): return False task['img_size'] = img.size if min_size and not self._size_gt(img.size, min_size):