Tesseract errors take many forms - just capture them all in one go

This commit is contained in:
rimu 2024-04-20 20:17:58 +12:00
parent e261c3b9c0
commit 35efd7725c

View file

@ -867,9 +867,7 @@ def make_image_sizes_async(file_id, thumbnail_width, medium_width, directory):
if img_width < 2000: # images > 2000px tend to be real photos instead of 4chan screenshots.
try:
image_text = pytesseract.image_to_string(Image.open(BytesIO(source_image)).convert('L'), timeout=30)
except FileNotFoundError as e:
image_text = ''
except TimeoutError as e:
except Exception as e:
image_text = ''
if 'Anonymous' in image_text and ('No.' in image_text or ' N0' in image_text): # chan posts usually contain the text 'Anonymous' and ' No.12345'
post = Post.query.filter_by(image_id=file.id).first()