From 5534ae317f8336ad33b2fa7874ea234edfbcb304 Mon Sep 17 00:00:00 2001 From: Pradana AUMARS Date: Mon, 12 Jul 2021 22:20:00 +0200 Subject: [PATCH] Isolate subtitles as black over white background (kudos to u/Yun on hexbear.net) --- videocr/video.py | 1 + 1 file changed, 1 insertion(+) diff --git a/videocr/video.py b/videocr/video.py index 27ebdc3..22cb63c 100644 --- a/videocr/video.py +++ b/videocr/video.py @@ -56,6 +56,7 @@ class Video: if not self.use_fullframe: # only use bottom half of the frame by default img = img[self.height // 2:, :] + img = cv2.bitwise_not(cv2.bitwise_and(img, img, mask=cv2.inRange(img, (190, 190, 190), (255, 255, 255)))) config = '--tessdata-dir "{}"'.format(constants.TESSDATA_DIR) try: return pytesseract.image_to_data(img, lang=self.lang, config=config)