diff --git a/.DS_Store b/.DS_Store
new file mode 100644
index 0000000..d9a693e
Binary files /dev/null and b/.DS_Store differ
diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..4de579b
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,3 @@
+images*
+test.py
+1.jpg
diff --git a/main.py b/main.py
new file mode 100644
index 0000000..046a304
--- /dev/null
+++ b/main.py
@@ -0,0 +1,66 @@
+"""Rename the images in ``directory`` after the number OCR'd from each one."""
+import os
+
+import cv2
+import pytesseract
+
+directory = 'images'
+
+# Pixel windows of the two bottom locations that are read: one shared row
+# range and one column range per location.
+ROI_ROWS = slice(1383, 1447)
+ROI_COLS = (slice(77, 154), slice(950, 1027))
+
+# Treat the crop as a single text line and only allow digits.
+OCR_CONFIG = '--psm 7 -c tessedit_char_whitelist=0123456789'
+DIGITS = '0123456789'
+
+
+def read_number(path):
+    """Return the digits Tesseract reads from the two bottom locations.
+
+    Returns an empty string when ``path`` cannot be decoded as an image,
+    when the image does not reach either location, or when no digit is
+    recognised.
+    """
+    image = cv2.imread(path, 0)
+    if image is None:
+        # cv2.imread signals an unreadable file by returning None.
+        return ''
+    thresh = 255 - cv2.threshold(
+        image, 0, 255, cv2.THRESH_BINARY_INV + cv2.THRESH_OTSU)[1]
+    rois = [thresh[ROI_ROWS, cols] for cols in ROI_COLS]
+    if any(roi.size == 0 for roi in rois):
+        return ''
+    data = pytesseract.image_to_string(
+        cv2.hconcat(rois), lang='eng', config=OCR_CONFIG)
+    # The raw OCR text can carry trailing whitespace/control characters that
+    # must not end up in a file name; keep the digits only.
+    return ''.join(ch for ch in data if ch in DIGITS)
+
+
+def main():
+    """OCR each file in ``directory`` and rename it to ``<digits>.jpg``."""
+    # iterate over files in that directory
+    for filename in os.listdir(directory):
+        f = os.path.join(directory, filename)
+        # checking if it is a file
+        if not os.path.isfile(f):
+            continue
+        data = read_number(f)
+        print(data)
+        if not data:
+            # Nothing usable was read; leave the file untouched.
+            continue
+        target = os.path.join(directory, f'{data}.jpg')
+        if target == f:
+            continue
+        if os.path.exists(target):
+            # os.rename may silently replace an existing file.
+            print(f'skipped {f}: {target} already exists')
+            continue
+        os.rename(f, target)
+
+
+if __name__ == '__main__':
+    main()