main.py
1.63 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
from pytesseract import image_to_string
import argparse
import cv2
from pathlib import Path
import os.path
import yaml
# Load the preprocessing presets once, at import time.
# ``safe_load`` replaces ``yaml.load(stream)``: calling ``yaml.load`` without
# an explicit Loader is rejected by PyYAML >= 6 and, on older versions, can
# construct arbitrary Python objects from the file. The ``with`` block makes
# sure the file handle is closed once parsing is finished.
with open('freset.yaml', 'r') as preset_file:
    doc = yaml.safe_load(preset_file)
# Bilateral-filter arguments; select_freset reads entries 0, 1 and 2.
bil_op = doc["bilateralFilterData"]
# Threshold settings; select_freset reads the 'threshVal' and 'threshMax' entries.
th_op = doc["thresholdData"]
def main():
    """Parse the command line, load the requested image and run OCR on it.

    Command-line arguments:
        img_file: File name of the image, resolved relative to ``~/Desktop``.
        --op: Integer preset number forwarded to ``select_freset``
            (defaults to 0).
        --engine: Accepted by the parser but not consulted in this function.

    Exits through ``parser.error`` (usage message, status 2) when the image
    cannot be read.
    """
    parser = argparse.ArgumentParser(description='OCR program')
    parser.add_argument('img_file', type=str, help="Input Image File Name")
    parser.add_argument('--op', type=int,
                        help="Input option number to 0 ~12", default=0)
    parser.add_argument('--engine', type=str,
                        help="Select engine to Google-Vision and Tessreact")
    args = parser.parse_args()

    direct = Path(os.path.expanduser('~'))
    file_path = direct / 'Desktop' / args.img_file
    img = cv2.imread(str(file_path))
    # cv2.imread reports a missing or undecodable file by returning None
    # rather than raising; stop here with a readable message instead of
    # letting the colour conversion in select_freset fail on a None input.
    if img is None:
        parser.error("could not read image: {}".format(file_path))
    select_freset(args.op, img)
def tesseract_orc_to_file(img):
    """Run Tesseract with the Korean model on ``img`` and save the text.

    The recognised text is printed to stdout and written, UTF-8 encoded, to
    ``foo.txt`` inside the ``result`` directory (relative to the current
    working directory). The directory is created when it does not exist.

    Args:
        img: Image handed unchanged to ``pytesseract.image_to_string``.
    """
    text = image_to_string(img, lang='kor')
    print(text)  # debug

    # Build the path with os.path.join so the separator is right on every
    # platform; a literal backslash only works as a separator on Windows.
    out_dir = 'result'
    os.makedirs(out_dir, exist_ok=True)
    out_file = os.path.join(out_dir, 'foo.txt')
    # Explicit UTF-8: the locale default encoding may be unable to represent
    # Korean text and would raise UnicodeEncodeError on write.
    with open(out_file, "w", encoding="utf-8") as f:
        f.write(text)
def select_freset(type, img):
    """Preprocess ``img`` according to preset ``type`` and pass it to OCR.

    * ``type`` below 7: the grayscale image is smoothed with a bilateral
      filter (arguments taken from ``bil_op``) and then thresholded.
    * ``type`` from 7 up to 12: the grayscale image is thresholded directly.
    * any other value: ``img`` is forwarded exactly as it was received.

    The threshold value is ``th_op['threshVal'][type % 3]``, the maximum is
    ``th_op['threshMax'][0]``, and odd presets use the inverted binary mode.

    Args:
        type: Integer preset number.
        img: Image converted with ``cv2.COLOR_BGR2GRAY`` before filtering.
    """
    grayscale = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

    if type < 13:
        if type < 7:
            # Only the lower presets smooth the image before thresholding.
            diameter = int(bil_op[0])
            sigma_color = int(bil_op[1])
            sigma_space = int(bil_op[2])
            grayscale = cv2.bilateralFilter(
                grayscale, diameter, sigma_color, sigma_space)

        level = int(th_op['threshVal'][type % 3])
        ceiling = int(th_op['threshMax'][0])
        if type % 2:
            mode = cv2.THRESH_BINARY_INV
        else:
            mode = cv2.THRESH_BINARY
        _, img = cv2.threshold(grayscale, level, ceiling, mode)

    tesseract_orc_to_file(img)
# Run the command-line entry point only when this file is executed as a
# script, not when it is imported as a module.
if __name__ == "__main__":
    main()