This example uses OpenCV to transform the image and Google's Tesseract to perform OCR (optical character recognition) on it.
import cv2
import pytesseract
from IPython.display import display
from PIL import Image
The image is then read into a NumPy array using OpenCV:
fname = 'age.png'
img = cv2.imread(fname)
img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)  # Converting BGR to RGB
display(Image.fromarray(img))
The goal is to find out what the villagers are doing, which is displayed in the bottom-right corner. To aid the OCR, the image needs to be cropped and pre-processed. This processing converts the image to greyscale and applies a blur and threshold to remove the background, significantly reducing the noise in the image and making OCR much easier.
crop = img[540:-135, 1260:]
gray = cv2.cvtColor(crop, cv2.COLOR_RGB2GRAY)  # the image is already RGB after the earlier conversion
blur = cv2.GaussianBlur(gray, (3, 3), 0)
thresh = cv2.threshold(blur, 0, 255, cv2.THRESH_BINARY_INV + cv2.THRESH_OTSU)[1]
display(Image.fromarray(thresh))
Finally, pytesseract, a Python wrapper for Tesseract, can be used to perform OCR on the image. The OCR has been successful with only one error, mistaking the 'r' for a 'c' in 'Miner'. On inspection of the cropped and processed image, the 'r' does look like a 'c' to the human eye. Optimising the greyscale, blur and threshold parameters may help to produce a cleaner image. Another option would be to crop the image to only the numbers.
data = pytesseract.image_to_string(thresh, lang='eng', config='--psm 6')
print(data)
Mince: 2
Lumberjack: 1
Hunter: 1
Forager: 1
Shepherds: 2
Sample usage:
types = ['Miner', 'Lumberjack', 'Hunter', 'Forager', 'Shepherds']
numbers = [int(x) for x in data if x.isdigit()]
counts = dict(zip(types, numbers))
print(counts)
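As suggested above, another option is to sidestep the misread letters entirely: since the villager types are already known, Tesseract can be restricted to digits with its tessedit_char_whitelist setting. A minimal sketch (the config string uses a standard Tesseract option; the variable names are illustrative):
# Only recognise digits; the labels are known in advance, so just the counts are needed
digit_config = '--psm 6 -c tessedit_char_whitelist=0123456789'
digits_only = pytesseract.image_to_string(thresh, lang='eng', config=digit_config)
print(digits_only)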
This process can be written into a handy function for future use, as sketched below. PyAutoGUI could be used to automatically take screenshots and feed them into the function.
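A minimal sketch of such a function, reusing the crop coordinates, pre-processing steps and villager types from above (the name count_villagers and the commented-out pyautogui call are illustrative, not part of the original notebook):
def count_villagers(img):
    """Return a dict mapping villager type to count from an RGB screenshot array."""
    crop = img[540:-135, 1260:]  # bottom-right corner of the screen
    gray = cv2.cvtColor(crop, cv2.COLOR_RGB2GRAY)
    blur = cv2.GaussianBlur(gray, (3, 3), 0)
    thresh = cv2.threshold(blur, 0, 255, cv2.THRESH_BINARY_INV + cv2.THRESH_OTSU)[1]
    text = pytesseract.image_to_string(thresh, lang='eng', config='--psm 6')
    types = ['Miner', 'Lumberjack', 'Hunter', 'Forager', 'Shepherds']
    numbers = [int(x) for x in text if x.isdigit()]
    return dict(zip(types, numbers))

# Example: feed in a live screenshot taken with pyautogui
# (assumes the game is running at the same resolution as the saved image)
# import numpy as np, pyautogui
# print(count_villagers(np.array(pyautogui.screenshot())))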
! jupyter nbconvert --to html ORC.ipynb
[NbConvertApp] Converting notebook ORC.ipynb to html
[NbConvertApp] Writing 3516469 bytes to ORC.html