# Development of the OCR part of AOI
# Samo Penic
# 2018-11-16 e2fa6a35a6548a5acfd000af56ea333df8149b27
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
from Ocr import Paper
from sklearn.externals import joblib
 
from glob import glob
 
# Manual test driver for the Ocr.Paper class: runs the OCR on one sample scan
# and prints the result; optionally repeats that for every scan in
# processed_scans/.

# Configuration handed to every Paper instance. The keys are read outside this
# file, so they are kept exactly as written (including the "answer_treshold"
# spelling -- presumably that is the key Paper looks up; verify in Ocr before
# renaming it).
settings = {"sid_mask": "61xx0xxx", "answer_treshold": 0.25}

# Classifier object passed to Paper as ``sid_classifier``.
# NOTE(review): joblib.load unpickles the file, so only load model files that
# come from a trusted source.
classifier = joblib.load("filename.joblib")

# Set to True to also process every ``processed_scans/*.tif`` file after the
# single sample page below. The default (False) keeps the script's long-standing
# behaviour: print the OCR data of one page and exit with status 0.
# Previously the batch loop sat behind an unconditional ``exit(0)`` and could
# never run without editing the control flow.
PROCESS_ALL_SCANS = False

# Alternative sample pages used during development; swap one in as needed.
# p = Paper(filename="testpage300dpi_scan1.png")
# p = Paper(filename='sizif111.tif', sid_classifier=classifier, settings=settings)
# p = Paper(filename='processed_scans/20141016095134535_0006.tif', sid_classifier=classifier, settings=settings)
# p = Paper(filename='processed_scans/20151111080408825_0001.tif', sid_classifier=classifier, settings=settings)
p = Paper(
    filename="processed_scans/20151028145444607_0028.tif",
    sid_classifier=classifier,
    settings=settings,
)

# Debugging aids: uncomment to inspect intermediate results of the sample page.
# print(p.QRData)
# print(p.errors)

# print(p.getSkewAngle())
# print(p.locateUpMarkers())
# print(p.locateRightMarkers())
# print(p.answerMatrix)
# p.get_enhanced_sid()


print(p.get_paper_ocr_data())

if not PROCESS_ALL_SCANS:
    # Raise SystemExit directly instead of calling the site-provided ``exit``
    # helper, which is intended for the interactive shell and is absent when
    # the interpreter runs without the ``site`` module.
    raise SystemExit(0)

# Batch mode: print each scan's path followed by its OCR data.
for scan_path in glob("processed_scans/*.tif"):
    scan = Paper(filename=scan_path, sid_classifier=classifier, settings=settings)
    print(scan_path, scan.get_paper_ocr_data())