-
Notifications
You must be signed in to change notification settings - Fork 0
/
eval.py
54 lines (49 loc) · 1.94 KB
/
eval.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
def replace(str):
str = str[:-7].strip()
return str.replace('목판본_001_문학류_춘향전', '목판본_001_문학류_춘향전')
def pred_file_preprocessing(dataset):
with open(f'log_eval_result_{dataset}.txt', 'r', encoding='utf-8') as f:
file = f.readlines()
file = [line for line in file if 'test' in line]
file = list(map(replace, file))
return file
def test_file():
with open('gt_train.txt', 'r', encoding='utf-8') as f:
file = f.readlines()
with open('gt_test.txt', 'w', encoding='utf-8') as f:
for line in file:
if '목판본_001_문학류_춘향전' in line:
f.write(line)
def eval_log(dataset='origin'):
'''
label: train/목판본_001_문학류_춘향전_01_011_73.png 류
pred: /content/gdrive/MyDrive/old_korean_ocr/test/목판본_001_문학류_춘향전_01_011_73.png 류 0.3353
'''
with open('gt_test.txt', 'r', encoding='utf-8') as f:
label_file = f.readlines()
pred_file = pred_file_preprocessing(dataset)
label_dict = dict()
pred_dict = dict()
imgs = set()
for label_line, pred_line in zip(label_file, pred_file):
file, label = label_line.split('\t')
idx = file.find('목')
label_dict[file[idx:]] = label.strip()
imgs.add(file[idx:])
try:
file, pred = pred_line.strip().split('\t')
except:
file = pred_line.strip()
pred = ' '
idx = file.find('목')
pred_dict[file[idx:]] = pred
correct = 0
for file in list(imgs):
try:
if pred_dict[file] == label_dict[file]:
correct += 1
except:
continue
print(f'Test accuracy: {correct / len(imgs):0.4f}')
if __name__ == '__main__':
eval_log()