trec-coding/extract.py at main · csdevignes/trec-coding · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
'''
Contains methods for detecting box coordinates on the scanned result sheets (Boxdetection)
and for extracting and plotting the regions of interest (ROI) taken from the sheet (ROIExtract)
'''

import cv2 as cv
import numpy as np
import pandas as pd
import streamlit as st

class Boxdetection:
    '''
    Loads a scanned result sheet and locates the boxes drawn on it.
    Offers grid display on the scan, image rotation, box detection (binary
    threshold + contours), box alignment/sorting and display of the boxes
    on the scanned image.
    The detection code expects EXPECTED_BOXES boxes arranged in lines of
    BOXES_PER_LINE boxes.
    '''

    # Number of boxes a sheet must yield for a detection to be accepted
    EXPECTED_BOXES = 400
    # Number of boxes averaged together when aligning a line of boxes
    BOXES_PER_LINE = 20

    def __init__(self, image_file = None, image_path = None):
        '''
        When using with streamlit file uploader, use cv.imdecode with image_file binary
        When using with local file, use cv.imread together with image path
        If neither argument is given, no image is loaded and self.img is not set.
        :param image_file: encoded image buffer, decoded with cv.imdecode (takes
        precedence over image_path)
        :param image_path: directory path to image file, read with cv.imread
        '''
        if image_file is not None:
            self.img = cv.imdecode(image_file, cv.IMREAD_COLOR)
        elif image_path is not None:
            self.img = cv.imread(image_path)

    @st.cache_data
    def plot_scan(_self, image, grid = (5, 4)):
        '''
        Draw horizontal and vertical lines on a copy of the image, then returns it
        :param image: 3-dimensional image array to plot on (left unmodified)
        :param grid: number of (rows, cols) in the grid. Pass None to remove the grid
        :return: image copy with lines plotted on
        '''
        h, w, _ = image.shape
        img_lines = image.copy()
        if grid is None:
            return img_lines
        rows, cols = grid
        dy, dx = h / rows, w / cols
        # Only the inner separators are drawn: cols - 1 vertical, rows - 1 horizontal
        for x in np.linspace(start=dx, stop=w - dx, num=cols - 1):
            x = int(round(x))
            cv.line(img_lines, (x, 0), (x, h), color=(0, 255, 0), thickness=3)
        for y in np.linspace(start=dy, stop=h - dy, num=rows - 1):
            y = int(round(y))
            cv.line(img_lines, (0, y), (w, y), color=(255, 0, 0), thickness=3)
        return img_lines

    def image_rotation(self, degree):
        '''
        Rotates the loaded image of a certain degree counterclockwise around its
        center, keeping the original size. Stores the result in self.img_rot and
        its grayscale version in self.gray.
        :param degree: float
        '''
        rows, cols, _ = self.img.shape
        center = ((cols - 1) / 2.0, (rows - 1) / 2.0)
        M = cv.getRotationMatrix2D(center, degree, 1)
        # warpAffine returns a new array, self.img itself is not modified
        self.img_rot = cv.warpAffine(self.img, M, (cols, rows))
        self.gray = cv.cvtColor(self.img_rot, cv.COLOR_BGR2GRAY)

    def find_boxes(self, lower_threshold):
        '''
        Run OpenCV findcontour with a given threshold for binary image, then loops
        into the contours to keep only the ones corresponding to the right size
        and aspect ratio for the boxes. Requires image_rotation() to have been
        called first (reads self.gray).
        Stores the result in self.box_coord as an integer array of shape (N, 4)
        holding (x, y, w, h) rows; the shape is (0, 4) when nothing matches.
        :param lower_threshold: int between 0 and 255
        '''
        _, thresh = cv.threshold(self.gray, lower_threshold, 250, cv.THRESH_BINARY_INV)
        contours, _ = cv.findContours(thresh, cv.RETR_LIST, cv.CHAIN_APPROX_SIMPLE)
        boxes = []
        for contour in contours:
            x, y, w, h = cv.boundingRect(contour)
            # Keep contours 90 to 99 pixels wide that are not much wider than tall
            if 90 <= w < 100 and w / h <= 1.15:
                boxes.append((x, y, w, h))
        # reshape keeps a 2-D (0, 4) array even when no box was found
        self.box_coord = np.array(boxes, dtype=int).reshape(-1, 4)

    def align_boxes(self):
        '''
        Align boxes horizontally and vertically by replacing the given coordinates
        with the average of the line (of BOXES_PER_LINE boxes).
        Then sort the boxes left -> right and top -> bottom
        Lines are formed by rank after sorting, so the result is only meaningful
        when every line of the sheet was completely detected.
        '''
        per_line = self.BOXES_PER_LINE
        boxes = pd.DataFrame(self.box_coord, columns=['x', 'y', 'w', 'h'])
        # 'y' first (horizontal alignment), then 'x' (vertical alignment)
        for axis in ('y', 'x'):
            boxes = boxes.sort_values(by=axis, ignore_index=True)
            for first in range(0, len(boxes), per_line):
                last = first + per_line - 1  # .loc label slices include the end
                boxes.loc[first:last, axis] = round(boxes.loc[first:last, axis].mean(), 0)
        # Final reordering
        boxes = boxes.sort_values(by=['y', 'x'], ignore_index=True)
        self.box_coord = boxes.to_numpy()

    def _extract_boxes(self, thresholds):
        '''
        Try each threshold in turn until find_boxes() yields exactly
        EXPECTED_BOXES boxes, then reverse the box list and align it.
        :param thresholds: iterable of int thresholds between 0 and 255
        :raises ValueError: if no threshold gives exactly EXPECTED_BOXES boxes
        '''
        for lower_threshold in thresholds:
            self.find_boxes(lower_threshold)
            if len(self.box_coord) == self.EXPECTED_BOXES:
                break
        else:
            raise ValueError(
                f'Could not detect exactly {self.EXPECTED_BOXES} boxes '
                'with any of the tested thresholds'
            )
        self.box_coord = np.flip(self.box_coord, axis=0)
        self.align_boxes()

    def extract_boxes_fast(self):
        '''
        Iteration among thresholds for binary image (155 down to 0, by steps of 5), to find the one that will allow
        for the detection of all the boxes (400). Then reorder the box list top to bottom, and perform box alignment.
        Worked for all images so far.
        :raises ValueError: if no tested threshold detects all the boxes
        '''
        self._extract_boxes(range(155, -1, -5))

    def extract_boxes_ext(self):
        '''
        Iteration among all possible thresholds for binary image (254 down to 0), to find the one that will allow for
        the detection of all the boxes (400). Then reorder the box list top to bottom, and perform box alignment.
        May be used if extract_boxes_fast() fails to detect all (400) the boxes.
        :raises ValueError: if no tested threshold detects all the boxes
        '''
        self._extract_boxes(range(254, -1, -1))

    @st.cache_data
    def plot_boxes(_self, coord):
        '''
        Display detected boxes on a copy of the rotated image (self.img_rot)
        :param coord: array of box coordinates, shape (N, 4), or a single (x, y, w, h) box
        :return: img_box picture of image with coordinates plotted on
        '''
        # NOTE(review): the leading underscore keeps streamlit from hashing the
        # instance, so the cache key is `coord` only - confirm a stale picture
        # cannot be served when another scan yields the same coordinates.
        img_box = _self.img_rot.copy()
        # atleast_2d lets a single box be handled like a list of one box
        for x, y, w, h in np.atleast_2d(coord):
            cv.rectangle(img_box, (x, y), (x + w, y + h), (0, 255, 0), 2)
        return img_box

class ROIExtract:
    '''
    Defines parameters and methods needed for image (ROI) extraction from given box coordinates
    Also includes symbols/numbers indexes.
    '''

    def __init__(self, image_rot):
        '''
        Loads image, defines indexes for symbols and numbers. Defines box width and height
        :param image_rot: image, either 3-channel BGR or already grayscale (2-D array)
        '''
        self.img = image_rot
        # The 400 box indexes seen as 20 lines of 20: lines 1, 3, ..., 19 are the
        # symbol indexes (20-39, 60-79, ...), lines 0, 2, ..., 18 the number indexes.
        self.all_index = np.arange(0, 400, 1)
        lines = self.all_index.reshape(20, 20)
        self.symbols_index = lines[1::2].ravel()
        self.number_index = lines[0::2].ravel()
        # Fixed extent used for every ROI, whatever the detected box size
        self.width = 87
        self.height = 80

    def _gray_image(self):
        '''
        Returns the grayscale version of the loaded image. A 2-D image is taken
        as already grayscale and returned as is.
        '''
        if np.ndim(self.img) == 2:
            return self.img
        return cv.cvtColor(self.img, cv.COLOR_BGR2GRAY)

    def _crop(self, gray, coord):
        '''
        Slices the ROI of one box out of a grayscale image.
        :param gray: 2-D grayscale image
        :param coord: (x, y, w, h) of the box; w and h are not used
        :return: view on gray, rows y+4 .. y+height-1 and columns x+5 .. x+width-1
        '''
        x, y, _, _ = coord
        # Offsets 4 and 5 skip the top and left edges of the box
        return gray[y + 4:y + self.height, x + 5:x + self.width]

    def extract_roi_inside_box(self, coord):
        '''
        Extracts image (region of interest - ROI) located inside given coordinates, on the scanned image
        :param coord: list of 4 coordinates (x, y, w, h)
        :return: image (ROI) of dimension [height - 4, width - 5] when the box lies inside the image
        '''
        return self._crop(self._gray_image(), coord)

    def extract_roi_symbols(self, coord_list):
        '''
        Iterates through coordinates to extract all the images (ROI) corresponding to symbols index.
        Boxes must be properly aligned and reordered for index-based selection to work.
        Result is stored in self.roi_symbols.
        :param coord_list: array of X coordinates (X, 4)
        '''
        # Grayscale conversion is done once for the whole batch, not once per box
        gray = self._gray_image()
        self.roi_symbols = np.array([self._crop(gray, coord) for coord in coord_list[self.symbols_index]])

    def extract_roi_all(self, coord_list):
        '''
        Iterates through coordinates to extract all the images (ROI), not only the symbols.
        Result is stored in self.roi_all.
        :param coord_list: array of X coordinates (X, 4)
        '''
        # Grayscale conversion is done once for the whole batch, not once per box
        gray = self._gray_image()
        self.roi_all = np.array([self._crop(gray, coord) for coord in coord_list])