hytos / DTI_PID / DTI_PID / TextDetector.py @ ae3a61a6


# coding: utf-8
"""
    This is the text detector module
"""
import sys
import os
import cv2
import numpy as np
from PyQt5.QtCore import *
from PyQt5.QtGui import *
from PyQt5.QtWidgets import *
from PyQt5.QtSvg import *

from AppDocData import *
import TextInfo as ti
import tesseract_ocr_module as TOCR

MIN_TEXT_SIZE = 10
THREAD_MAX_WORKER = os.cpu_count()


class TextDetector:
    '''
        @brief  constructor
        @author humkyung
        @date   2018.07.11
    '''

    def __init__(self):
        self.textInfoList = []
        self.otherTextInfoList = []
        self.titleBlockTextInfoList = []

    '''
        @brief  detect text areas
        @author humkyung
        @date   2018.06.16
    '''

    def detectTextAreas(self, img, offset):
        tInfoList = []
        try:
            tInfoList = self.getTextAreaInfo(img, offset[0], offset[1])
        except Exception as ex:
            print('error occurred({}) in {}:{}'.format(ex, sys.exc_info()[-1].tb_frame.f_code.co_filename,
                                                       sys.exc_info()[-1].tb_lineno))

        return tInfoList

    '''
        @brief      Get Text Area info by contour
        @author     Jeongwoo
        @date       2018.06.05
        @history    2018.06.08  Jeongwoo    Add angle
                    humkyung 2018.06.18 fixed logic to detect text area
    '''

    def getTextAreaInfo(self, imgGray, offsetX, offsetY):
        from AppDocData import AppDocData

        appDocData = AppDocData.instance()
        project = appDocData.getCurrentProject()

        configs = appDocData.getConfigs('Text Size', 'Max Text Size')
        maxTextSize = int(configs[0].value) if 1 == len(configs) else 100
        minSize = 5

        contourImg = np.ones(imgGray.shape, np.uint8) * 255
        binaryImg, mask = cv2.threshold(imgGray, 0, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU)
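        # note: cv2.threshold returns a (threshold value, binary image) pair, so binaryImg above
        # actually holds the Otsu threshold value and mask holds the binarized image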

        contours, hierarchy = cv2.findContours(mask, cv2.RETR_TREE, cv2.CHAIN_APPROX_NONE)
        for contour in contours:
            # remove contours that are too big or that are horizontal/vertical lines
            [x, y, w, h] = cv2.boundingRect(contour)
            area = cv2.contourArea(contour, True)
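            # note: with oriented=True the area is signed by the contour orientation, so outer
            # contours and holes get opposite signs; the code below fills non-negative (outer)
            # contours black with a white outline and fills negative (hole) contours white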

            # skip contours whose size is greater than the max size or less than the minimum size
            if area >= 0:
                if (w > maxTextSize or h > maxTextSize) or (w <= minSize and h <= minSize): continue

            if area >= 0:
                cv2.drawContours(contourImg, [contour], -1, (0, 0, 0), -1)
                cv2.drawContours(contourImg, [contour], -1, (255, 255, 255), 1)
            else:
                cv2.drawContours(contourImg, [contour], -1, (255, 255, 255), -1)

        path = os.path.join(project.getTempPath(), 'OCR_{}.png'.format(appDocData.imgName))
        cv2.imwrite(path, contourImg)

        rects = []
        configs = appDocData.getConfigs('Text Recognition', 'Expand Size')
        expandSize = int(configs[0].value) if 1 == len(configs) else 10
        configs = appDocData.getConfigs('Text Recognition', 'Shrink Size')
        shrinkSize = int(configs[0].value) if 1 == len(configs) else 0

        eroded = cv2.erode(contourImg, np.ones((expandSize, expandSize), np.uint8))
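        # note: eroding the white background with an (expandSize x expandSize) kernel grows the
        # black text strokes, so nearby characters merge into a single blob for the next
        # findContours pass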
        # path = os.path.join(project.getTempPath(), 'ERODED_OCR_{}.png'.format(appDocData.imgName))
        # cv2.imwrite(path, eroded)

        eroded = cv2.bitwise_not(eroded)
        # path = os.path.join(project.getTempPath(), 'bitwise_not_{}.png'.format(appDocData.imgName))
        # cv2.imwrite(path, eroded)

        contours, hierarchy = cv2.findContours(eroded, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
        for contour in contours:
            area = cv2.contourArea(contour, True)
            if area < 0:
                [x, y, w, h] = cv2.boundingRect(contour)

                img = contourImg[y:y + h, x:x + w]
                img = cv2.bitwise_not(img)

                horizontal, max_width = 0, 0
                vertical, max_height = 0, 0
                _contours, _ = cv2.findContours(img, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
                for xx in _contours:
                    [_x, _y, _w, _h] = cv2.boundingRect(xx)
                    cv2.rectangle(img, (_x, _y), (_x + _w, _y + _h), 255, 1)

                    max_width = _x if _x > max_width else max_width
                    max_height = _y if _y > max_height else max_height

                    if (_w < _h) or (_w > maxTextSize and _h < maxTextSize):  # taller-than-wide (or long horizontal) boxes vote for horizontal text
                        horizontal += 1 + (_w * _h) / (w * h)
                    else:
                        vertical += 1 + (_w * _h) / (w * h)

                if (w < 10 and h < 10) or (
                        max_width > maxTextSize and max_height > maxTextSize): continue  # skip regions that are too small or too big

                """
                if w > maxTextSize:
                    horizontal = 1
                elif h > maxTextSize:
                    vertical = 1
                else:
                    if shrinkSize > 0:
                        img = cv2.erode(img, np.ones((shrinkSize,shrinkSize), np.uint8))

                    _contours, _ = cv2.findContours(img, cv2.RETR_CCOMP, cv2.CHAIN_APPROX_SIMPLE)
                    for xx in _contours:
                        [_x, _y, _w, _h] = cv2.boundingRect(xx)
                        cv2.rectangle(img, (_x, _y), (_x+_w, _y+_h), 255, 1)

                        if (_w < _h) or (_w > maxTextSize and _h < maxTextSize): # width is greater than height
                            horizontal += 1 + (_w*_h)/(w*h)
                        else:
                            vertical += 1 + (_w*_h)/(w*h)
                """

                """
                if horizontal > vertical:
                    filePath = os.path.join(project.getTempPath(), "Tile", "H-{}-{}-{}-{}.png".format(x,y,w,h))
                else:
                    filePath = os.path.join(project.getTempPath(), "Tile", "V-{}-{}-{}-{}.png".format(x,y,w,h))
                cv2.imwrite(filePath, img)
                """

                rects.append([0 if horizontal > vertical else 90, QRect(x, y, w, h)])
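                # the stored angle is 0 for horizontal text and 90 for vertical text, based on the vote above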

        configs = appDocData.getConfigs('Text Recognition', 'Merge Size')
        mergeSize = int(configs[0].value) if 1 == len(configs) else 10
        # merge rectangles
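        # each rectangle is expanded by mergeSize along its text direction (QRect.adjusted);
        # rectangles with the same angle that then intersect are united (QRect.united), and the
        # scan restarts until no further merges occur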
        intersected = True
        while intersected:
            intersected = False
            for rect in rects[:]:  # clone rects
                if 0 == rect[0]:
                    rectExpand = rect[1].adjusted(-mergeSize, 0, mergeSize, 0)
                else:
                    rectExpand = rect[1].adjusted(0, -mergeSize, 0, mergeSize)

                matches = [x for x in rects if (x[0] == rect[0]) and rectExpand.intersects(x[1])]
                if len(matches) > 1:
                    united = matches[0]
                    for _rect in matches:
                        united[1] = united[1].united(_rect[1])
                        if _rect in rects: rects.remove(_rect)
                    rects.append(united)
                    intersected = True
                    break

        textAreas = []
        for rect in rects:
            angle = rect[0]
            textAreas.append(ti.TextInfo('', round(offsetX) + rect[1].x(), round(offsetY) + rect[1].y(), rect[1].width(),
                                         rect[1].height(), angle))

            x = rect[1].x()
            y = rect[1].y()
            w = rect[1].width()
            h = rect[1].height()
            img = contourImg[y:y + h, x:x + w]
            ## DEBUG
            # if angle == 0:
            #    filePath = os.path.join(project.getTempPath(), "Tile", "H-{}-{}-{}-{}.png".format(x,y,w,h))
            # else:
            #    filePath = os.path.join(project.getTempPath(), "Tile", "V-{}-{}-{}-{}.png".format(x,y,w,h))
            # cv2.imwrite(filePath, img)
            ## up to here

        return textAreas

    '''
        @brief      recognize text of given text info
        @author     humkyung
        @date       2018.07.24
        @history    change parameter updateProgressSignal to worker
                    2018.11.08 euisung     add white char list check process on db
    '''

    @staticmethod
    def recognizeTextFromImage(tInfos, imgOCR, offset, searchedSymbolList, worker, listWidget, maxProgressValue):
        import re
        res = []

        app_doc_data = AppDocData.instance()

        try:
            for tInfo in tInfos:
                x = tInfo.getX() - round(offset[0])
                y = tInfo.getY() - round(offset[1])
                img = imgOCR[y:y + tInfo.getH(), x:x + tInfo.getW()]

                # set angle to 0 if the symbol that contains the text area is an instrumentation symbol
                category = None
                contains = [symbol for symbol in searchedSymbolList if symbol.contains(tInfo)]
                if contains:
                    _type = contains[0].getType()
                    category = app_doc_data.getSymbolCategoryByType(_type)
                    if 'Instrumentation' == category:
                        tInfo.setAngle(0)
                # up to here

                whiteCharList = app_doc_data.getConfigs('Text Recognition', 'White Character List')
                if len(whiteCharList) == 0:
                    resultTextInfo = TOCR.getTextInfo(img, (x, y), tInfo.getAngle(), language=app_doc_data.OCRData)
                else:
                    resultTextInfo = TOCR.getTextInfo(img, (x, y), tInfo.getAngle(), language=app_doc_data.OCRData,
                                                      conf=whiteCharList[0].value)

                if resultTextInfo is not None and len(resultTextInfo) > 0:
                    for result in resultTextInfo:
                        result.setX(result.getX() + round(offset[0]))
                        result.setY(result.getY() + round(offset[1]))
                        if 'Instrumentation' == category:
                            text = re.sub('[^a-zA-Z0-9]+', '', result.getText())
                            result.setText(text)

                    res.extend(resultTextInfo)

                    if listWidget is not None:
                        item = QListWidgetItem(
                            '{},{},{} is recognized'.format(resultTextInfo[0].getX(), resultTextInfo[0].getY(),
                                                            resultTextInfo[0].getText()))
                        listWidget.addItem(item)
                else:
                    pass

                if worker is not None:
                    worker.updateProgress.emit(maxProgressValue,
                                               resultTextInfo[0].getText() if resultTextInfo is not None and 1 == len(
                                                   resultTextInfo) else None)
        except Exception as ex:
            message = 'error occurred({}) in {}:{}'.format(repr(ex), sys.exc_info()[-1].tb_frame.f_code.co_filename,
                                                           sys.exc_info()[-1].tb_lineno)
            if worker is not None:
                worker.displayLog.emit(MessageType.Error, message)

        return res

    '''
        @brief      read image drawing and then remove text
        @author     jwkim
        @date       
        @history    humkyung 2018.04.06 check if file exists
                    Jeongwoo 2018.05.09 Use Tesseract OCR after Azure OCR (Azure OCR : Getting text area)
                    Jeongwoo 2018.05.25 Add condition on if-statement
                    Jeongwoo 2018.06.05 Get text area data list by config.type
                    Jeongwoo 2018.06.08 Add angle Parameter on TOCR.getTextInfo
                    humkyung 2018.06.16 update progressbar while recognizing text
                    humkyung 2018.07.03 remove white space and replace given oldStr with newStr
                    humkyung 2018.07.07 change method name to recognizeText
                    euisung  2018.11.08 add white char list check process on db
                    euisung  2018.11.12 add title block properties
    '''

    def recognizeText(self, imgSrc, offset, tInfoList, searchedSymbolList, worker, listWidget, maxProgressValue,
                      onlyTextArea=False):
        import concurrent.futures as futures
        from multiprocessing import Process, Queue
        from Area import Area

        try:
            self.otherTextInfoList = []
            self.titleBlockTextInfoList = []
            self.textInfoList = []

            appDocData = AppDocData.instance()
            project = appDocData.getCurrentProject()

            path = os.path.join(project.getTempPath(), 'OCR_{}.png'.format(appDocData.imgName))
            if os.path.isfile(path):
                imgOCR = cv2.imread(path, 1)
                imgOCR = \
                cv2.threshold(cv2.cvtColor(imgOCR, cv2.COLOR_BGR2GRAY), 0, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU)[1]

                text_info_array = np.array_split(tInfoList, THREAD_MAX_WORKER)
                pool = futures.ThreadPoolExecutor(max_workers=THREAD_MAX_WORKER)
                for tInfo in text_info_array:
                    future = pool.submit(TextDetector.recognizeTextFromImage, tInfo, imgOCR, offset, searchedSymbolList,
                                         worker, listWidget, maxProgressValue)
                    data = future.result()
                    if data:
                        self.textInfoList.extend(data)
                pool.shutdown(wait=True)
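                # note: future.result() is awaited inside the submit loop above, so each chunk is
                # processed before the next one is submitted and the pool does not actually run
                # the chunks concurrently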

                # remove text items that have only 1 character
                # for index in range(len(self.textInfoList) - 1, -1, -1):
                #    if len(self.textInfoList[index].getText()) is 1:
                #        self.textInfoList.pop(index)

                if onlyTextArea:
                    return
                # parse texts in areas other than the Drawing area
                whiteCharList = appDocData.getConfigs('Text Recognition', 'White Character List')
                for area in appDocData.getAreaList():
                    if area.name == 'Drawing': continue

                    if area.name == 'Note':
                        if area is not None and hasattr(area, 'img') and area.img is not None:
                            if len(whiteCharList) == 0:
                                texts = TOCR.getTextInfo(area.img, (area.x, area.y), 0, language='eng')
                            else:
                                texts = TOCR.getTextInfo(area.img, (area.x, area.y), 0, language='eng',
                                                         conf=whiteCharList[0].value)
                            self.otherTextInfoList.append([area.name, texts])
                    else:
                        img = imgSrc[round(area.y):round(area.y + area.height),
                              round(area.x):round(area.x + area.width)]
                        if len(whiteCharList) == 0:
                            texts = TOCR.getTextInfo(img, (area.x, area.y), 0, language='eng')
                        else:
                            texts = TOCR.getTextInfo(img, (area.x, area.y), 0, language='eng',
                                                     conf=whiteCharList[0].value)
                        if texts is not None and len(texts) > 0:
                            if area.name == 'Unit':
                                appDocData.activeDrawing.setAttr('Unit', texts[0].getText())
                            self.otherTextInfoList.append([area.name, texts])

                titleBlockProps = appDocData.getTitleBlockProperties()
                if titleBlockProps:
                    for titleBlockProp in titleBlockProps:
                        area = Area(titleBlockProp[0])
                        area.parse(titleBlockProp[2])
                        if not (titleBlockProp[3] and titleBlockProp[3] != ''):
                            img = imgSrc[round(area.y):round(area.y + area.height),
                                  round(area.x):round(area.x + area.width)]
                            if len(whiteCharList) == 0:
                                texts = TOCR.getTextInfo(img, (area.x, area.y), 0, language=appDocData.OCRData)
                            else:
                                texts = TOCR.getTextInfo(img, (area.x, area.y), 0, language='eng',
                                                         conf=whiteCharList[0].value)
                            texts = [ti.TextInfo('\n'.join([textInfo.getText() for textInfo in texts]), area.x, area.y,
                                                 area.width, area.height, 0)]
                        else:
                            texts = [ti.TextInfo(titleBlockProp[3], area.x, area.y, area.width, area.height, 0)]
                        self.titleBlockTextInfoList.append([area.name, texts])

                if worker is not None: worker.updateProgress.emit(maxProgressValue, None)
        except Exception as ex:
            message = 'error occurred({}) in {}:{}'.format(repr(ex), sys.exc_info()[-1].tb_frame.f_code.co_filename,
                                                           sys.exc_info()[-1].tb_lineno)
            worker.displayLog.emit(MessageType.Error, message)

    '''
        @brief      remove text from image
        @author     humkyung
        @date       2018.07.24
    '''

    def removeTextFromImage(self, imgSrc, offset):
        appDocData = AppDocData.instance()
        project = appDocData.getCurrentProject()

        path = os.path.join(project.getTempPath(), 'OCR_{}.png'.format(appDocData.imgName))
        if os.path.isfile(path):
            imgOCR = cv2.imread(path)
            imgOCR = \
            cv2.threshold(cv2.cvtColor(imgOCR, cv2.COLOR_BGR2GRAY), 127, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU)[1]

            # remove recognized text from image
            for text in self.textInfoList:
                x = round(text.getX() - offset[0])
                y = round(text.getY() - offset[1])
                width = round(text.getW())
                height = round(text.getH())
                self.removeText(imgSrc, (round(text.getX()), round(text.getY())), imgOCR[y:y + height, x:x + width])
            # up to here

    '''
        @brief  remove text from image by using ocr image
        @author
    '''

    def removeText(self, img, pt, imgOCR):
        try:
            x = round(pt[0])
            y = round(pt[1])
            width, height = imgOCR.shape[::-1]

            temp = img[y:y + height, x:x + width]
            imgOCR = cv2.erode(imgOCR, np.ones((3, 3), np.uint8))
            mask = cv2.bitwise_or(temp, imgOCR)
            imgXOR = cv2.bitwise_xor(temp, mask)
            img[y:y + height, x:x + width] = cv2.bitwise_not(imgXOR)
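            # the OR/XOR combination above whitens only the pixels that are black in both the
            # drawing and the (eroded) OCR text image, so text strokes are erased while other
            # dark pixels inside the box are preserved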

        except Exception as ex:
            print('error occurred({}) in {}:{}'.format(ex, sys.exc_info()[-1].tb_frame.f_code.co_filename,
                                                       sys.exc_info()[-1].tb_lineno))

        return img