/ - Diff - HYTOS - 일정관리

개정판 9e64682b

ID	9e64682b06b02763441d74216c281e7195d464b8
상위	ff3d1c7a
하위	0d0dfc38

김정우 이(가) 약 7년 전에 추가함

DTI_PID 중 drawFoundSymbols 내 Tesseract 사용 구문을 tesseract_ocr_module에 병합 / tesseract_ocr_module의 각 함수의 conf를 전역 변수 사용하여 통일화

     '''
         @history    2018.04.27  Jeongwoo    Remove Tesseract Log on listWidget
                     2018.05.04  Jeongwoo    Change method to OCR with tesseract_ocr_module.py
     '''
     def drawFoundSymbols(symbol, listWidget):
         global src
-...
             #kernel2 = np.ones((1, 1), np.uint8)
             #bitImg = cv2.erode(bitImg, kernel2)
             bitImg = cv2.resize(bitImg, None, fx = 2.0, fy = 2.0)
             im = Image.fromarray(bitImg)
             ocrData = pytesseract.image_to_boxes(im, config='-c tessedit_char_whitelist="-0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ" -psm 6')
             ### For image_to_boxes()
             if ocrData:
                 splitOcrData = ocrData.split('\n')
                 tList = []
                 lastCoord = (-1, -1) # Top-Right Coord
                 tText = []
                 ftSp = (-1, -1)
             try:
                 threadLock.acquire()
                 for data in splitOcrData:
                     sData = data.split(' ')
                     text = sData[0]
                     tsx = int(sData[1]) // 2
                     tsy = int(sData[2]) // 2
                     tex = int(sData[3]) // 2
                     tey = int(sData[4]) // 2
                     tw = tex - tsx
                     th = tey - tsy
                     global MIN_TEXT_SIZE
                     if WHITE_LIST_CHARS.find(text) >= 0:
                         if tw >= MIN_TEXT_SIZE or th >= MIN_TEXT_SIZE:
                             realTextSp = (-1, -1)
                             if symbolOcrOption == SymbolBase.OCR_OPTION_HALF_AND_HALF:
                                 realTextSp = (symbolSp[0]+inSqX+tsx, symbolSp[1]+((h//2) - tsy + inSqY))
                             else:
                                 realTextSp = (symbolSp[0]+inSqX+tsx, symbolSp[1]+tsy)
                             #cv2.rectangle(src, realTextSp, (realTextSp[0] + tw, realTextSp[1] + th), (0, 255, 255), 3)
                             removeText(srcGray, text, realTextSp[0], realTextSp[1], tw, th)
                             if lastCoord == (-1, -1):
                                 tText.append(text)
                                 ftSp = (tsx, tsy)
                             else:
                                 COORD_ADJUSTMENT = 15
                                 if (abs(lastCoord[1] - tsy) <= COORD_ADJUSTMENT and lastCoord[0] >= tsx - COORD_ADJUSTMENT and lastCoord[0] <= tsx + COORD_ADJUSTMENT) or (abs(lastCoord[0] - tsx) <= COORD_ADJUSTMENT and lastCoord[1] >= tsy - COORD_ADJUSTMENT and lastCoord[1] <= tsy + COORD_ADJUSTMENT):
                                     tText.append(text)
                                 else:
                                     if symbolOcrOption == SymbolBase.OCR_OPTION_ALL_FIND or symbolOcrOption == SymbolBase.OCR_OPTION_HALF_AND_HALF:
                                         tText.append(',')
                                     tText.append(text)
                             lastCoord = (tex, tsy) # Top-Right Coord
                 realSp = (symbolSp[0]+inSqX+ftSp[0], symbolSp[1]+inSqY+ftSp[1])
                 realEp = (symbolSp[0]+inSqX+lastCoord[0], symbolSp[1]+inSqY+lastCoord[1])
                 resultText = ''.join(tText)
                 cv2.putText(canvas, resultText, (realSp[0], realSp[1]+th), 2, 1.0, (0, 0, 0)) # cv2.FONT_HERSHEY_SIMPLEX
                 #textInfoList.append(ti.TextInfo(resultText, str(realSp[0]), str(realSp[1]), str(realEp[0]), str(realEp[1])))
                 # text value in symbol object update
                 index = [i for i, item in enumerate(searchedSymbolList) if item.getSp() == symbolSp]
                 if len(index) > 0:
                     searchedSymbolList[index[0]].setText(resultText)
                 im = Image.fromarray(bitImg)
                 sp = (0, 0)
                 if symbolOcrOption == SymbolBase.OCR_OPTION_HALF_AND_HALF:
                     sp = (symbolSp[0]+inSqX, symbolSp[1]+ inSqY)
                 else:
                     sp = (symbolSp[0]+inSqX, symbolSp[1] + inSqY)
                 tList = TOCR.getTextInfoInSymbol(bitImg, sp)
                 resultText = ''
                 if tList is not None:
                     for index in range(len(tList)):
                         textInfo = tList[index]
                         if index != 0:
                             resultText = resultText + ","
                         resultText = resultText + textInfo.getText()
                         cv2.putText(canvas, textInfo.getText(), (textInfo.getX(), textInfo.getY()), 2, 1.0, (0, 0, 0)) # cv2.FONT_HERSHEY_SIMPLEX
                     # text value in symbol object update
                     index = [i for i, item in enumerate(searchedSymbolList) if item.getSp() == symbolSp]
                     if len(index) > 0:
                         searchedSymbolList[index[0]].setText(resultText)
             except Exception as ex:
                 print('error occured({}) in {}:{}'.format(ex, sys.exc_info()[-1].tb_frame.f_code.co_filename, sys.exc_info()[-1].tb_lineno))
             finally:
                 threadLock.release()

     # Tell pytesseract where the Tesseract executable lives.
     # NOTE: this is a hard-coded absolute Windows path.
     pytesseract.pytesseract.tesseract_cmd = 'D:\\Program Files\\Tesseract-OCR\\tesseract.exe'
     # Module-level copy of the same executable path.
     # NOTE(review): where this name is consumed is not visible here - confirm it is still needed.
     tesseract_cmd = 'D:\\Program Files\\Tesseract-OCR\\tesseract.exe'
     # Shared Tesseract configuration string; it is the default `conf` argument of the OCR
     # helpers defined below so that they all run with the same options.
     # It selects page segmentation mode 6 and sets `tessedit_char_whitelist` to letters,
     # digits and a set of punctuation characters. The literal starts and ends with a
     # newline plus indentation because of the triple-quoted layout.
     DEFAULT_CONF = """
         --psm 6 -c tessedit_char_whitelist=abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-~.,/!@#$%&*(){}<>:;+=?\\"\\'
     """
     '''
         @brief      Get Text info in Symbol (Instrumentation, OPC, etc...)
         @author     Jeongwoo
         @date       2018.05.04
     '''
     def getTextInfoInSymbol(img, startPoint, flag = FLAG_IMAGE_TO_BOXES, conf = DEFAULT_CONF):
         """
             Group the characters Tesseract finds in a symbol image into text lines.

             The image is passed to pytesseract.image_to_boxes(); every reported
             character that is in the local white list and is at least
             MIN_TEXT_SIZE wide or tall is appended to the current line while its
             rectangle intersects the line rectangle, otherwise the current line is
             stored and a new one is started.

             @param  img         array accepted by Image.fromarray() (the symbol image)
             @param  startPoint  (x, y) offset added to every line position
             @param  flag        accepted for signature compatibility; not used in this function
             @param  conf        Tesseract config string forwarded to image_to_boxes()
             @return list of ti.TextInfo, one per detected line, each built as
                     ti.TextInfo(text, startPoint x + line x, startPoint y + line y,
                     line width, line height, 0); None when no character qualified
         """
         im = Image.fromarray(img)
         imgWidth = im.width
         imgHeight = im.height
         textInfoList = []
         WHITE_LIST_CHARS = "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ1234567890-"
         MIN_TEXT_SIZE = 10

         boundaryOcrData = pytesseract.image_to_boxes(im, config=conf, lang='eng')

         lastRT = (-1, -1)       # right-top corner of the last accepted character
         tempText = ''           # text collected for the line being built
         charHeight = -1         # tallest character seen so far in the current line
         lastCharHeight = -1     # height of the current line before the character under test
         lineSp = (-1, -1)       # left-top corner of the current line
         lineRect = None         # band from the line start to the right image edge

         # Split once instead of re-splitting the whole output on every iteration.
         for data in boundaryOcrData.split('\n'):
             # Tesseract box rows look like "<char> <left> <bottom> <right> <top> <page>".
             sData = data.split(' ')
             char = sData[0]
             # Empty output or a blank row yields char == '' and ''.find-style lookups
             # succeed for the empty string, so such rows must be rejected explicitly
             # before the coordinate fields are indexed.
             if len(sData) < 5 or not char or WHITE_LIST_CHARS.find(char) < 0:
                 continue

             csx = int(sData[1])
             # Box coordinates are measured from the bottom of the image; flip the top
             # edge so that csy is measured from the top like the rest of the code expects.
             csy = imgHeight - int(sData[4])
             cex = int(sData[3])
             cey = int(sData[2])
             cw = cex - csx
             ch = abs(cey - int(sData[4]))
             # Drop specks that are smaller than MIN_TEXT_SIZE in both directions.
             if cw < MIN_TEXT_SIZE and ch < MIN_TEXT_SIZE:
                 continue

             charHeight = max(charHeight, ch)
             currentRect = None
             if lastRT != (-1, -1):
                 # NOTE(review): QRect(int, int, int, int) takes (x, y, width, height) but
                 # right/bottom coordinates are passed here, which enlarges the rectangle.
                 # Left unchanged because the line grouping may rely on it - confirm intent.
                 currentRect = QRect(csx, csy, csx + cw, csy + ch)

             if lastRT == (-1, -1) and lineRect is None:
                 # Very first accepted character: open the first line.
                 tempText = tempText + char
                 lastRT = (csx+cw, csy)
                 lineSp = (csx, csy)
                 lastCharHeight = charHeight
                 lineRect = QRect(lineSp[0], lineSp[1], imgWidth - lineSp[0], charHeight)
             elif (lineRect is not None and currentRect is not None) and lineRect.intersects(currentRect):
                 # Character overlaps the current line band: extend the line.
                 tempText = tempText + char
                 lastRT = (csx+cw, min(lineSp[1], csy))
                 lineSp = (lineSp[0], min(lineSp[1], csy))
                 lastCharHeight = charHeight
                 lineRect.setHeight(charHeight)
             else:
                 # Save previous line
                 prevLineText = ti.TextInfo(tempText, startPoint[0]+lineSp[0], startPoint[1]+lineSp[1], lastRT[0] - lineSp[0], lastCharHeight, 0)
                 textInfoList.append(prevLineText)
                 # Start new line
                 tempText = char
                 charHeight = ch
                 # Reset together with charHeight; otherwise a one-character line would
                 # be stored with the height of the line that preceded it.
                 lastCharHeight = ch
                 lastRT = (csx + cw, csy)
                 lineSp = (csx, csy)
                 lineRect = QRect(lineSp[0], lineSp[1], imgWidth - lineSp[0], ch)

         # tempText is only empty when no character was accepted at all; callers
         # test the result against None in that case.
         if not tempText:
             return None

         # Flush the line that was still being built when the OCR rows ran out.
         textInfo = ti.TextInfo(tempText, startPoint[0]+lineSp[0], startPoint[1]+lineSp[1], lastRT[0] - lineSp[0], charHeight, 0)
         if textInfo not in textInfoList:
             textInfoList.append(textInfo)
         return textInfoList
     '''
         @brief      Get info about each character
         @author     Jeongwoo
         @date       2018.05.03
     '''
     def getCharactersInfo(img, startPoint, flag = FLAG_IMAGE_TO_BOXES, conf = """--psm 6 -c tessedit_char_whitelist=abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-~.,/!@#$%&*(){}<>:;+=?\\"\\'"""):
     def getCharactersInfo(img, startPoint, flag = FLAG_IMAGE_TO_BOXES, conf = DEFAULT_CONF):
         im = Image.fromarray(img)
         imgWidth = im.width
         imgHeight = im.height
-...
         @history    2018.04.26  Jeongwoo    Make TextInfo object with Calculated Coords (with BoundBox Coords)
                     2018.04.30  Jeongwoo    Add QRect.setHeight() in if-statement [(lineRect is not None and currentRect is not None) and lineRect.intersects(currentRect)]
     '''
     def getTextInfo(img, startPoint, flag = FLAG_IMAGE_TO_BOXES, conf = """--psm 6 -c tessedit_char_whitelist=abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-~.,/!@#$%&*(){}<>:;+=?\\"\\'"""):
     def getTextInfo(img, startPoint, flag = FLAG_IMAGE_TO_BOXES, conf = DEFAULT_CONF):
         im = Image.fromarray(img)
         imgWidth = im.width
         imgHeight = im.height
-...
         return textInfoList
     def removeTextFromNpArray(img, flag = FLAG_IMAGE_TO_BOXES, conf = '-c tessedit_char_whitelist="-0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ" -psm 6'):
     def removeTextFromNpArray(img, flag = FLAG_IMAGE_TO_BOXES, conf = DEFAULT_CONF):
         retImg = img.copy()
         for i in range(4):

내보내기 Unified diff

프로젝트

일반

사용자정보

HYTOS

개정판 9e64682b