/ - Diff - HYTOS - 일정관리

개정판 e266373b

ID	e266373b3fcecacfe92671c875b2df1456338a42
상위	59560085
하위	1e67c5f1, 039c0a17

백흠경이(가) 6년 이상 전에 추가함

fixed issue #478:
- change logic to extract text from image

         return textInfoList
     '''
     """
         @history    2018.04.26  Jeongwoo    Make TextInfo object with Calculated Coords (with BoundBox Coords)
 .04.30  Jeongwoo    Add QRect.setHeight() in if-statement [(lineRect is not None and currentRect is not None) and lineRect.intersects(currentRect)]
 .05.09  Jeongwoo    Check split text's length
-...
 .06.08  Jeongwoo    Add angle Parameter and get rotated image's coords
 .06.14  Jeongwoo    Add try-except. If an exception occurred, return None
 .06.20  Jeongwoo    Remove variable [lastCharHeight] / Change variable [cey], [ch] / Change method to calculate text line height
     '''
                     humkyung 2018.10.12 change logic to extract text: first get the bounding boxes, then extract the characters
     """
     def getTextInfo(img, startPoint, angle = 0, flag = FLAG_IMAGE_TO_BOXES, conf = DEFAULT_CONF):
         try:
             textInfoList = []
             docData = AppDocData.instance()
             configs = docData.getConfigs('Text Size', 'Min Text Size')
             minSize = int(configs[0].value) if 1 == len(configs) else 30
-...
             im = im.rotate(-angle, expand=True)
             imgWidth = im.width
             imgHeight = im.height
             textOnlyOcrData = pytesseract.image_to_string(im, config=conf, lang='eng')
             textInfoList = []
             ADJUST = 2
             if textOnlyOcrData:
                 boundaryOcrData = pytesseract.image_to_boxes(im, config=conf, lang='eng')
                 text = textOnlyOcrData
                 text = re.sub('\n{1,}', '\n', text)
                 splitText = text.split('\n')
                 textGroupIndex = 0
                 lastRT = (-1, -1)
                 tempText = ''
                 charWidth = -1
                 charHeight = -1
                 lineSp = (-1, -1)
                 lineRect = None
                 for index in range(len(boundaryOcrData.split('\n'))):
                     data = boundaryOcrData.split('\n')[index]
                     sData = data.split(' ')
                     if len(sData) >= 5:
                         char = sData[0]
                         csx = int(sData[1])
                         csy = imgHeight - int(sData[4])
                         cex = int(sData[3])
                         cey = imgHeight - int(sData[2])
                         cw = cex - csx
                         ch = abs(cey - csy)
                         charWidth = max(charWidth, cw)
                         charHeight = max(charHeight, ch)
                         currentRect = None
                         if lastRT != (-1, -1):
                             currentRect = QRect(csx, csy, csx + cw, csy + ch)
                         if lastRT == (-1, -1) and lineRect is None:
                             tempText = tempText + char
                             lastRT = (csx+cw, csy)
                             lineSp = (csx, csy)
                             lineRect = QRect(lineSp[0], lineSp[1], imgWidth - lineSp[0], charHeight)
                         elif (lineRect is not None and currentRect is not None) and lineRect.intersects(currentRect):
                             tempText = tempText + char
                             lastRT = (csx+cw, min(lineSp[1], csy))
                             lineSp = (lineSp[0], min(lineSp[1], csy))
                             lineHeight = max(max(lineRect.height(), abs(cey - lineSp[1])), abs((lineRect.y()+lineRect.height()) - lineSp[1]))
                             lineRect.setX(lineSp[0])
                             lineRect.setY(lineSp[1])
                             lineRect.setHeight(lineHeight)
             boundaryOcrData = pytesseract.image_to_boxes(im, config=conf, lang='eng')
             bounding_boxes = boundaryOcrData.split('\n')
             merged_boxes = []
             for box in bounding_boxes:
                 if merged_boxes:
                     tokens = box.split(' ')
                     if len(tokens) >= 5:
                         minx = int(tokens[1])
                         miny = int(tokens[2])
                         maxx = int(tokens[3])
                         maxy = int(tokens[4])
                         top = merged_boxes[-1].top()
                         bottom = merged_boxes[-1].bottom()
                         if maxy < top or miny > bottom:
                             merged_boxes.append(QRect(minx, miny, maxx - minx, maxy - miny))
                         else:
                             # Save previous line
                             if len(splitText) > textGroupIndex:
                                 rect = QRect(lineSp[0], lineSp[1], lastRT[0]-lineSp[0], lineRect.height())
                                 if rect.height() >= minSize and rect.height() <= maxSize:
                                     if angle == 90 or angle == 270:
                                         transform = QTransform()
                                         transform.translate(imgHeight*0.5, imgWidth*0.5)
                                         transform.rotate(-angle)
                                         transform.translate(-imgWidth*0.5, -imgHeight*0.5)
                                         rect = transform.mapRect(rect)
                                     prevLineText = ti.TextInfo(splitText[textGroupIndex], startPoint[0]+rect.left(), startPoint[1]+rect.top(), rect.width(), rect.height(), angle)
                                     textInfoList.append(prevLineText)
                                 textGroupIndex = textGroupIndex + 1
                                 # Start new line
                                 tempText = char
                                 charWidth = cw
                                 charHeight = ch
                                 lastRT = (csx + cw, csy)
                                 lineSp = (csx, csy)
                                 lineRect = QRect(lineSp[0], lineSp[1], imgWidth - lineSp[0], ch)
                 if not (len(textInfoList) > textGroupIndex) and textGroupIndex < len(splitText):
                     rect = QRect(lineSp[0], lineSp[1], lastRT[0]-lineSp[0], lineRect.height())
                     if rect.height() >= minSize and rect.height() <= maxSize:
                         if angle == 90 or angle == 270:
                             transform = QTransform()
                             transform.translate(imgHeight*0.5, imgWidth*0.5)
                             transform.rotate(-angle)
                             transform.translate(-imgWidth*0.5, -imgHeight*0.5)
                             rect = transform.mapRect(rect)
                         textInfo = ti.TextInfo(splitText[textGroupIndex], startPoint[0]+rect.left(), startPoint[1]+rect.top(), rect.width(), rect.height(), angle)
                         if textInfo not in textInfoList:
                             textInfoList.append(textInfo)
                             merged_boxes[-1].setLeft(min(merged_boxes[-1].left(), minx))
                             merged_boxes[-1].setTop(min(merged_boxes[-1].top(), miny))
                             merged_boxes[-1].setRight(max(merged_boxes[-1].right(), maxx))
                             merged_boxes[-1].setBottom(max(merged_boxes[-1].bottom(), maxy))
                 else:
                     return None
             else:
                 pass
                     tokens = box.split(' ')
                     if len(tokens) >= 5:
                         minx = int(tokens[1])
                         miny = int(tokens[2])
                         maxx = int(tokens[3])
                         maxy = int(tokens[4])
                         merged_boxes.append(QRect(minx, miny, maxx - minx, maxy - miny))
             for rect in merged_boxes:
                 cropped = im.crop((rect.left(), imgHeight - rect.bottom(), rect.right(), imgHeight - rect.top()))
                 text = pytesseract.image_to_string(cropped, config=conf, lang='eng')
                 if rect.height() >= minSize and rect.height() <= maxSize:
                     text_rect = QRect(rect.left(), imgHeight - rect.bottom(), rect.width(), rect.height())
                     if angle == 90 or angle == 270:
                         transform  = QTransform()
                         transform.translate(imgHeight*0.5, imgWidth*0.5)
                         transform.rotate(-angle)
                         transform.translate(-imgWidth*0.5, -imgHeight*0.5)
                         text_rect = transform.mapRect(text_rect)
                     text_info = ti.TextInfo(text, startPoint[0] + text_rect.left(), startPoint[1] + text_rect.top(), text_rect.width(), text_rect.height(), angle)
                     textInfoList.append(text_info)
             return textInfoList
         except Exception as ex:
             from App import App

내보내기 Unified diff

프로젝트

일반

사용자정보

HYTOS

개정판 e266373b