0.2: variable filename

zvezdochiot · zvezdochiot · commit b83f8d6adba3 · 2019-11-23T20:49:49.000+03:00
diff --git a/LICENSE b/LICENSE
@@ -0,0 +1,30 @@
+Public Domain Mark 1.0
+ No Copyright
+
+    This work has been identified as being free of known restrictions
+    under copyright law, including all related and neighboring rights.
+
+    You can copy, modify, distribute and perform the work, even for
+    commercial purposes, all without asking permission. See Other
+    Information below.
+
+ Other Information
+
+    The work may not be free of known copyright restrictions in all
+    jurisdictions.
+
+    Persons may have other rights in or related to the work, such as
+    patent or trademark rights, and others may have rights in how the
+    work is used, such as publicity or privacy rights.
+
+    In some jurisdictions moral rights of the author may persist beyond
+    the term of copyright. These rights may include the right to be
+    identified as the author and the right to object to derogatory
+    treatments.
+
+    Unless expressly stated otherwise, the person who identified the work
+    makes no warranties about the work, and disclaims liability for all
+    uses of the work, to the fullest extent permitted by applicable law.
+
+    When using or citing the work, you should not imply endorsement by
+    the author or the person who identified the work.
diff --git a/img2txt.py b/img2txt.py
@@ -1,101 +1,117 @@
-import cv2
-import numpy as np
-#import pytesseract
-#pytesseract.pytesseract.tesseract_cmd = 'C:/Program Files (x86)/Tesseract-OCR/tesseract'
-#from PIL import Image
-#import image
-image = cv2.imread('test.jpg')
-#cv2.imshow('orig',image)
-#cv2.waitKey(0)
-
-  #Initial Processing of the image starts...!!!!!!!!!!!
-
-#grayscale
-gray = cv2.cvtColor(image,cv2.COLOR_BGR2GRAY)
-cv2.imshow('gray',gray)
-cv2.waitKey(0)
-
-#binary
-ret,thresh = cv2.threshold(gray,160,255,cv2.THRESH_BINARY_INV)
-cv2.imshow('Binarized',thresh)
-cv2.waitKey(0)
-
-#detecting edges>>>>
-
-edges=cv2.Canny(thresh,140,200)
-#cv2.imshow("edges",edges)
-
-#dilation
-kernel = np.ones((5,5), np.uint8)
-img_dilation = cv2.dilate(edges, kernel, iterations=1)
-cv2.imshow('dilated',img_dilation)
-cv2.waitKey(0)
-
-#Localization Horizontal projection
-(x,y)=img_dilation.shape
-z=[sum(y) for y in img_dilation]
-Tx=(((sum(z))/(len(z))/20))
-#print Tx
-
-
-#Vertical Projection
-ndilation=zip(*img_dilation)
-X=[sum(row) for row in ndilation]
-mean=(sum(X))/(len(X))
-maximofX=(max(X)/10)
-Ty=mean+maximofX
-#print Ty
-
-
-#Adaptive threashold for horizontal  projection
-th1 = cv2.adaptiveThreshold(img_dilation,Tx,cv2.ADAPTIVE_THRESH_MEAN_C,cv2.THRESH_BINARY,11,2) #block size and constant.
-    
-
-#Adaptive threashold for vertical projection
-th2 = cv2.adaptiveThreshold(img_dilation,Ty,cv2.ADAPTIVE_THRESH_MEAN_C,cv2.THRESH_BINARY,11,2)
-fthreashold=cv2.add(th1,th2)
-cv2.imshow("threashold1",fthreashold)
-
-
-
-        #Initial Processing of the image finishes....!!!!!
-
-
-#find contours
-im2,ctrs, hier = cv2.findContours(img_dilation.copy(), cv2.RETR_EXTERNAL,cv2.CHAIN_APPROX_SIMPLE)
-
-#sort contours
-sorted_ctrs = sorted(ctrs, key=lambda ctr: cv2.boundingRect(ctr)[0])
-
-for i, ctr in enumerate(sorted_ctrs):
-    # Get bounding box
-    #(x,y) be the top-left coordinate of the rectangle and (w,h) be its width and height
-    x, y, w, h = cv2.boundingRect(ctr)
-
-    #Removing the false area that are not textes.
-    if w<35 and h<35:
-        continue
-
-    # Getting ROI
-    roi = image[y:y+h, x:x+w]
-
-    #result = pytesseract.image_to_string(Image.open(roi))
-
-    # show ROI
-    #cv2.imshow(roi)
-    cv2.imshow('segment no:'+str(i),roi)
-    cv2.waitKey(0)
-    cv2.rectangle(image,(x,y),( x + w, y + h ),(90,0,255),1)
-    
-    #print result
-
-'''cv2.imshow('marked areas',image)
-cv2.waitKey(0)
-cv2.imwrite('final.jpg', image)
-
-
-result = pytesseract.image_to_string(Image.open('final.jpg'))
-with open('fiel12.txt',mode='w') as file:
-	file.write(result)
-	print("Done")
-'''
+#!/usr/bin/env python
+import sys
+import cv2
+import numpy as np
+#import pytesseract
+#pytesseract.pytesseract.tesseract_cmd = 'C:/Program Files (x86)/Tesseract-OCR/tesseract'
+#from PIL import Image
+#import image
+
+def imagetoregion(imagename, imagedest, segmentview):
+    """Find text-like regions in an image and outline them with boxes.
+
+    Each processing stage is shown in an OpenCV window, and every window
+    blocks until a key is pressed.
+
+    Args:
+        imagename: Path of the image to read.
+        imagedest: Path the annotated image is written to; only used
+            when ``segmentview`` is false.
+        segmentview: When true, show each detected region in its own
+            window and do not write ``imagedest``.
+
+    Raises:
+        IOError: If ``imagename`` cannot be read as an image.
+    """
+    image = cv2.imread(imagename)
+    if image is None:
+        # cv2.imread reports failure by returning None, not by raising.
+        raise IOError('cannot read image: ' + str(imagename))
+    cv2.imshow('orig', image)
+    cv2.waitKey(0)
+
+    # Grayscale.
+    gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
+    cv2.imshow('gray', gray)
+    cv2.waitKey(0)
+
+    # Inverted binary image: pixels at or below 160 become 255, others 0.
+    thresh = cv2.threshold(gray, 160, 255, cv2.THRESH_BINARY_INV)[1]
+    cv2.imshow('Binarized', thresh)
+    cv2.waitKey(0)
+
+    # Edge detection.
+    edges = cv2.Canny(thresh, 140, 200)
+    cv2.imshow("edges", edges)
+    cv2.waitKey(0)
+
+    # Dilate the edges with a 15x15 kernel.
+    kernel = np.ones((15, 15), np.uint8)
+    img_dilation = cv2.dilate(edges, kernel, iterations=1)
+    cv2.imshow('dilated', img_dilation)
+    cv2.waitKey(0)
+
+    # Horizontal projection (one sum per row). An explicit wide dtype
+    # guarantees the uint8 pixel values cannot wrap while being summed.
+    row_sums = img_dilation.sum(axis=1, dtype=np.float64)
+    Tx = float(row_sums.mean() / 20)
+
+    # Vertical projection (one sum per column).
+    col_sums = img_dilation.sum(axis=0, dtype=np.float64)
+    Ty = float(col_sums.mean() + col_sums.max() / 10)
+
+    # Adaptive thresholds (block size 11, constant 2) with the two
+    # projection-derived values as the "on" value. The result is only
+    # displayed; the contour search below works on the dilated image.
+    th1 = cv2.adaptiveThreshold(img_dilation, Tx, cv2.ADAPTIVE_THRESH_MEAN_C,
+                                cv2.THRESH_BINARY, 11, 2)
+    th2 = cv2.adaptiveThreshold(img_dilation, Ty, cv2.ADAPTIVE_THRESH_MEAN_C,
+                                cv2.THRESH_BINARY, 11, 2)
+    fthreashold = cv2.add(th1, th2)
+    cv2.imshow("threashold1", fthreashold)
+    cv2.waitKey(0)
+
+    # findContours returns (image, contours, hierarchy) in OpenCV 3.x but
+    # (contours, hierarchy) in 2.x and 4.x; [-2] is the contours in all.
+    ctrs = cv2.findContours(img_dilation.copy(), cv2.RETR_EXTERNAL,
+                            cv2.CHAIN_APPROX_SIMPLE)[-2]
+
+    # Visit the contours from left to right.
+    sorted_ctrs = sorted(ctrs, key=lambda ctr: cv2.boundingRect(ctr)[0])
+
+    for i, ctr in enumerate(sorted_ctrs):
+        # (x, y) is the top-left corner, (w, h) the width and height.
+        x, y, w, h = cv2.boundingRect(ctr)
+
+        # Skip boxes under 35 px in both dimensions (treated as non-text).
+        if w < 35 and h < 35:
+            continue
+
+        if segmentview:
+            # Show the region of interest on its own.
+            roi = image[y:y+h, x:x+w]
+            cv2.imshow('segment no:'+str(i), roi)
+            cv2.waitKey(0)
+
+        cv2.rectangle(image, (x, y), (x + w, y + h), (90, 0, 255), 1)
+
+    cv2.namedWindow('marked areas', cv2.WINDOW_NORMAL)
+    cv2.resizeWindow('marked areas', 800, 600)
+    cv2.imshow('marked areas', image)
+    cv2.waitKey(0)
+    if not segmentview:
+        cv2.imwrite(imagedest, image)
+
+    # TODO: run OCR (e.g. pytesseract) on the marked image or regions and
+    # write the recognised text to a file.
+
+if __name__ == '__main__':
+    # Usage: img2txt.py [input image [output image]]
+    # Defaults: input 'test.jpg', output 'final.jpg'.
+    # Without an output path each region is shown in its own window and
+    # nothing is saved; with one, the annotated image is written to it.
+    args = sys.argv[1:]
+    filename = args[0] if args else 'test.jpg'
+    segmentview = len(args) < 2
+    filedest = 'final.jpg' if segmentview else args[1]
+    imagetoregion(filename, filedest, segmentview)