You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
34 lines
938 B
34 lines
938 B
import cv2
|
|
import logging
|
|
|
|
d = 1
|
|
|
|
while True:
|
|
try:
|
|
output = ('cropped/page%d.jpg'%d)
|
|
|
|
# Load image, convert to grayscale, and find edges
|
|
image = cv2.imread('split/input%d.jpg'%d)
|
|
gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
|
|
thresh = cv2.threshold(gray, 0, 255, cv2.THRESH_OTSU + cv2.THRESH_BINARY)[1]
|
|
|
|
# Find contour and sort by contour area
|
|
cnts = cv2.findContours(thresh, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
|
|
cnts = cnts[0] if len(cnts) == 2 else cnts[1]
|
|
cnts = sorted(cnts, key=cv2.contourArea, reverse=True)
|
|
|
|
# Find bounding box and extract ROI
|
|
for c in cnts:
|
|
x,y,w,h = cv2.boundingRect(c)
|
|
ROI = image[y:y+h, x:x+w]
|
|
break
|
|
|
|
cv2.imwrite(output,ROI)
|
|
cv2.waitKey()
|
|
|
|
d+=1
|
|
|
|
except:
|
|
logging.exception("message")
|
|
print("All pages must be ready!")
|
|
break
|
|
|