如何使用Python构建一个文档扫描器?
data:image/s3,"s3://crabby-images/4b94f/4b94f6d32f774e3ef99889fdada0757523d4eebc" alt=""
pip install OpenCV-Python imutils scikit-image NumPy
data:image/s3,"s3://crabby-images/f94ea/f94ea7a7558265c50850cc0622ea537817786951" alt=""
import cv2
import imutils
from skimage.filters import threshold_local
from transform import perspective_transform
data:image/s3,"s3://crabby-images/0f0f2/0f0f29ffc04857a74326a731ae1b35f9841c807d" alt=""
# Passing the image path
original_img = cv2.imread('sample.jpg')
copy = original_img.copy()
# The resized height in hundreds
ratio = original_img.shape[0] / 500.0
img_resize = imutils.resize(original_img, height=500)
# Displaying output
cv2.imshow('Resized image', img_resize)
# Waiting for the user to press any key
cv2.waitKey(0)
data:image/s3,"s3://crabby-images/8a933/8a933eac7c55c35efdbd5109b90c98060a9450a4" alt=""
gray_image = cv2.cvtColor(img_resize, cv2.COLOR_BGR2GRAY)
cv2.imshow('Grayed Image', gray_image)
cv2.waitKey(0)
data:image/s3,"s3://crabby-images/f2ad9/f2ad918d4e297c646fc00c618ec8d5f8eafa19b2" alt=""
blurred_image = cv2.GaussianBlur(gray_image, (5, 5), 0)
edged_img = cv2.Canny(blurred_image, 75, 200)
cv2.imshow('Image edges', edged_img)
cv2.waitKey(0)
data:image/s3,"s3://crabby-images/b5e59/b5e5976318649372a6c351c1f798d437a176d13a" alt=""
cnts, _ = cv2.findContours(edged_img, cv2.RETR_LIST, cv2.CHAIN_APPROX_SIMPLE)
cnts = sorted(cnts, key=cv2.contourArea, reverse=True)[:5]
for c in cnts:
peri = cv2.arcLength(c, True)
approx = cv2.approxPolyDP(c, 0.02 * peri, True)
if len(approx) == 4:
doc = approx
break
p = []
for d in doc:
tuple_point = tuple(d[0])
cv2.circle(img_resize, tuple_point, 3, (0, 0, 255), 4)
p.append(tuple_point)
cv2.imshow('Circled corner points', img_resize)
cv2.waitKey(0)
data:image/s3,"s3://crabby-images/05a3f/05a3fdbf97bde51e1b619727ada1f996a4c044f3" alt=""
warped_image = perspective_transform(copy, doc.reshape(4, 2) * ratio)
warped_image = cv2.cvtColor(warped_image, cv2.COLOR_BGR2GRAY)
cv2.imshow("Warped Image", imutils.resize(warped_image, height=650))
cv2.waitKey(0)
import numpy as np
import cv2
def order_points(pts):
# initializing the list of coordinates to be ordered
rect = np.zeros((4, 2), dtype = "float32")
s = pts.sum(axis = 1)
# top-left point will have the smallest sum
rect[0] = pts[np.argmin(s)]
# bottom-right point will have the largest sum
rect[2] = pts[np.argmax(s)]
'''computing the difference between the points, the
top-right point will have the smallest difference,
whereas the bottom-left will have the largest difference'''
diff = np.diff(pts, axis = 1)
rect[1] = pts[np.argmin(diff)]
rect[3] = pts[np.argmax(diff)]
# returns ordered coordinates
return rect
def perspective_transform(image, pts):
# unpack the ordered coordinates individually
rect = order_points(pts)
(tl, tr, br, bl) = rect
'''compute the width of the new image, which will be the
maximum distance between bottom-right and bottom-left
x-coordinates or the top-right and top-left x-coordinates'''
widthA = np.sqrt(((br[0] - bl[0]) ** 2) + ((br[1] - bl[1]) ** 2))
widthB = np.sqrt(((tr[0] - tl[0]) ** 2) + ((tr[1] - tl[1]) ** 2))
maxWidth = max(int(widthA), int(widthB))
'''compute the height of the new image, which will be the
maximum distance between the top-left and bottom-left y-coordinates'''
heightA = np.sqrt(((tr[0] - br[0]) ** 2) + ((tr[1] - br[1]) ** 2))
heightB = np.sqrt(((tl[0] - bl[0]) ** 2) + ((tl[1] - bl[1]) ** 2))
maxHeight = max(int(heightA), int(heightB))
'''construct the set of destination points to obtain an overhead shot'''
dst = np.array([
[0, 0],
[maxWidth - 1, 0],
[maxWidth - 1, maxHeight - 1],
[0, maxHeight - 1]], dtype = "float32")
# compute the perspective transform matrix
transform_matrix = cv2.getPerspectiveTransform(rect, dst)
# Apply the transform matrix
warped = cv2.warpPerspective(image, transform_matrix, (maxWidth, maxHeight))
# return the warped image
return warped
data:image/s3,"s3://crabby-images/80888/808881bf7a85a6650171af512b55c551edfe1e68" alt=""
T = threshold_local(warped_image, 11, offset=10, method="gaussian")
warped = (warped_image > T).astype("uint8") * 255
cv2.imwrite('./'+'scan'+'.png',warped)
cv2.imshow("Final Scanned image", imutils.resize(warped, height=650))
cv2.waitKey(0)
cv2.destroyAllWindows()
data:image/s3,"s3://crabby-images/eaf25/eaf25897ef92c672c93d46e449465433f239b0d5" alt=""
原文链接:
https://www.makeuseof.com/python-create-document-scanner/
关注公众号:拾黑(shiheibook)了解更多
[广告]赞助链接:
四季很好,只要有你,文娱排行榜:https://www.yaopaiming.com/
让资讯触达的更精准有趣:https://www.0xu.cn/
data:image/s3,"s3://crabby-images/a8209/a8209b304fc92c07c96a4ef5d1141e5e2b6df1b9" alt="公众号"
随时掌握互联网精彩
赞助链接
排名
热点
搜索指数
- 1 大有可为 大显身手 7944091
- 2 《哪吒2》成全球动画电影票房榜第1 7977917
- 3 周星驰cos哪吒 7898685
- 4 早春时节农事忙 7729230
- 5 郭艾伦眼睛受重伤:瞎了我就不活了 7698434
- 6 胡歌看着女儿感觉时间不够用 7528379
- 7 多位高校领导被查 有人主动投案 7435683
- 8 湖北“狗狗山”爆火 网友直呼太像了 7349362
- 9 哈尔滨“冰马俑”被盘成了光头 7252931
- 10 俄方在沙特“三谈一不谈” 7198401