我试图.pdf通过首先将其转换为图像然后使用 OpenCV来识别文档中的文本段落。但是我在文本行而不是段落上得到了边界框。如何设置一些阈值或其他限制来获取段落而不是行?
这是示例输入图像:
这是我为上述示例获得的输出:
我试图在中间的段落上获得一个边界框。我正在使用此代码。
import cv2
import numpy as np
large = cv2.imread('sample image.png')
rgb = cv2.pyrDown(large)
small = cv2.cvtColor(rgb, cv2.COLOR_BGR2GRAY)
# kernel = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (3, 3))
kernel = np.ones((5, 5), np.uint8)
grad = cv2.morphologyEx(small, cv2.MORPH_GRADIENT, kernel)
_, bw = cv2.threshold(grad, 0.0, 255.0, cv2.THRESH_BINARY | cv2.THRESH_OTSU)
kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (9, 1))
connected = cv2.morphologyEx(bw, cv2.MORPH_CLOSE, kernel)
# using RETR_EXTERNAL instead of RETR_CCOMP
contours, hierarchy = cv2.findContours(connected.copy(), cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
#For opencv 3+ comment the previous line …Run Code Online (Sandbox Code Playgroud) python opencv image-processing bounding-box text-recognition