initial commit
commit
6404a3b3fa
@ -0,0 +1,45 @@
|
|||||||
|
# Measuring Size of Objects with OpenCV
|
||||||
|
### Calculates the size of objects based on a given reference object
|
||||||
|
|
||||||
|
Cool object size estimator with just OpenCV and python
|
||||||
|
|
||||||
|
All thanks to Adrian Rosebrock (from [pyimagesearch](https://www.pyimagesearch.com/)) for making
|
||||||
|
great tutorials. This project is inspired from his blog: [Measuring size of objects in an image with OpenCV](https://www.pyimagesearch.com/2016/03/28/measuring-size-of-objects-in-an-image-with-opencv/). I have included the author's code and the one i wrote my self as well.
|
||||||
|
|
||||||
|
## **Key Points**
|
||||||
|
1. Steps involved:
|
||||||
|
1. Find contours in the image.
|
||||||
|
2. Get the minimum area rectangle for the contours.
|
||||||
|
3. Draw the mid points and the lines joining mid points of the bounding rectangle of the contours.
|
||||||
|
4. Grab the reference object from the contours and calculate **Pixel Per Metric** ratio.
|
||||||
|
5. Calculate and print the bounding rectangle's dimensions based on the reference object's dimensions.
|
||||||
|
2. Assumptions:
|
||||||
|
1. There is a reference object in the image which is easy to find and it's width/height is know to us.
|
||||||
|
3. Uses "Pixel Per Metric" ratio to calculate the size based on the given reference object.
|
||||||
|
4. Reference object properties:
|
||||||
|
1. We should know the dimensions of this object (in terms of width or height).
|
||||||
|
2. We should be able to easily find this reference object in the image, either based on the placement of the object (like being placed in top-left corner, etc.) or via appearances (like distinctive color and/or shape).
|
||||||
|
5. Used the United States quarter as the reference object.
|
||||||
|
6. Used the OpenCV's find contours method to find the objects in the image and calculated their dimensions.
|
||||||
|
|
||||||
|
## **Requirements: (with versions i tested on)**
|
||||||
|
1. python (3.7.3)
|
||||||
|
2. opencv (4.1.0)
|
||||||
|
3. numpy (1.61.4)
|
||||||
|
4. imutils (0.5.2)
|
||||||
|
|
||||||
|
## **Commands to run the detection:**
|
||||||
|
```
|
||||||
|
python object_size.py --image images/example_01.png --width 0.955
|
||||||
|
```
|
||||||
|
|
||||||
|
## **Results:**
|
||||||
|
The results are pretty decent even though not perfect. This is due the limitations of the image itself as its not perfect top-down view of the objects and some calibrations could have also been done in the camera before clicking the picture.
|
||||||
|
|
||||||
|

|
||||||
|

|
||||||
|
|
||||||
|
|
||||||
|
## **The limitations**
|
||||||
|
1. This technique requires the image to be near perfect top-down view of the objects to calculate the accurate results. Otherwise the dimensions of the objects in the image may be distorted.
|
||||||
|
2. The photos are prone to radial and tangential lens distortion which would lead to uneven object dimensions.
|
||||||
Binary file not shown.
|
After Width: | Height: | Size: 684 KiB |
Binary file not shown.
|
After Width: | Height: | Size: 507 KiB |
Binary file not shown.
|
After Width: | Height: | Size: 380 KiB |
Binary file not shown.
|
After Width: | Height: | Size: 676 KiB |
Binary file not shown.
|
After Width: | Height: | Size: 417 KiB |
@ -0,0 +1,118 @@
|
|||||||
|
# USAGE
|
||||||
|
# python object_size.py --image images/example_01.png --width 0.955
|
||||||
|
# python object_size.py --image images/example_02.png --width 0.955
|
||||||
|
# python object_size.py --image images/example_03.png --width 3.5
|
||||||
|
|
||||||
|
# import the necessary packages
|
||||||
|
from scipy.spatial import distance as dist
|
||||||
|
from imutils import perspective
|
||||||
|
from imutils import contours
|
||||||
|
import numpy as np
|
||||||
|
import argparse
|
||||||
|
import imutils
|
||||||
|
import cv2
|
||||||
|
|
||||||
|
def midpoint(ptA, ptB):
|
||||||
|
return ((ptA[0] + ptB[0]) * 0.5, (ptA[1] + ptB[1]) * 0.5)
|
||||||
|
|
||||||
|
# construct the argument parse and parse the arguments
|
||||||
|
ap = argparse.ArgumentParser()
|
||||||
|
ap.add_argument("-i", "--image", required=True,
|
||||||
|
help="path to the input image")
|
||||||
|
ap.add_argument("-w", "--width", type=float, required=True,
|
||||||
|
help="width of the left-most object in the image (in inches)")
|
||||||
|
args = vars(ap.parse_args())
|
||||||
|
|
||||||
|
# load the image, convert it to grayscale, and blur it slightly
|
||||||
|
image = cv2.imread(args["image"])
|
||||||
|
gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
|
||||||
|
gray = cv2.GaussianBlur(gray, (7, 7), 0)
|
||||||
|
|
||||||
|
# perform edge detection, then perform a dilation + erosion to
|
||||||
|
# close gaps in between object edges
|
||||||
|
edged = cv2.Canny(gray, 50, 100)
|
||||||
|
edged = cv2.dilate(edged, None, iterations=1)
|
||||||
|
edged = cv2.erode(edged, None, iterations=1)
|
||||||
|
|
||||||
|
# find contours in the edge map
|
||||||
|
cnts = cv2.findContours(edged.copy(), cv2.RETR_EXTERNAL,
|
||||||
|
cv2.CHAIN_APPROX_SIMPLE)
|
||||||
|
cnts = imutils.grab_contours(cnts)
|
||||||
|
|
||||||
|
# sort the contours from left-to-right and initialize the
|
||||||
|
# 'pixels per metric' calibration variable
|
||||||
|
(cnts, _) = contours.sort_contours(cnts)
|
||||||
|
pixelsPerMetric = None
|
||||||
|
|
||||||
|
# loop over the contours individually
|
||||||
|
for c in cnts:
|
||||||
|
# if the contour is not sufficiently large, ignore it
|
||||||
|
if cv2.contourArea(c) < 100:
|
||||||
|
continue
|
||||||
|
|
||||||
|
# compute the rotated bounding box of the contour
|
||||||
|
orig = image.copy()
|
||||||
|
box = cv2.minAreaRect(c)
|
||||||
|
box = cv2.cv.BoxPoints(box) if imutils.is_cv2() else cv2.boxPoints(box)
|
||||||
|
box = np.array(box, dtype="int")
|
||||||
|
|
||||||
|
# order the points in the contour such that they appear
|
||||||
|
# in top-left, top-right, bottom-right, and bottom-left
|
||||||
|
# order, then draw the outline of the rotated bounding
|
||||||
|
# box
|
||||||
|
box = perspective.order_points(box)
|
||||||
|
cv2.drawContours(orig, [box.astype("int")], -1, (0, 255, 0), 2)
|
||||||
|
|
||||||
|
# loop over the original points and draw them
|
||||||
|
for (x, y) in box:
|
||||||
|
cv2.circle(orig, (int(x), int(y)), 5, (0, 0, 255), -1)
|
||||||
|
|
||||||
|
# unpack the ordered bounding box, then compute the midpoint
|
||||||
|
# between the top-left and top-right coordinates, followed by
|
||||||
|
# the midpoint between bottom-left and bottom-right coordinates
|
||||||
|
(tl, tr, br, bl) = box
|
||||||
|
(tltrX, tltrY) = midpoint(tl, tr)
|
||||||
|
(blbrX, blbrY) = midpoint(bl, br)
|
||||||
|
|
||||||
|
# compute the midpoint between the top-left and top-right points,
|
||||||
|
# followed by the midpoint between the top-righ and bottom-right
|
||||||
|
(tlblX, tlblY) = midpoint(tl, bl)
|
||||||
|
(trbrX, trbrY) = midpoint(tr, br)
|
||||||
|
|
||||||
|
# draw the midpoints on the image
|
||||||
|
cv2.circle(orig, (int(tltrX), int(tltrY)), 5, (255, 0, 0), -1)
|
||||||
|
cv2.circle(orig, (int(blbrX), int(blbrY)), 5, (255, 0, 0), -1)
|
||||||
|
cv2.circle(orig, (int(tlblX), int(tlblY)), 5, (255, 0, 0), -1)
|
||||||
|
cv2.circle(orig, (int(trbrX), int(trbrY)), 5, (255, 0, 0), -1)
|
||||||
|
|
||||||
|
# draw lines between the midpoints
|
||||||
|
cv2.line(orig, (int(tltrX), int(tltrY)), (int(blbrX), int(blbrY)),
|
||||||
|
(255, 0, 255), 2)
|
||||||
|
cv2.line(orig, (int(tlblX), int(tlblY)), (int(trbrX), int(trbrY)),
|
||||||
|
(255, 0, 255), 2)
|
||||||
|
|
||||||
|
# compute the Euclidean distance between the midpoints
|
||||||
|
dA = dist.euclidean((tltrX, tltrY), (blbrX, blbrY))
|
||||||
|
dB = dist.euclidean((tlblX, tlblY), (trbrX, trbrY))
|
||||||
|
|
||||||
|
# if the pixels per metric has not been initialized, then
|
||||||
|
# compute it as the ratio of pixels to supplied metric
|
||||||
|
# (in this case, inches)
|
||||||
|
if pixelsPerMetric is None:
|
||||||
|
pixelsPerMetric = dB / args["width"]
|
||||||
|
|
||||||
|
# compute the size of the object
|
||||||
|
dimA = dA / pixelsPerMetric
|
||||||
|
dimB = dB / pixelsPerMetric
|
||||||
|
|
||||||
|
# draw the object sizes on the image
|
||||||
|
cv2.putText(orig, "{:.1f}in".format(dimA),
|
||||||
|
(int(tltrX - 15), int(tltrY - 10)), cv2.FONT_HERSHEY_SIMPLEX,
|
||||||
|
0.65, (255, 255, 255), 2)
|
||||||
|
cv2.putText(orig, "{:.1f}in".format(dimB),
|
||||||
|
(int(trbrX + 10), int(trbrY)), cv2.FONT_HERSHEY_SIMPLEX,
|
||||||
|
0.65, (255, 255, 255), 2)
|
||||||
|
|
||||||
|
# show the output image
|
||||||
|
cv2.imshow("Image", orig)
|
||||||
|
cv2.waitKey(0)
|
||||||
@ -0,0 +1,91 @@
|
|||||||
|
from scipy.spatial import distance as dist
|
||||||
|
from imutils import perspective
|
||||||
|
from imutils import contours
|
||||||
|
import argparse
|
||||||
|
import numpy as np
|
||||||
|
import imutils
|
||||||
|
import cv2
|
||||||
|
|
||||||
|
|
||||||
|
def midpoint(ptA, ptB):
|
||||||
|
return ((ptA[0] + ptB[0]) * 0.5, (ptA[1] + ptB[1]) * 0.5)
|
||||||
|
|
||||||
|
def show_image(title, image, destroy_all=True):
|
||||||
|
cv2.imshow(title, image)
|
||||||
|
cv2.waitKey(0)
|
||||||
|
if destroy_all:
|
||||||
|
cv2.destroyAllWindows()
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
ap = argparse.ArgumentParser()
|
||||||
|
ap.add_argument("-i", "--image", required=True, help="path to the input image")
|
||||||
|
ap.add_argument("-w", "--width", type=float, required=True, help="width of the left-most object in the image (in inches)")
|
||||||
|
args = vars(ap.parse_args())
|
||||||
|
|
||||||
|
image = cv2.imread(args["image"])
|
||||||
|
gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
|
||||||
|
gray = cv2.GaussianBlur(gray, (7, 7), 0)
|
||||||
|
|
||||||
|
edged = cv2.Canny(gray, 50, 100)
|
||||||
|
show_image("Edged", edged, False)
|
||||||
|
edged = cv2.dilate(edged, None, iterations=1)
|
||||||
|
edged = cv2.erode(edged, None, iterations=1)
|
||||||
|
show_image("erode and dilate", edged, True)
|
||||||
|
|
||||||
|
cnts = cv2.findContours(edged, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
|
||||||
|
cnts = imutils.grab_contours(cnts)
|
||||||
|
print("Total number of contours are: ", len(cnts))
|
||||||
|
|
||||||
|
(cnts, _) = contours.sort_contours(cnts)
|
||||||
|
pixelPerMetric = None
|
||||||
|
|
||||||
|
|
||||||
|
count = 0
|
||||||
|
for c in cnts:
|
||||||
|
if cv2.contourArea(c) < 100:
|
||||||
|
continue
|
||||||
|
count += 1
|
||||||
|
|
||||||
|
orig = image.copy()
|
||||||
|
box = cv2.minAreaRect(c)
|
||||||
|
box = cv2.cv.BoxPoints(box) if imutils.is_cv2() else cv2.boxPoints(box)
|
||||||
|
box = np.array(box, dtype="int")
|
||||||
|
|
||||||
|
box = perspective.order_points(box)
|
||||||
|
cv2.drawContours(orig, [box.astype("int")], -1, (0, 255, 0), 2)
|
||||||
|
|
||||||
|
for (x, y) in box:
|
||||||
|
cv2.circle(orig, (int(x), int(y)), 5, (0, 0, 255), -1)
|
||||||
|
|
||||||
|
|
||||||
|
(tl, tr, br, bl) = box
|
||||||
|
(tltrX, tltrY) = midpoint(tl, tr)
|
||||||
|
(blbrX, blbrY) = midpoint(bl, br)
|
||||||
|
(tlblX, tlblY) = midpoint(tl, bl)
|
||||||
|
(trbrX, trbrY) = midpoint(tr, br)
|
||||||
|
|
||||||
|
cv2.circle(orig, (int(tltrX), int(tltrY)), 5, (255, 0, 0), -1)
|
||||||
|
cv2.circle(orig, (int(blbrX), int(blbrY)), 5, (255, 0, 0), -1)
|
||||||
|
cv2.circle(orig, (int(tlblX), int(tlblY)), 5, (255, 0, 0), -1)
|
||||||
|
cv2.circle(orig, (int(trbrX), int(trbrY)), 5, (255, 0, 0), -1)
|
||||||
|
|
||||||
|
cv2.line(orig, (int(tltrX), int(tltrY)), (int(blbrX), int(blbrY)), (255, 0, 255), 2)
|
||||||
|
cv2.line(orig, (int(tlblX), int(tlblY)), (int(trbrX), int(trbrY)), (255, 0, 255), 2)
|
||||||
|
|
||||||
|
dA = dist.euclidean((tltrX, tltrY), (blbrX, blbrY))
|
||||||
|
dB = dist.euclidean((tlblX, tlblY), (trbrX, trbrY))
|
||||||
|
|
||||||
|
if pixelPerMetric is None:
|
||||||
|
pixelPerMetric = dB / args["width"]
|
||||||
|
|
||||||
|
dimA = dA / pixelPerMetric
|
||||||
|
dimB = dB / pixelPerMetric
|
||||||
|
|
||||||
|
cv2.putText(orig, "{:.1f}in".format(dimA), (int(tltrX - 15), int(tltrY - 10)), cv2.FONT_HERSHEY_SIMPLEX, 0.65, (255, 255, 255), 2)
|
||||||
|
cv2.putText(orig, "{:.1f}in".format(dimB), (int(trbrX + 10), int(trbrY)), cv2.FONT_HERSHEY_SIMPLEX, 0.65, (255, 255, 255), 2)
|
||||||
|
|
||||||
|
cv2.imshow("Image", orig)
|
||||||
|
cv2.waitKey(0)
|
||||||
|
|
||||||
|
print("Total contours processed: ", count)
|
||||||
Loading…
Reference in New Issue