// dlib C++ Library - edge_detector.h

// Copyright (C) 2008 Davis E. King (davis@dlib.net)
// License: Boost Software License See LICENSE.txt for the full license.
#ifndef DLIB_EDGE_DETECTOr_
#define DLIB_EDGE_DETECTOr_
#include "edge_detector_abstract.h"
#include "../pixel.h"
#include "../array2d.h"
#include "../geometry.h"
#include <vector>
#include "../image_keypoint/build_separable_poly_filters.h"
namespace dlib
{
// ----------------------------------------------------------------------------------------
 /*!
     Classifies the direction of the 2D vector (x_, y_) into one of four
     orientation characters: '-', '|', '/' or '\\'.

     - x_ == 0 yields '|' and (otherwise) y_ == 0 yields '-'.
     - Otherwise the ratio 128*|x_|/|y_| is compared against two thresholds:
         - ratio > 309  (309/128 ~= tan(67.5 degrees))  -> '-'
         - ratio > 53   (53/128  ~= tan(22.5 degrees))  -> a diagonal
         - anything else                                 -> '|'
     - A diagonal is '/' when x_ and y_ have the same sign and '\\' when
       their signs differ.
 !*/
 template <
     typename T
     >
 inline char edge_orientation (
     const T& x_,
     const T& y_
 )
 {
     // Axis aligned vectors need no arithmetic at all (and the second test
     // also guarantees we never divide by zero below).
     if (x_ == 0)
         return '|';
     if (y_ == 0)
         return '-';

     // Work in the promoted type so that the multiplication by 128 below
     // cannot overflow.
     typedef typename promote<T>::type type;
     type x = x_;
     type y = y_;

     // Remember the signs, then continue with the magnitudes only.
     const bool x_is_negative = x < 0;
     const bool y_is_negative = y < 0;
     if (x_is_negative)
         x = -x;
     if (y_is_negative)
         y = -y;

     x *= 128;
     const type temp = x/y;

     if (temp > 309)
         return '-';
     if (temp > 53)
         return (x_is_negative == y_is_negative) ? '/' : '\\';
     return '|';
 }
// ----------------------------------------------------------------------------------------
 template <
 typename in_image_type,
 typename out_image_type
 >
 void sobel_edge_detector (
 const in_image_type& in_img_,
 out_image_type& horz_,
 out_image_type& vert_
 )
 {
 typedef typename image_traits<out_image_type>::pixel_type pixel_type;
 COMPILE_TIME_ASSERT(pixel_traits<pixel_type>::is_unsigned == false);
 DLIB_ASSERT( !is_same_object(in_img_,horz_) && !is_same_object(in_img_,vert_) &&
 !is_same_object(horz_,vert_),
 "\tvoid sobel_edge_detector(in_img_, horz_, vert_)"
 << "\n\t You can't give the same image as more than one argument"
 << "\n\t is_same_object(in_img_,horz_): " << is_same_object(in_img_,horz_)
 << "\n\t is_same_object(in_img_,vert_): " << is_same_object(in_img_,vert_)
 << "\n\t is_same_object(horz_,vert_): " << is_same_object(horz_,vert_)
 );
 const int vert_filter[3][3] = {{-1,-2,-1}, 
 {0,0,0}, 
 {1,2,1}};
 const int horz_filter[3][3] = { {-1,0,1}, 
 {-2,0,2}, 
 {-1,0,1}};
 const long M = 3;
 const long N = 3;
 const_image_view<in_image_type> in_img(in_img_);
 image_view<out_image_type> horz(horz_);
 image_view<out_image_type> vert(vert_);
 horz.set_size(in_img.nr(),in_img.nc());
 vert.set_size(in_img.nr(),in_img.nc());
 assign_border_pixels(horz,1,1,0);
 assign_border_pixels(vert,1,1,0);
 // figure out the range that we should apply the filter to
 const long first_row = M/2;
 const long first_col = N/2;
 const long last_row = in_img.nr() - M/2;
 const long last_col = in_img.nc() - N/2;
 // apply the filter to the image
 for (long r = first_row; r < last_row; ++r)
 {
 for (long c = first_col; c < last_col; ++c)
 {
 typedef typename pixel_traits<typename image_traits<in_image_type>::pixel_type>::basic_pixel_type bp_type;
 typename promote<bp_type>::type p, horz_temp, vert_temp;
 horz_temp = 0;
 vert_temp = 0;
 for (long m = 0; m < M; ++m)
 {
 for (long n = 0; n < N; ++n)
 {
 // pull out the current pixel and put it into p
 p = get_pixel_intensity(in_img[r-M/2+m][c-N/2+n]);
 horz_temp += p*horz_filter[m][n];
 vert_temp += p*vert_filter[m][n];
 }
 }
 assign_pixel(horz[r][c] , horz_temp);
 assign_pixel(vert[r][c] , vert_temp);
 }
 }
 }
// ----------------------------------------------------------------------------------------
 namespace impl
 {
     /*!
         Returns a*a computed in the promoted type of T.

         The operands are widened to promote<T>::type *before* they are
         multiplied.  Casting to T (which is what a already is) would perform
         the multiplication in the narrow type, so the product could overflow
         (or lose precision) before being widened for the return value.
     !*/
     template <typename T>
     typename promote<T>::type square (const T& a)
     {
         typedef typename promote<T>::type wide_type;
         const wide_type wide = static_cast<wide_type>(a);
         return wide*wide;
     }
 }
 template <
 typename in_image_type,
 typename out_image_type
 >
 void suppress_non_maximum_edges (
 const in_image_type& horz_,
 const in_image_type& vert_,
 out_image_type& out_img_
 )
 {
 const_image_view<in_image_type> horz(horz_);
 const_image_view<in_image_type> vert(vert_);
 image_view<out_image_type> out_img(out_img_);
 COMPILE_TIME_ASSERT(is_signed_type<typename image_traits<in_image_type>::pixel_type>::value);
 DLIB_ASSERT( horz.nr() == vert.nr() && horz.nc() == vert.nc(),
 "\tvoid suppress_non_maximum_edges(horz, vert, out_img)"
 << "\n\tYou have to give horz and vert gradient images that are the same size"
 << "\n\thorz.nr(): " << horz.nr() 
 << "\n\thorz.nc(): " << horz.nc() 
 << "\n\tvert.nr(): " << vert.nr() 
 << "\n\tvert.nc(): " << vert.nc() 
 );
 DLIB_ASSERT( !is_same_object(out_img_,horz_) && !is_same_object(out_img_,vert_),
 "\tvoid suppress_non_maximum_edges(horz_, vert_, out_img_)"
 << "\n\t out_img can't be the same as one of the input images."
 << "\n\t is_same_object(out_img_,horz_): " << is_same_object(out_img_,horz_)
 << "\n\t is_same_object(out_img_,vert_): " << is_same_object(out_img_,vert_)
 );
 using std::min;
 using std::abs;
 // if there isn't any input image then don't do anything
 if (horz.size() == 0)
 {
 out_img.clear();
 return;
 }
 out_img.set_size(horz.nr(),horz.nc());
 zero_border_pixels(out_img,1,1);
 // now do non maximum suppression while we copy the 
 const long M = 3;
 const long N = 3;
 // figure out the range that we should apply the filter to
 const long first_row = M/2;
 const long first_col = N/2;
 const long last_row = horz.nr() - M/2;
 const long last_col = horz.nc() - N/2;
 // apply the filter to the image
 for (long r = first_row; r < last_row; ++r)
 {
 for (long c = first_col; c < last_col; ++c)
 {
 typedef typename promote<typename image_traits<in_image_type>::pixel_type>::type T;
 const T y = horz[r][c];
 const T x = vert[r][c];
 using impl::square;
 const T val = square(horz[r][c]) + square(vert[r][c]); 
 const char ori = edge_orientation(x,y);
 const unsigned char zero = 0;
 switch (ori)
 {
 case '-':
 if (square(horz[r-1][c])+square(vert[r-1][c]) > val || square(horz[r+1][c]) + square(vert[r+1][c]) > val)
 assign_pixel(out_img[r][c] , zero);
 else
 assign_pixel(out_img[r][c] , std::sqrt((double)val));
 break;
 case '|':
 if (square(horz[r][c-1]) + square(vert[r][c-1]) > val || square(horz[r][c+1]) + square(vert[r][c+1]) > val)
 assign_pixel(out_img[r][c] , zero);
 else
 assign_pixel(out_img[r][c] , std::sqrt((double)val));
 break;
 case '/':
 if (square(horz[r-1][c-1]) + square(vert[r-1][c-1]) > val || square(horz[r+1][c+1]) + square(vert[r+1][c+1]) > val)
 assign_pixel(out_img[r][c] , zero);
 else
 assign_pixel(out_img[r][c] , std::sqrt((double)val));
 break;
 case '\\':
 if (square(horz[r+1][c-1]) + square(vert[r+1][c-1]) > val || square(horz[r-1][c+1]) + square(vert[r-1][c+1]) > val)
 assign_pixel(out_img[r][c] , zero);
 else
 assign_pixel(out_img[r][c] , std::sqrt((double)val));
 break;
 }
 }
 }
 }
// ----------------------------------------------------------------------------------------
 /*!
     Rescales, in place, every gradient vector (img1_[r][c], img2_[r][c]) to
     unit length.  Vectors whose two components are both 0 are left untouched.

     Both images must have the same dimensions and use float, double or
     long double pixels.
 !*/
 template <
     typename image_type
     >
 void normalize_image_gradients (
     image_type& img1_,
     image_type& img2_
 )
 {
     image_view<image_type> img1(img1_);
     image_view<image_type> img2(img2_);

     using pixel_type = typename image_traits<image_type>::pixel_type;
     static_assert(std::is_same<pixel_type,float>::value ||
                   std::is_same<pixel_type,double>::value ||
                   std::is_same<pixel_type,long double>::value,
         "normalize_image_gradients() requires the input images to use floating point pixel types.");

     DLIB_CASSERT(img1.nr() == img2.nr());
     DLIB_CASSERT(img1.nc() == img2.nc());

     const long num_rows = img1.nr();
     const long num_cols = img1.nc();

     for (long r = 0; r < num_rows; ++r)
     {
         for (long c = 0; c < num_cols; ++c)
         {
             // A zero vector has no direction, so there is nothing to normalize.
             if (img1[r][c] == 0 && img2[r][c] == 0)
                 continue;

             const double len = std::sqrt(img1[r][c]*img1[r][c] + img2[r][c]*img2[r][c]);
             img1[r][c] /= len;
             img2[r][c] /= len;
         }
     }
 }
// ----------------------------------------------------------------------------------------
 template <
 typename image_type
 >
 std::vector<point> remove_incoherent_edge_pixels (
 const std::vector<point>& line,
 const image_type& horz_gradient_,
 const image_type& vert_gradient_,
 double angle_threshold
 )
 {
 const_image_view<image_type> horz_gradient(horz_gradient_);
 const_image_view<image_type> vert_gradient(vert_gradient_);
 DLIB_CASSERT(horz_gradient.nr() == vert_gradient.nr());
 DLIB_CASSERT(horz_gradient.nc() == vert_gradient.nc());
 DLIB_CASSERT(angle_threshold >= 0);
#ifdef ENABLE_ASSERTS
 for (auto& p : line)
 DLIB_ASSERT(get_rect(horz_gradient).contains(p), "All line points must be inside the given images.");
#endif
 // We make sure that each vector is within this threshold of the mean vector. So
 // to make sure they are pairwise within the user supplied angel threshold we need
 // to divide by 2 before we proceed.
 angle_threshold /= 2;
 const double dotthresh = std::cos(angle_threshold*pi/180);
 // find the average gradient on this line
 dpoint avg;
 for (auto p : line)
 avg += dpoint(horz_gradient[p.y()][p.x()], vert_gradient[p.y()][p.x()]);
 dpoint ref = avg.normalize();
 // now iterate a few times and find the most common average gradient.
 for (int i = 0; i < 10; ++i)
 {
 avg = dpoint();
 for (auto p : line)
 {
 const dpoint v(horz_gradient[p.y()][p.x()], vert_gradient[p.y()][p.x()]);
 const double dp = ref.dot(v);
 if (dp > dotthresh)
 avg += v;
 else if (-dp > dotthresh)
 avg -= v;
 }
 ref = avg.normalize();
 }
 // now remove all the points that deviate from the average gradient too much.
 std::vector<point> newpixels;
 for (auto p : line)
 {
 dpoint v(horz_gradient[p.y()][p.x()], vert_gradient[p.y()][p.x()]);
 if (std::abs(ref.dot(v)) > dotthresh)
 newpixels.push_back(p);
 }
 return newpixels;
 }
 template <
 typename image_type
 >
 std::vector<std::vector<point>> remove_incoherent_edge_pixels (
 const std::vector<std::vector<point>>& line_pixels,
 const image_type& horz_gradient_,
 const image_type& vert_gradient_,
 const double angle_threshold
 )
 {
 std::vector<std::vector<point>> temp;
 temp.reserve(line_pixels.size());
 for (auto& line : line_pixels)
 temp.emplace_back(remove_incoherent_edge_pixels(line, horz_gradient_, vert_gradient_, angle_threshold));
 return temp;
 }
// ----------------------------------------------------------------------------------------
 class image_gradients
 {
 public:
 image_gradients (
 ) : image_gradients(1) {}
 image_gradients (
 long scale
 ) : the_scale(scale)
 {
 DLIB_CASSERT(scale >= 1);
 scale = 2*scale+1;
 auto dfilters = build_separable_poly_filters(2,scale); 
 DLIB_CASSERT(dfilters[1].size() == 1);
 DLIB_CASSERT(dfilters[2].size() == 1);
 DLIB_CASSERT(dfilters[3].size() == 1);
 DLIB_CASSERT(dfilters[4].size() == 1);
 DLIB_CASSERT(dfilters[5].size() == 1);
 filter_x.first = matrix_cast<float>(dfilters[1][0].first);
 filter_x.second = matrix_cast<float>(dfilters[1][0].second);
 filter_y.first = matrix_cast<float>(dfilters[2][0].first);
 filter_y.second = matrix_cast<float>(dfilters[2][0].second);
 // We multiply by 2 so that the filter gives the gradient rather than the x^2
 // polynomial coefficient.
 filter_xx.first = 2*matrix_cast<float>(dfilters[3][0].first);
 filter_xx.second = matrix_cast<float>(dfilters[3][0].second);
 filter_xy.first = matrix_cast<float>(dfilters[4][0].first);
 filter_xy.second = matrix_cast<float>(dfilters[4][0].second);
 // We multiply by 2 so that the filter gives the gradient rather than the y^2
 // polynomial coefficient.
 filter_yy.first = 2*matrix_cast<float>(dfilters[5][0].first);
 filter_yy.second = matrix_cast<float>(dfilters[5][0].second);
 }
 long get_scale() const { return the_scale; }
 template <
 typename in_image_type,
 typename out_image_type
 >
 rectangle gradient_x(
 const in_image_type& img,
 out_image_type& out
 ) const 
 { 
 return spatially_filter_image_separable(img, out, filter_x.second, filter_x.first); 
 }
 template <
 typename in_image_type,
 typename out_image_type
 >
 rectangle gradient_y(
 const in_image_type& img,
 out_image_type& out
 ) const 
 { 
 return spatially_filter_image_separable(img, out, filter_y.second, filter_y.first); 
 }
 template <
 typename in_image_type,
 typename out_image_type
 >
 rectangle gradient_xx(
 const in_image_type& img,
 out_image_type& out
 ) const
 { 
 return spatially_filter_image_separable(img, out, filter_xx.second, filter_xx.first); 
 }
 template <
 typename in_image_type,
 typename out_image_type
 >
 rectangle gradient_xy(
 const in_image_type& img,
 out_image_type& out
 ) const 
 { 
 return spatially_filter_image_separable(img, out, filter_xy.second, filter_xy.first); 
 }
 template <
 typename in_image_type,
 typename out_image_type
 >
 rectangle gradient_yy(
 const in_image_type& img,
 out_image_type& out
 ) const
 { 
 return spatially_filter_image_separable(img, out, filter_yy.second, filter_yy.first); 
 }
 matrix<float> get_x_filter() const { return filter_x.first*trans(filter_x.second); }
 matrix<float> get_y_filter() const { return filter_y.first*trans(filter_y.second); }
 matrix<float> get_xx_filter() const { return filter_xx.first*trans(filter_xx.second); }
 matrix<float> get_xy_filter() const { return filter_xy.first*trans(filter_xy.second); }
 matrix<float> get_yy_filter() const { return filter_yy.first*trans(filter_yy.second); }
 private:
 std::pair<matrix<float,0,1>,matrix<float,0,1>> filter_x;
 std::pair<matrix<float,0,1>,matrix<float,0,1>> filter_y;
 std::pair<matrix<float,0,1>,matrix<float,0,1>> filter_xx;
 std::pair<matrix<float,0,1>,matrix<float,0,1>> filter_xy;
 std::pair<matrix<float,0,1>,matrix<float,0,1>> filter_yy;
 long the_scale;
 };
// ----------------------------------------------------------------------------------------
 namespace impl
 {
 // Shared implementation of find_bright_lines() and find_dark_lines().
 //
 // xx_, xy_ and yy_ hold, per pixel, the entries of the symmetric 2x2 matrix
 //     H = [xx xy]
 //         [xy yy]
 // and must all have the same dimensions.  horz_ and vert_ are resized to those
 // dimensions and must hold float or double pixels.
 //
 // Let s = positive_if_should_find_dark_lines.  For every pixel this routine
 // computes lambda, the largest eigenvalue of s*H (clamped so it is never
 // negative), and writes into (horz_, vert_) a vector that lies along the
 // corresponding eigenvector and has length lambda.  With s == -1 the largest
 // eigenvalue of s*H is minus the smallest eigenvalue of H.
 template <
 typename in_image_type,
 typename out_image_type
 >
 void find_lines(
 const in_image_type& xx_,
 const in_image_type& xy_,
 const in_image_type& yy_,
 out_image_type& horz_,
 out_image_type& vert_,
 double positive_if_should_find_dark_lines
 )
 {
 typedef typename image_traits<out_image_type>::pixel_type out_pixel_type;
 static_assert(std::is_same<float,out_pixel_type>::value || std::is_same<double,out_pixel_type>::value,
 "Output images must contain either float or double valued pixels");
 const_image_view<in_image_type> xx(xx_);
 const_image_view<in_image_type> xy(xy_);
 const_image_view<in_image_type> yy(yy_);
 DLIB_CASSERT(xx.nr() == xy.nr());
 DLIB_CASSERT(xx.nr() == yy.nr());
 DLIB_CASSERT(xx.nc() == xy.nc());
 DLIB_CASSERT(xx.nc() == yy.nc());
 image_view<out_image_type> x(horz_);
 image_view<out_image_type> y(vert_);
 x.set_size(xx.nr(), xx.nc());
 y.set_size(xx.nr(), xx.nc());
 // For each pixel, find the largest eigenvalue of the (sign adjusted) matrix and
 // store the associated eigenvector, scaled to that eigenvalue, into [x,y].
 for (long r = 0; r < xx.nr(); ++r)
 {
 for (long c = 0; c < xx.nc(); ++c)
 {
 // Apply the sign so that, when it is negative, lambda below corresponds to
 // the *minimum* eigenvalue of the original matrix.  w1 and w2 are half of
 // the (signed) diagonal entries and w3 is the (signed) off-diagonal entry.
 double w1 = positive_if_should_find_dark_lines*xx[r][c]/2.0;
 double w2 = positive_if_should_find_dark_lines*yy[r][c]/2.0;
 double w3 = positive_if_should_find_dark_lines*xy[r][c];
 // Closed form for the largest eigenvalue of the symmetric matrix
 // [2*w1 w3; w3 2*w2].
 auto lambda = w1 + w2 + std::sqrt((w1-w2)*(w1-w2) + w3*w3);
 // Negative responses are discarded.
 if (lambda < 0)
 lambda = 0;
 if (2*w1!=lambda)
 {
 // Solve (2*w1-lambda)*vx + w3*vy = 0 with vy fixed to 1 to get the
 // eigenvector direction.
 x[r][c] = -w3/(2*w1-lambda);
 y[r][c] = 1;
 // Rescale the vector so that its length equals lambda.
 double norm = std::sqrt(x[r][c]*x[r][c] + y[r][c]*y[r][c]);
 x[r][c] *= lambda/norm;
 y[r][c] *= lambda/norm;
 }
 else
 {
 // The formula above would divide by zero here, so output a vector of
 // length lambda along the first axis instead.
 x[r][c] = lambda;
 y[r][c] = 0;
 }
 }
 }
 }
 }
 /*!
     Runs impl::find_lines() on the second derivative images xx, xy and yy
     with a sign of -1, which selects bright lines.  The result is written to
     horz and vert.
 !*/
 template <
     typename in_image_type,
     typename out_image_type
     >
 void find_bright_lines(
     const in_image_type& xx,
     const in_image_type& xy,
     const in_image_type& yy,
     out_image_type& horz,
     out_image_type& vert
 )
 {
     // impl::find_lines() looks for dark lines when given a positive sign,
     // so bright lines need a negative one.
     const double bright_sign = -1;
     impl::find_lines(xx, xy, yy, horz, vert, bright_sign);
 }
 /*!
     Runs impl::find_lines() on the second derivative images xx, xy and yy
     with a sign of +1, which selects dark lines.  The result is written to
     horz and vert.
 !*/
 template <
     typename in_image_type,
     typename out_image_type
     >
 void find_dark_lines(
     const in_image_type& xx,
     const in_image_type& xy,
     const in_image_type& yy,
     out_image_type& horz,
     out_image_type& vert
 )
 {
     // impl::find_lines() looks for dark lines when given a positive sign.
     const double dark_sign = +1;
     impl::find_lines(xx, xy, yy, horz, vert, dark_sign);
 }
// ----------------------------------------------------------------------------------------
 template <
 typename in_image_type,
 typename out_image_type
 >
 void find_bright_keypoints(
 const in_image_type& xx_,
 const in_image_type& xy_,
 const in_image_type& yy_,
 out_image_type& saliency_
 )
 {
 typedef typename image_traits<out_image_type>::pixel_type out_pixel_type;
 static_assert(std::is_same<float,out_pixel_type>::value || std::is_same<double,out_pixel_type>::value,
 "Output images must contain either float or double valued pixels");
 const_image_view<in_image_type> xx(xx_);
 const_image_view<in_image_type> xy(xy_);
 const_image_view<in_image_type> yy(yy_);
 DLIB_CASSERT(xx.nr() == xy.nr());
 DLIB_CASSERT(xx.nr() == yy.nr());
 DLIB_CASSERT(xx.nc() == xy.nc());
 DLIB_CASSERT(xx.nc() == yy.nc());
 image_view<out_image_type> saliency(saliency_);
 saliency.set_size(xx.nr(), xx.nc());
 for (long r = 0; r < xx.nr(); ++r)
 {
 for (long c = 0; c < xx.nc(); ++c)
 {
 matrix<double,2,2> tmp;
 tmp = xx[r][c], xy[r][c],
 xy[r][c], yy[r][c];
 matrix<double,2,1> e = real_eigenvalues(tmp);
 saliency[r][c] = prod(upperbound(e,0));
 }
 }
 }
// ----------------------------------------------------------------------------------------
 template <
 typename in_image_type,
 typename out_image_type
 >
 void find_dark_keypoints(
 const in_image_type& xx_,
 const in_image_type& xy_,
 const in_image_type& yy_,
 out_image_type& saliency_
 )
 {
 typedef typename image_traits<out_image_type>::pixel_type out_pixel_type;
 static_assert(std::is_same<float,out_pixel_type>::value || std::is_same<double,out_pixel_type>::value,
 "Output images must contain either float or double valued pixels");
 const_image_view<in_image_type> xx(xx_);
 const_image_view<in_image_type> xy(xy_);
 const_image_view<in_image_type> yy(yy_);
 DLIB_CASSERT(xx.nr() == xy.nr());
 DLIB_CASSERT(xx.nr() == yy.nr());
 DLIB_CASSERT(xx.nc() == xy.nc());
 DLIB_CASSERT(xx.nc() == yy.nc());
 image_view<out_image_type> saliency(saliency_);
 saliency.set_size(xx.nr(), xx.nc());
 for (long r = 0; r < xx.nr(); ++r)
 {
 for (long c = 0; c < xx.nc(); ++c)
 {
 matrix<double,2,2> tmp;
 tmp = xx[r][c], xy[r][c],
 xy[r][c], yy[r][c];
 matrix<double,2,1> e = real_eigenvalues(tmp);
 saliency[r][c] = prod(lowerbound(e,0));
 }
 }
 }
// ----------------------------------------------------------------------------------------
}
#endif // DLIB_EDGE_DETECTOr_