Commit 2b4e363f authored by Davis King

Added the nearest_neighbor_feature_image object.

parent f03906fa
@@ -7,6 +7,7 @@
 #include "image_keypoint/hessian_pyramid.h"
 #include "image_keypoint/hog.h"
 #include "image_keypoint/hashed_feature_image.h"
+#include "image_keypoint/nearest_neighbor_feature_image.h"
 #endif // DLIB_IMAGE_KEYPOINt_H_
This diff is collapsed.
// Copyright (C) 2011 Davis E. King (davis@dlib.net)
// License: Boost Software License See LICENSE.txt for the full license.
#undef DLIB_NEAREST_NEIGHBOR_FeATURE_IMAGE_ABSTRACT_H__
#ifdef DLIB_NEAREST_NEIGHBOR_FeATURE_IMAGE_ABSTRACT_H__
#include <vector>
#include "../algs.h"
namespace dlib
{
// ----------------------------------------------------------------------------------------
template <typename feature_extractor>
class nearest_neighbor_feature_image : noncopyable
{
    /*!
        REQUIREMENTS ON feature_extractor
            - feature_extractor must be an object whose interface is compatible
              with dlib::hog_image.

        INITIAL VALUE
            - size() == 0
            - get_num_dimensions() == 0

        WHAT THIS OBJECT REPRESENTS
            A tool for image feature extraction.  It wraps another image feature
            extractor and turns each of the wrapped extractor's feature vectors
            into a sparse indicator vector.  To do so it looks up the nearest
            neighbor of the feature vector and returns an indicator vector that
            is zero everywhere except at the position identified by that nearest
            neighbor.

        THREAD SAFETY
            Concurrent access to a single instance is not safe and must be
            guarded by a mutex lock.  The one exception is copying the
            configuration (via copy_configuration()) of a
            nearest_neighbor_feature_image to many other threads: copying the
            configuration of a shared object is safe provided no other operation
            is performed on that object at the same time.

        NOTATION
            BASE_FE denotes the base feature_extractor object held inside the
            nearest_neighbor_feature_image.
    !*/

public:

    typedef std::vector<std::pair<unsigned int,double> > descriptor_type;

    nearest_neighbor_feature_image ();
    /*!
        ensures
            - this object is properly initialized
    !*/

    void clear ();
    /*!
        ensures
            - this object is returned to its initial value
    !*/

    void copy_configuration (const feature_extractor& item);
    /*!
        ensures
            - performs BASE_FE.copy_configuration(item)
    !*/

    void copy_configuration (const nearest_neighbor_feature_image& item);
    /*!
        ensures
            - copies every piece of state from item into *this, with the exception
              of state that is populated by load().  Stated precisely: for any two
              nearest_neighbor_feature_image objects H1 and H2, running the
              statements below always leaves both objects in exactly the same
              state.
                H2.copy_configuration(H1);
                H1.load(img);
                H2.load(img);
    !*/

    template <typename image_type>
    inline void load (const image_type& img);
    /*!
        requires
            - image_type == any type that can be supplied to feature_extractor::load()
        ensures
            - performs BASE_FE.load(img)
              i.e. runs feature extraction.  The resulting features are accessed
              through operator(), defined below.
    !*/

    inline unsigned long size () const;
    /*!
        ensures
            - returns BASE_FE.size()
    !*/

    inline long nr () const;
    /*!
        ensures
            - returns BASE_FE.nr()
    !*/

    inline long nc () const;
    /*!
        ensures
            - returns BASE_FE.nc()
    !*/

    inline long get_num_dimensions () const;
    /*!
        ensures
            - returns the dimensionality of the feature vectors produced by
              operator().  For this object that is the number of basis elements,
              i.e. the number of vectors that were given to set_basis().
    !*/

    template <typename vector_type>
    void set_basis (const vector_type& new_basis);
    /*!
        ensures
            - #get_num_dimensions() == new_basis.size()
            - operator(), defined below, will use new_basis when determining
              nearest neighbors.
    !*/

    inline const descriptor_type& operator() (long row, long col) const;
    /*!
        requires
            - 0 <= row < nr()
            - 0 <= col < nc()
            - get_num_dimensions() > 0
        ensures
            - finds the basis element nearest to BASE_FE(row,col) and returns a
              sparse indicator vector that identifies it.
            - Precisely, the returned sparse vector V satisfies:
                - V.size() == 1
                - V[0].first == the index of the basis vector nearest to
                  BASE_FE(row,col), where "nearness" is measured with Euclidean
                  distance.
                - V[0].second == 1
    !*/

    inline const rectangle get_block_rect (long row, long col) const;
    /*!
        ensures
            - returns BASE_FE.get_block_rect(row,col)
              I.e. returns the rectangle indicating which part of the original
              image is associated with a particular feature vector.
    !*/

    inline const point image_to_feat_space (const point& p) const;
    /*!
        ensures
            - returns BASE_FE.image_to_feat_space(p)
              I.e. every local feature is extracted from some point in the input
              image, and this function reports which local feature corresponds to
              image location p.  Put differently, if P == image_to_feat_space(p)
              then (*this)(P.y(),P.x()) == the local feature closest to, or
              centered at, the point p in the input image.  Some image points
              (e.g. border points or points outside the image) may have no
              corresponding feature location; for those the returned point lies
              outside get_rect(*this).
    !*/

    inline const rectangle image_to_feat_space (const rectangle& rect) const;
    /*!
        ensures
            - returns BASE_FE.image_to_feat_space(rect)
              I.e. returns rectangle(image_to_feat_space(rect.tl_corner()), image_to_feat_space(rect.br_corner()));
              (i.e. maps a rectangle from image space to feature space)
    !*/

    inline const point feat_to_image_space (const point& p) const;
    /*!
        ensures
            - returns BASE_FE.feat_to_image_space(p)
              I.e. returns the location in input image space that corresponds to
              the center of the local feature at point p, which makes this the
              inverse of image_to_feat_space().  The inverse may only be
              approximate: more than one image location can map to the same local
              feature, so image_to_feat_space() might not be invertible and this
              function then gives the closest possible result.
    !*/

    inline const rectangle feat_to_image_space (const rectangle& rect) const;
    /*!
        ensures
            - returns BASE_FE.feat_to_image_space(rect)
              I.e. returns rectangle(feat_to_image_space(rect.tl_corner()), feat_to_image_space(rect.br_corner()));
              (i.e. maps a rectangle from feature space to image space)
    !*/

};
// ----------------------------------------------------------------------------------------
template <typename T>
void serialize (const nearest_neighbor_feature_image<T>& item, std::ostream& out);
/*!
    provides serialization support for nearest_neighbor_feature_image objects
    (takes the object as item and the output stream as out)
!*/
template <typename T>
void deserialize (nearest_neighbor_feature_image<T>& item, std::istream& in);
/*!
    provides deserialization support for nearest_neighbor_feature_image objects
    (takes the object to populate as item and the input stream as in)
!*/
// ----------------------------------------------------------------------------------------
}
#endif // DLIB_NEAREST_NEIGHBOR_FeATURE_IMAGE_ABSTRACT_H__
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment