Added the nearest_neighbor_feature_image object.

2b4e363f · Davis King · f03906fa · 2b4e363f · 2b4e363f · 2b4e363f
Commit 2b4e363f authored Jan 01, 2012 by Davis King
3 changed files
--- a/dlib/image_keypoint.h
+++ b/dlib/image_keypoint.h
@@ -7,6 +7,7 @@
 #include "image_keypoint/hessian_pyramid.h"
 #include "image_keypoint/hog.h"
 #include "image_keypoint/hashed_feature_image.h"
+#include "image_keypoint/nearest_neighbor_feature_image.h"
 #endif // DLIB_IMAGE_KEYPOINt_H_
--- a/dlib/image_keypoint/nearest_neighbor_feature_image.h
+++ b/dlib/image_keypoint/nearest_neighbor_feature_image.h
--- a/dlib/image_keypoint/nearest_neighbor_feature_image_abstract.h
+++ b/dlib/image_keypoint/nearest_neighbor_feature_image_abstract.h
+// Copyright (C) 2011  Davis E. King (davis@dlib.net)
+// License: Boost Software License   See LICENSE.txt for the full license.
+#undef DLIB_NEAREST_NEIGHBOR_FeATURE_IMAGE_ABSTRACT_H__
+#ifdef DLIB_NEAREST_NEIGHBOR_FeATURE_IMAGE_ABSTRACT_H__
+#include <vector>
+#include "../algs.h"
+namespace dlib
+{
+// ----------------------------------------------------------------------------------------
+    template <
+        typename feature_extractor
+        >
+    class nearest_neighbor_feature_image : noncopyable
+    {
+        /*!
+            REQUIREMENTS ON feature_extractor 
+                - must be an object with an interface compatible with dlib::hog_image
+            INITIAL VALUE
+                - size() == 0
+                - get_num_dimensions() == 0
+            WHAT THIS OBJECT REPRESENTS
+                This object is a tool for performing image feature extraction.  In
+                particular, it wraps another image feature extractor and converts
+                the wrapped image feature vectors into sparse indicator vectors.  It does
+                this by finding, for each feature vector, the nearest neighbor among the
+                basis vectors supplied via set_basis() and returning an indicator vector 
+                that is zero everywhere except for the position indicated by the nearest 
+                neighbor.  
+            THREAD SAFETY
+                Concurrent access to an instance of this object is not safe and should be protected
+                by a mutex lock except for the case where you are copying the configuration 
+                (via copy_configuration()) of a nearest_neighbor_feature_image object to many other 
+                threads.  In this case, it is safe to copy the configuration of a shared object so 
+                long as no other operations are performed on it.
+            NOTATION 
+                - let BASE_FE denote the base feature_extractor object contained inside 
+                  the nearest_neighbor_feature_image.
+                - descriptor_type is the sparse vector type returned by operator().  Each 
+                  element is an (index, value) pair, where the index identifies a basis 
+                  element and the value is the corresponding entry of the indicator vector.
+        !*/
+    public:
+        typedef std::vector<std::pair<unsigned int,double> > descriptor_type;
+        nearest_neighbor_feature_image (
+        ); 
+        /*!
+            ensures
+                - this object is properly initialized
+                  (see INITIAL VALUE above: #size() == 0 and #get_num_dimensions() == 0)
+        !*/
+        void clear (
+        );
+        /*!
+            ensures
+                - this object will have its initial value
+                  (i.e. #size() == 0 and #get_num_dimensions() == 0)
+        !*/
+        void copy_configuration (
+            const feature_extractor& item
+        );
+        /*!
+            ensures
+                - performs BASE_FE.copy_configuration(item)
+                  I.e. only the wrapped feature extractor is configured from item.
+        !*/
+        void copy_configuration (
+            const nearest_neighbor_feature_image& item
+        );
+        /*!
+            ensures
+                - copies all the state information of item into *this, except for state 
+                  information populated by load().  More precisely, given two 
+                  nearest_neighbor_feature_image objects H1 and H2, the following sequence 
+                  of instructions should always result in both of them having the exact 
+                  same state.
+                    H2.copy_configuration(H1);
+                    H1.load(img);
+                    H2.load(img);
+                - NOTE(review): by the guarantee above, the basis given to set_basis() 
+                  appears to be part of the copied configuration -- confirm against the 
+                  implementation.
+        !*/
+        template <
+            typename image_type
+            >
+        inline void load (
+            const image_type& img
+        );
+        /*!
+            requires
+                - image_type == any type that can be supplied to feature_extractor::load() 
+            ensures
+                - performs BASE_FE.load(img)
+                  i.e. does feature extraction.  The features can be accessed using
+                  operator() as defined below.
+        !*/
+        inline unsigned long size (
+        ) const;
+        /*!
+            ensures
+                - returns BASE_FE.size() 
+        !*/
+        inline long nr (
+        ) const;
+        /*!
+            ensures
+                - returns BASE_FE.nr() 
+        !*/
+        inline long nc (
+        ) const;
+        /*!
+            ensures
+                - returns BASE_FE.nc() 
+        !*/
+        inline long get_num_dimensions (
+        ) const;
+        /*!
+            ensures
+                - returns the dimensionality of the feature vectors returned by operator().  
+                  In this case, this is the number of basis elements.  That is, it is the number
+                  of vectors given to the set_basis() member function.
+                - this value is 0 for an object that has its initial value (see INITIAL 
+                  VALUE above).
+        !*/
+        template <typename vector_type>
+        void set_basis (
+            const vector_type& new_basis
+        );
+        /*!
+            requires
+                - vector_type provides a size() member (it is used in the ensures clause 
+                  below).
+                - NOTE(review): presumably each element of new_basis must have the same 
+                  dimensionality as the feature vectors produced by BASE_FE; this is not 
+                  stated here -- confirm against the implementation.
+            ensures
+                - #get_num_dimensions() == new_basis.size()
+                - The operator() member function defined below will use new_basis to 
+                  determine nearest neighbors.
+        !*/
+        inline const descriptor_type& operator() (
+            long row,
+            long col
+        ) const;
+        /*!
+            requires
+                - 0 <= row < nr()
+                - 0 <= col < nc()
+                - get_num_dimensions() > 0
+                  (i.e. a non-empty basis has been supplied via set_basis())
+            ensures
+                - determines which basis element is nearest to BASE_FE(row,col) and returns a sparse
+                  indicator vector identifying the nearest neighbor. 
+                - To be precise, this function returns a sparse vector V such that:
+                    - V.size() == 1 
+                    - V[0].first == the index of the basis vector nearest to BASE_FE(row,col).
+                      "Nearness" is determined using Euclidean distance.
+                    - V[0].second == 1 
+                - NOTE(review): the result is returned by const reference; how long the 
+                  referenced vector remains valid (e.g. across subsequent calls) is not 
+                  specified here -- confirm before holding on to it.
+        !*/
+        inline const rectangle get_block_rect (
+            long row,
+            long col
+        ) const;
+        /*!
+            ensures
+                - returns BASE_FE.get_block_rect(row,col)
+                  I.e. returns a rectangle that tells you what part of the original image is associated
+                  with a particular feature vector.
+                - NOTE(review): no preconditions on row and col are listed here; presumably 
+                  those of BASE_FE.get_block_rect() apply -- confirm.
+        !*/
+        inline const point image_to_feat_space (
+            const point& p
+        ) const;
+        /*!
+            ensures
+                - returns BASE_FE.image_to_feat_space(p)
+                  I.e. Each local feature is extracted from a certain point in the input image.
+                  This function returns the identity of the local feature corresponding
+                  to the image location p.  Or in other words, let P == image_to_feat_space(p), 
+                  then (*this)(P.y(),P.x()) == the local feature closest to, or centered at, 
+                  the point p in the input image.  Note that some image points might not have 
+                  corresponding feature locations.  E.g. border points or points outside the 
+                  image.  In these cases the returned point will be outside get_rect(*this).
+        !*/
+        inline const rectangle image_to_feat_space (
+            const rectangle& rect
+        ) const;
+        /*!
+            ensures
+                - returns BASE_FE.image_to_feat_space(rect)
+                  I.e. returns rectangle(image_to_feat_space(rect.tl_corner()), image_to_feat_space(rect.br_corner()));
+                  (i.e. maps a rectangle from image space to feature space)
+        !*/
+        inline const point feat_to_image_space (
+            const point& p
+        ) const;
+        /*!
+            ensures
+                - returns BASE_FE.feat_to_image_space(p)
+                  I.e. returns the location in the input image space corresponding to the center
+                  of the local feature at point p.  In other words, this function computes
+                  the inverse of image_to_feat_space().  Note that it may only do so approximately, 
+                  since more than one image location might correspond to the same local feature.  
+                  That is, image_to_feat_space() might not be invertible so this function gives 
+                  the closest possible result.
+        !*/
+        inline const rectangle feat_to_image_space (
+            const rectangle& rect
+        ) const;
+        /*!
+            ensures
+                - returns BASE_FE.feat_to_image_space(rect)
+                  I.e. returns rectangle(feat_to_image_space(rect.tl_corner()), feat_to_image_space(rect.br_corner()));
+                  (i.e. maps a rectangle from feature space to image space)
+        !*/
+    };
+// ----------------------------------------------------------------------------------------
+    template <typename T>
+    void serialize (
+        const nearest_neighbor_feature_image<T>& item,
+        std::ostream& out
+    );
+    /*!
+        provides serialization support for nearest_neighbor_feature_image objects.
+        item is the object to be serialized and out is the output stream it is 
+        serialized to.
+    !*/
+    template <typename T>
+    void deserialize (
+        nearest_neighbor_feature_image<T>& item,
+        std::istream& in 
+    );
+    /*!
+        provides deserialization support for nearest_neighbor_feature_image objects.
+        item is the object that receives the deserialized state and in is the input 
+        stream it is read from.
+    !*/
+// ----------------------------------------------------------------------------------------
+}
+#endif // DLIB_NEAREST_NEIGHBOR_FeATURE_IMAGE_ABSTRACT_H__