fleshed out this spec

25e976fe · Davis King · 1c1acac9 · 25e976fe
Commit 25e976fe authored Dec 04, 2011 by Davis King
Hide whitespace changes
Inline Side-by-side

Showing with 278 additions and 0 deletions

assignment_function_abstract.h dlib/svm/assignment_function_abstract.h +278 -0

No files found.
--- a/dlib/svm/assignment_function_abstract.h
+++ b/dlib/svm/assignment_function_abstract.h
+// Copyright (C) 2011  Davis E. King (davis@dlib.net)
+// License: Boost Software License   See LICENSE.txt for the full license.
+#undef DLIB_ASSIGNMENT_FuNCTION_ABSTRACT_H__
+#ifdef DLIB_ASSIGNMENT_FuNCTION_ABSTRACT_H__
+#include <vector>
+#include "../optimization/max_cost_assignment_abstract.h"
+namespace dlib
+{
+// ----------------------------------------------------------------------------------------
+    class example_feature_extractor
+    {
+        /*!
+            WHAT THIS OBJECT REPRESENTS
+                This object defines the interface a feature extractor must implement
+                if it is to be used with the assignment_function defined at the bottom
+                of this file.  
+                The model used by assignment_function objects is the following.  
+                Given two sets of objects, the Left Hand Set (LHS) and Right Hand Set (RHS),
+                find a one-to-one mapping M from LHS into RHS such that:
+                    M == argmax_m  sum_{l in LHS} match_score(l,m(l))
+                Where match_score() returns a scalar value indicating how good it is
+                to say l maps to the RHS element m(l).  Additionally, in this model, 
+                m() is allowed to indicate that l doesn't map to anything, and in this 
+                case it is excluded from the sum.    
+                Finally, match_score() is defined as: 
+                    match_score(l,r) == dot(w, PSI(l,r))
+                where l is an element of LHS, r is an element of RHS, and
+                w is a parameter vector.
+                Therefore, a feature extractor defines how the PSI() feature vector 
+                is calculated.  In particular, PSI() is defined by the get_features()
+                method of this class.
+            THREAD SAFETY
+                Instances of this object should be thread safe, that is, it should 
+                be safe for multiple threads to make concurrent calls to the member 
+                functions of this object.
+        !*/
+    public:
+        // This type should be a dlib::matrix capable of storing column vectors
+        // or an unsorted sparse vector type as defined in dlib/svm/sparse_vector_abstract.h.
+        typedef matrix_or_sparse_vector_type feature_vector_type;
+        // These two typedefs define the types used to represent an element in 
+        // the left hand and right hand sets.  You can use any copyable types here.
+        typedef user_defined_type_1 lhs_element;
+        typedef user_defined_type_2 rhs_element;
+        unsigned long num_features(
+        ) const;
+        /*!
+            ensures
+                - returns the dimensionality of the PSI() feature vector.  
+        !*/
+        void get_features (
+            const lhs_element& left,
+            const rhs_element& right,
+            feature_vector_type& feats
+        ) const;
+        /*!
+            ensures
+                - #feats == PSI(left,right)
+                  (i.e. This function computes a feature vector which, in some sense, 
+                  captures information useful for deciding if matching left to right 
+                  is "good").
+        !*/
+    };
+// ----------------------------------------------------------------------------------------
+    void serialize(
+        const example_feature_extractor& item,
+        std::ostream& out
+    );
+    /*!
+        provides serialization support 
+    !*/
+    void deserialize(
+        example_feature_extractor& item, 
+        std::istream& in
+    );
+    /*!
+        provides deserialization support 
+    !*/
+// ----------------------------------------------------------------------------------------
+// ----------------------------------------------------------------------------------------
+    template <
+        typename feature_extractor 
+        >
+    class assignment_function
+    {
+        /*!
+            REQUIREMENTS ON feature_extractor
+                It must be an object that implements an interface compatible with 
+                the example_feature_extractor discussed above.
+            WHAT THIS OBJECT REPRESENTS
+                This object is a tool for solving the optimal assignment problem given a 
+                user defined method for computing the quality of any particular assignment. 
+                To define this precisely, suppose you have two sets of objects, a 
+                Left Hand Set (LHS) and a Right Hand Set (RHS) and you want to 
+                find a one-to-one mapping M from LHS into RHS such that:
+                    M == argmax_m  sum_{l in LHS} match_score(l,m(l))
+                Where match_score() returns a scalar value indicating how good it is
+                to say l maps to the RHS element m(l).  Additionally, in this model, 
+                m() is allowed to indicate that l doesn't map to anything, and in this 
+                case it is excluded from the sum.    
+                Finally, match_score() must be of the form: 
+                    match_score(l,r) == dot(w, PSI(l,r))
+                where l is an element of LHS, r is an element of RHS, w is a parameter 
+                vector, and PSI() is defined by the feature_extractor template argument.  
+        !*/
+    public:
+        typedef typename feature_extractor::lhs_element  lhs_element;
+        typedef typename feature_extractor::rhs_element  rhs_element;
+        typedef          std::vector<long>               label_type;
+        typedef          label_type                      result_type;
+        typedef std::pair<std::vector<lhs_element>, std::vector<rhs_element> > sample_type;
+        assignment_function(
+        );
+        /*!
+            ensures
+                - #get_feature_extractor() == feature_extractor() 
+                  (i.e. it will have its default value)
+                - #get_weights().size() == #get_feature_extractor().num_features()
+                - #get_weights() == 0
+                - #forces_assignment() == false 
+        !*/
+        explicit assignment_function(
+            const matrix<double,0,1>& weights
+        );
+        /*!
+            requires
+                - feature_extractor().num_features() == weights.size()
+            ensures
+                - #get_feature_extractor() == feature_extractor() 
+                  (i.e. it will have its default value)
+                - #get_weights() == weights
+                - #forces_assignment() == false 
+        !*/
+        assignment_function(
+            const feature_extractor& fe,
+            const matrix<double,0,1>& weights
+        );
+        /*!
+            requires
+                - fe.num_features() == weights.size()
+            ensures
+                - #get_feature_extractor() == fe
+                - #get_weights() == weights
+                - #forces_assignment() == false 
+        !*/
+        assignment_function(
+            const feature_extractor& fe,
+            const matrix<double,0,1>& weights,
+            bool force_assignment
+        );
+        /*!
+            requires
+                - fe.num_features() == weights.size()
+            ensures
+                - #get_feature_extractor() == fe
+                - #get_weights() == weights
+                - #forces_assignment() == force_assignment
+        !*/
+        const feature_extractor& get_feature_extractor (
+        ) const;
+        /*!
+            ensures
+                - returns the feature extractor used by this object
+        !*/
+        const matrix<double,0,1>& get_weights (
+        ) const;
+        /*!
+            ensures
+                - returns the parameter vector (w) associated with this assignment function. 
+                  The length of the vector is get_feature_extractor().num_features().  
+        !*/
+        bool forces_assignment (
+        ) const; 
+        /*!
+            ensures
+                - returns true if this object is in the "forced assignment mode" and false
+                  otherwise.
+                - When deciding how to match LHS to RHS, this object can operate in one of 
+                  two modes.  In the default mode, this object will indicate that there is 
+                  no match for an element of LHS if the best matching element of RHS would 
+                  result in a negative match_score().  However, in the "forced assignment mode", 
+                  this object will always make the assignment if there is an available 
+                  element in RHS regardless of the match_score().
+                  Another way to understand this distinction is to consider an example.  
+                  Suppose LHS and RHS both have 10 elements in them.  Then in the default
+                  mode, it is possible for this object to indicate that there are anywhere
+                  from 0 to 10 matches between LHS and RHS.  However, in forced assignment
+                  mode it will always indicate exactly 10 matches.   
+        !*/
+        result_type operator()(
+            const std::vector<lhs_element>& lhs,
+            const std::vector<rhs_element>& rhs 
+        ) const
+        /*!
+            ensures
+                - returns a vector ASSIGN such that:
+                    - ASSIGN.size() == lhs.size()
+                    - if (ASSIGN[i] != -1) then
+                        - lhs[i] is predicted to associate to rhs[ASSIGN[i]].
+                    - else
+                        - lhs[i] doesn't associate with anything in rhs.
+        !*/
+        result_type operator() (
+            const sample_type& item
+        ) const;
+        /*!
+            ensures
+                - returns (*this)(item.first, item.second);
+        !*/
+    };
+// ----------------------------------------------------------------------------------------
+    template <
+        typename feature_extractor
+        >
+    void serialize (
+        const assignment_function<feature_extractor>& item,
+        std::ostream& out
+    );
+    /*!
+        provides serialization support 
+    !*/
+// ----------------------------------------------------------------------------------------
+    template <
+        typename feature_extractor
+        >
+    void deserialize (
+        assignment_function<feature_extractor>& item,
+        std::istream& in 
+    );
+    /*!
+        provides deserialization support 
+    !*/
+// ----------------------------------------------------------------------------------------
+}
+#endif // DLIB_ASSIGNMENT_FuNCTION_ABSTRACT_H__