Commit 25e976fe authored by Davis King's avatar Davis King

fleshed out this spec

parent 1c1acac9
// Copyright (C) 2011 Davis E. King (davis@dlib.net)
// License: Boost Software License See LICENSE.txt for the full license.
#undef DLIB_ASSIGNMENT_FuNCTION_ABSTRACT_H__
#ifdef DLIB_ASSIGNMENT_FuNCTION_ABSTRACT_H__
#include <vector>
#include "../optimization/max_cost_assignment_abstract.h"
namespace dlib
{
// ----------------------------------------------------------------------------------------
class example_feature_extractor
{
/*!
WHAT THIS OBJECT REPRESENTS
This object defines the interface a feature extractor must implement
if it is to be used with the assignment_function defined at the bottom
of this file.
The model used by assignment_function objects is the following.
Given two sets of objects, the Left Hand Set (LHS) and Right Hand Set (RHS),
find a one-to-one mapping M from LHS into RHS such that:
M == argmax_m sum_{l in LHS} match_score(l,m(l))
Where match_score() returns a scalar value indicating how good it is
to say l maps to the RHS element m(l). Additionally, in this model,
m() is allowed to indicate that l doesn't map to anything, and in this
case it is excluded from the sum.
Finally, match_score() is defined as:
match_score(l,r) == dot(w, PSI(l,r))
where l is an element of LHS, r is an element of RHS, and
w is a parameter vector.
Therefore, a feature extractor defines how the PSI() feature vector
is calculated. In particular, PSI() is defined by the get_features()
method of this class.
THREAD SAFETY
Instances of this object should be thread safe, that is, it should
be safe for multiple threads to make concurrent calls to the member
functions of this object.
!*/
public:
// This type should be a dlib::matrix capable of storing column vectors
// or an unsorted sparse vector type as defined in dlib/svm/sparse_vector_abstract.h.
typedef matrix_or_sparse_vector_type feature_vector_type;
// These two typedefs define the types used to represent an element in
// the left hand and right hand sets. You can use any copyable types here.
typedef user_defined_type_1 lhs_element;
typedef user_defined_type_2 rhs_element;
unsigned long num_features(
) const;
/*!
ensures
- returns the dimensionality of the PSI() feature vector.
!*/
void get_features (
const lhs_element& left,
const rhs_element& right,
feature_vector_type& feats
) const;
/*!
ensures
- #feats == PSI(left,right)
(i.e. This function computes a feature vector which, in some sense,
captures information useful for deciding if matching left to right
is "good").
!*/
};
// ----------------------------------------------------------------------------------------
void serialize(
const example_feature_extractor& item,
std::ostream& out
);
/*!
provides serialization support
!*/
void deserialize(
example_feature_extractor& item,
std::istream& in
);
/*!
provides deserialization support
!*/
// ----------------------------------------------------------------------------------------
// ----------------------------------------------------------------------------------------
template <
typename feature_extractor
>
class assignment_function
{
/*!
REQUIREMENTS ON feature_extractor
It must be an object that implements an interface compatible with
the example_feature_extractor discussed above.
WHAT THIS OBJECT REPRESENTS
This object is a tool for solving the optimal assignment problem given a
user defined method for computing the quality of any particular assignment.
To define this precisely, suppose you have two sets of objects, a
Left Hand Set (LHS) and a Right Hand Set (RHS) and you want to
find a one-to-one mapping M from LHS into RHS such that:
M == argmax_m sum_{l in LHS} match_score(l,m(l))
Where match_score() returns a scalar value indicating how good it is
to say l maps to the RHS element m(l). Additionally, in this model,
m() is allowed to indicate that l doesn't map to anything, and in this
case it is excluded from the sum.
Finally, match_score() must be of the form:
match_score(l,r) == dot(w, PSI(l,r))
where l is an element of LHS, r is an element of RHS, w is a parameter
vector, and PSI() is defined by the feature_extractor template argument.
!*/
public:
typedef typename feature_extractor::lhs_element lhs_element;
typedef typename feature_extractor::rhs_element rhs_element;
typedef std::vector<long> label_type;
typedef label_type result_type;
typedef std::pair<std::vector<lhs_element>, std::vector<rhs_element> > sample_type;
assignment_function(
);
/*!
ensures
- #get_feature_extractor() == feature_extractor()
(i.e. it will have its default value)
- #get_weights().size() == #get_feature_extractor().num_features()
- #get_weights() == 0
- #forces_assignment() == false
!*/
explicit assignment_function(
const matrix<double,0,1>& weights
);
/*!
requires
- feature_extractor().num_features() == weights.size()
ensures
- #get_feature_extractor() == feature_extractor()
(i.e. it will have its default value)
- #get_weights() == weights
- #forces_assignment() == false
!*/
assignment_function(
const feature_extractor& fe,
const matrix<double,0,1>& weights
);
/*!
requires
- fe.num_features() == weights.size()
ensures
- #get_feature_extractor() == fe
- #get_weights() == weights
- #forces_assignment() == false
!*/
assignment_function(
const feature_extractor& fe,
const matrix<double,0,1>& weights,
bool force_assignment
);
/*!
requires
- fe.num_features() == weights.size()
ensures
- #get_feature_extractor() == fe
- #get_weights() == weights
- #forces_assignment() == force_assignment
!*/
const feature_extractor& get_feature_extractor (
) const;
/*!
ensures
- returns the feature extractor used by this object
!*/
const matrix<double,0,1>& get_weights (
) const;
/*!
ensures
- returns the parameter vector (w) associated with this assignment function.
The length of the vector is get_feature_extractor().num_features().
!*/
bool forces_assignment (
) const;
/*!
ensures
- returns true if this object is in the "forced assignment mode" and false
otherwise.
- When deciding how to match LHS to RHS, this object can operate in one of
two modes. In the default mode, this object will indicate that there is
no match for an element of LHS if the best matching element of RHS would
result in a negative match_score(). However, in the "forced assignment mode",
this object will always make the assignment if there is an available
element in RHS regardless of the match_score().
Another way to understand this distinction is to consider an example.
Suppose LHS and RHS both have 10 elements in them. Then in the default
mode, it is possible for this object to indicate that there are anywhere
from 0 to 10 matches between LHS and RHS. However, in forced assignment
mode it will always indicate exactly 10 matches.
!*/
result_type operator()(
const std::vector<lhs_element>& lhs,
const std::vector<rhs_element>& rhs
) const
/*!
ensures
- returns a vector ASSIGN such that:
- ASSIGN.size() == lhs.size()
- if (ASSIGN[i] != -1) then
- lhs[i] is predicted to associate to rhs[ASSIGN[i]].
- else
- lhs[i] doesn't associate with anything in rhs.
!*/
result_type operator() (
const sample_type& item
) const;
/*!
ensures
- returns (*this)(item.first, item.second);
!*/
};
// ----------------------------------------------------------------------------------------
template <
typename feature_extractor
>
void serialize (
const assignment_function<feature_extractor>& item,
std::ostream& out
);
/*!
provides serialization support
!*/
// ----------------------------------------------------------------------------------------
template <
typename feature_extractor
>
void deserialize (
assignment_function<feature_extractor>& item,
std::istream& in
);
/*!
provides deserialization support
!*/
// ----------------------------------------------------------------------------------------
}
#endif // DLIB_ASSIGNMENT_FuNCTION_ABSTRACT_H__
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment