# HG changeset patch # User Dmitriy Morozov <dmitriy@mrzv.org> # Date 1336781215 25200 # Node ID 870865d25958261b35211eeb0ddf43606acee65a # Parent 3a3dd22a98d9b2318f632dc6b31c9e7f2c54f4c9# Parent 021030a8f97c7c224a49c02d1f3489d1885b4969 Merge diff -r 3a3dd22a98d9 -r 870865d25958 bindings/python/CMakeLists.txt diff -r 3a3dd22a98d9 -r 870865d25958 bindings/python/dionysus/__init__.py --- a/bindings/python/dionysus/__init__.py Tue May 08 13:07:28 2012 -0700 +++ b/bindings/python/dionysus/__init__.py Fri May 11 17:06:55 2012 -0700 @@ -34,15 +34,11 @@ def vertex_dim_cmp(s1, s2): return cmp(s1.dimension(), s2.dimension()) or vertex_cmp(s1, s2) -# TBD: Port this into C++ -def point_iterator( point ): - - yield point.x - yield point.y - if not point.data is None: - yield point.data - -Point.__iter__ = point_iterator +def fill_alpha_complex(points, simplices): + if len(points[0]) == 2: # 2D + fill_alpha2D_complex(points, simplices) + elif len(points[0]) == 3: # 3D + fill_alpha3D_complex(points, simplices) def closure(simplices, k): """Compute the k-skeleton of the closure of the list of simplices.""" diff -r 3a3dd22a98d9 -r 870865d25958 bindings/python/filtration.h --- a/bindings/python/filtration.h Tue May 08 13:07:28 2012 -0700 +++ b/bindings/python/filtration.h Fri May 11 17:06:55 2012 -0700 @@ -8,7 +8,7 @@ namespace bp = boost::python; -namespace dionysus { +namespace dionysus { namespace python { typedef Filtration<SimplexVD> PythonFiltration; diff -r 3a3dd22a98d9 -r 870865d25958 bindings/python/persistence-diagram.cpp --- a/bindings/python/persistence-diagram.cpp Tue May 08 13:07:28 2012 -0700 +++ b/bindings/python/persistence-diagram.cpp Fri May 11 17:06:55 2012 -0700 @@ -1,41 +1,88 @@ #include<topology/persistence-diagram.h> #include<utilities/types.h> +#include "filtration.h" +#include "simplex.h" +#include "static-persistence.h" +#include "dynamic-persistence.h" + +#include <boost/foreach.hpp> + #include<boost/python.hpp> #include<boost/python/init.hpp> #include<boost/shared_ptr.hpp> #include<boost/python/stl_iterator.hpp> #include<boost/python/def.hpp> - - namespace bp = boost::python; namespace dionysus{ namespace python{ -typedef bp::object Data; -typedef PDPoint<Data> PointD; -typedef PersistenceDiagram<Data> PersistenceDiagramD; +typedef bp::object Data; +typedef PersistenceDiagram<Data> PersistenceDiagramD; +typedef PersistenceDiagramD::Point PointD; +typedef boost::shared_ptr<PersistenceDiagramD> PDgmPtr; } } //namespace dionysus::python namespace dp = dionysus::python; -// Easy way out of overloads -RealType get_x (const dp::PointD& p) { return p.x(); } -RealType get_y (const dp::PointD& p) { return p.y(); } -bp::object get_data(const dp::PointD& p) { return p.data(); } +struct PointFromTupleConverter +{ + PointFromTupleConverter() + { + boost::python::converter::registry::push_back(&convertible, + &construct, + boost::python::type_id<dp::PointD>()); + } + + static void* convertible(PyObject* obj_ptr) + { + if (!PyTuple_Check(obj_ptr)) return 0; + if (PyTuple_Size(obj_ptr) < 2) return 0; + return obj_ptr; + } + + static void construct(PyObject* obj_ptr, + boost::python::converter::rvalue_from_python_stage1_data* data) + { + //const char* value = PyString_AsString(obj_ptr); + //if (value == 0) boost::python::throw_error_already_set(); + + // Grab pointer to memory into which to construct the new T + void* storage = ( (boost::python::converter::rvalue_from_python_storage<dp::PointD>*) data)->storage.bytes; + + RealType x = bp::extract<RealType>(PyTuple_GetItem(obj_ptr, 0)); + RealType y = bp::extract<RealType>(PyTuple_GetItem(obj_ptr, 1)); + + // in-place construct the new T using the character data extraced from the python object + dp::PointD* p = new (storage) dp::PointD(x,y); + + if (PyTuple_Size(obj_ptr) > 2) + p->data() = bp::extract<bp::object>(PyTuple_GetItem(obj_ptr, 2)); + + // Stash the memory chunk pointer for later use by boost.python + data->convertible = storage; + } +}; + +struct PointToTupleConverter +{ + static PyObject* convert(const dp::PointD& p) + { + if (p.data().ptr() == bp::object().ptr()) + return bp::incref(bp::make_tuple(p.x(), p.y()).ptr()); + else + return bp::incref(bp::make_tuple(p.x(), p.y(), p.data()).ptr()); + } +}; + void export_point( ) { - bp::class_<dp::PointD>("Point") - .def( bp::init<RealType, RealType, bp::optional<dp::Data> >()) - .add_property("x", &get_x) - .add_property("y", &get_y) - .add_property("data", &get_data) - .def( repr(bp::self)) - ; + PointFromTupleConverter(); + bp::to_python_converter<dp::PointD, PointToTupleConverter>(); } @@ -55,11 +102,106 @@ RealType bottleneck_distance_adapter(const dp::PersistenceDiagramD& dgm1, const dp::PersistenceDiagramD& dgm2) { return bottleneck_distance(dgm1, dgm2); -} +} + + +template<class Persistence> +struct InitDiagrams +{ + typedef std::map<int, dp::PDgmPtr> DiagramMap; + typedef typename Persistence::template SimplexMap<dp::PythonFiltration> SMap; + + struct DataEvaluator + { + DataEvaluator(const SMap& smap_): + smap(smap_) {} + + template<class Key> + RealType operator()(Key k) const { return bp::extract<RealType>(smap[k].data()); } + + const SMap& smap; + }; + + struct PythonEvaluator + { + PythonEvaluator(const SMap& smap_, bp::object eval_): + smap(smap_), eval(eval_) {} + + template<class Key> + RealType operator()(Key k) const { return bp::extract<RealType>(eval(smap[k])); } + + const SMap& smap; + bp::object eval; + }; + + // A hack + struct DiagramMapOwner: public DiagramMap + { + typedef dp::PersistenceDiagramD mapped_type; + + mapped_type& operator[](Dimension d) + { + if (this->find(d) == this->end()) + this->insert(std::make_pair(d, dp::PDgmPtr(new dp::PersistenceDiagramD(d)))); + return *DiagramMap::operator[](d); + } + }; + + static + bp::list extract_list(const DiagramMapOwner& dgms) + { + bp::list result; + size_t dim = 0; + typedef typename DiagramMapOwner::value_type ValType; + BOOST_FOREACH(const ValType& dim_dgm, dgms) + { + while (dim_dgm.first > dim) + { + result.append(dp::PDgmPtr(new dp::PersistenceDiagramD)); + ++dim; + } + + // dim_dgm.first == dim + result.append(dim_dgm.second); + dim++; + } + + return result; + } + + struct PointDataVisitor + { + PointDataVisitor(bp::object data_): data(data_) {} + void point(const typename Persistence::iterator& i, dp::PointD& p) const { p.data() = data(*i); } + bp::object data; + }; + + static + bp::list init(const Persistence& p, const dp::PythonFiltration& f, bp::object eval, bp::object data) + { + + DiagramMapOwner dgms; + SMap smap = p.make_simplex_map(f); + if (eval == bp::object()) + init_diagrams(dgms, p.begin(), p.end(), + DataEvaluator(smap), + evaluate_through_map(smap, dp::SimplexVD::DimensionExtractor())); + else if (data == bp::object()) + init_diagrams(dgms, p.begin(), p.end(), + PythonEvaluator(smap, eval), + evaluate_through_map(smap, dp::SimplexVD::DimensionExtractor())); + else + init_diagrams(dgms, p.begin(), p.end(), + PythonEvaluator(smap, eval), + evaluate_through_map(smap, dp::SimplexVD::DimensionExtractor()), + PointDataVisitor(data)); + return extract_list(dgms); + } +}; void export_persistence_diagram() { - bp::class_<dp::PersistenceDiagramD>("PersistenceDiagram") + bp::class_<dp::PersistenceDiagramD, dp::PDgmPtr>("PersistenceDiagram") .def("__init__", bp::make_constructor(&init_from_points_sequence)) .def( bp::init<Dimension>()) .def("append", &dp::PersistenceDiagramD::push_back) @@ -69,5 +211,17 @@ .def("__len__", &dp::PersistenceDiagramD::size) ; + bp::def("init_diagrams", &InitDiagrams<dp::SPersistence>::init, + (bp::arg("persistence"), + bp::arg("filtration"), + bp::arg("eval")=bp::object(), + bp::arg("data")=bp::object())); + bp::def("init_diagrams", &InitDiagrams<dp::DPersistenceChains>::init, + (bp::arg("persistence"), + bp::arg("filtration"), + bp::arg("eval")=bp::object(), + bp::arg("data")=bp::object())); + bp::def("bottleneck_distance", &bottleneck_distance_adapter); + bp::def("wasserstein_distance", &wasserstein_distance<dp::PersistenceDiagramD>); } diff -r 3a3dd22a98d9 -r 870865d25958 bindings/python/static-persistence.cpp --- a/bindings/python/static-persistence.cpp Tue May 08 13:07:28 2012 -0700 +++ b/bindings/python/static-persistence.cpp Fri May 11 17:06:55 2012 -0700 @@ -11,7 +11,11 @@ namespace dp = dionysus::python; -void pair_simplices(dp::SPersistence& sp) { sp.pair_simplices(false); } +void pair_simplices(dp::SPersistence& sp, bool store_negative) +{ + dp::SPersistence::PairVisitorNoProgress visitor; + sp.pair_simplices(sp.begin(), sp.end(), store_negative, visitor); +} void export_static_persistence() @@ -25,8 +29,8 @@ bp::class_<dp::SPersistence>("StaticPersistence", bp::no_init) .def("__init__", bp::make_constructor(&dp::init_from_filtration<dp::SPersistence>)) - - .def("pair_simplices", &pair_simplices) + + .def("pair_simplices", &pair_simplices, (bp::args("store_negative")=false)) .def("__call__", &dp::distance<dp::SPersistence, dp::SPersistenceIndex>) .def("make_simplex_map",&dp::SPersistence::make_simplex_map<dp::PythonFiltration>) diff -r 3a3dd22a98d9 -r 870865d25958 doc/python/alphashapes.rst --- a/doc/python/alphashapes.rst Tue May 08 13:07:28 2012 -0700 +++ b/doc/python/alphashapes.rst Fri May 11 17:06:55 2012 -0700 @@ -15,13 +15,18 @@ .. _`Delaunay triangulation`: http://en.wikipedia.org/wiki/Delaunay_triangulation +.. function:: fill_alpha_complex(points, complex) + + Based on the dimension of the first point, decides which of the two functions + below to call. + .. function:: fill_alpha2D_complex(points, complex) - + Appends to the `complex` the simplices of the 2D Delaunay triangulation on the `points`. .. function:: fill_alpha3D_complex(points, complex) - + Appends to the `complex` the simplices of the 3D Delaunay triangulation on the `points`. diff -r 3a3dd22a98d9 -r 870865d25958 doc/python/persistence-diagram.rst --- a/doc/python/persistence-diagram.rst Tue May 08 13:07:28 2012 -0700 +++ b/doc/python/persistence-diagram.rst Fri May 11 17:06:55 2012 -0700 @@ -4,20 +4,24 @@ .. class:: PersistenceDiagram .. method:: __init__( dimension ) - + Initializes : an empty( no points ) :class:`PersistenceDiagram` object and sets the :attr:`~PersistenceDiagram.dimension` attribute( must be integer ) e.g.:: - + dia = PersistenceDiagram( 1 ) .. method:: __init__( dimension, point_seq ) - - Initializes :class:`PersistenceDiagram` of specified dimension from the given sequence `seq` of :class:`Point` objects, e.g.:: - - dia = PersistenceDiagram( 1, [Point(1,2)] ) + + Initializes :class:`PersistenceDiagram` of specified dimension from the given sequence `seq` of tuples, e.g.:: + + dia = PersistenceDiagram( 1, (1,2) ) + + The tuples must have at least 2 elements ``(birth, death)``. + If there is a third element, it is stored as extra data associated to + a point. .. method:: append( p ) - + Adds point `p` to the persistence diagram. .. attribute:: dimension @@ -28,7 +32,7 @@ Iterator over the points in the persistence diagram, e.g.:: - + for p in dia: print p .. method:: __len__( ) @@ -40,42 +44,24 @@ Utility functions for persistence diagrams -------------------------------------------- +.. function:: init_diagrams(persistence, filtration[, eval = lambda s: s.data[, data = lambda i: None]]) + + Initializes a collection of :class:`PersistenceDiagram` instances from `persistence` + and `filtration`. Optional `eval` can determine how to extract birth and + death values from a simplex. For example, if `filtration` was filled using + :func:`fill_alpha_complex()`, the :attr:`~Simplex.data` contains a pair ``(value, critical)``. + We can extract the ``value`` from the tuple:: + + init_diagrams(persistence, filtration, lambda s: s.data[0]) + + Optional `data` argument can return arbitrary data to associate with each point, + given an node of `persistence`. .. function:: bottleneck_distance(dia1, dia2) - - Calculates the bottleneck distance between the two persistence diagrams. - - -.. class:: Point - - .. method:: __init__( x, y [, data]) - - Initializes :class:`Point` with the given real-valued coordinates and - optionally real value `data`, e.g.:: - - s = Point( 1, 1.1, 1.11 ) - - .. attribute:: x - - x coordinate of the point + Calculates the bottleneck distance between the two persistence diagrams. - .. attribute:: y - - y coordinate of the point - - .. attribute:: data - - Real value stored in the simplex. - - .. method:: __iter__( ) +.. function:: wasserstein_distance(dia1, dia2, p) - Point objects are iterable, returning two or three elements depending on presence of data, e.g.:: - - p = Point( 1, 1.1, 1.11 ) - for i in p: print p + Calculates the `p`-th Wasserstein distance between the two persistence diagrams. - 1 - 1.1 - 1.11 - diff -r 3a3dd22a98d9 -r 870865d25958 doc/python/static-persistence.rst --- a/doc/python/static-persistence.rst Tue May 08 13:07:28 2012 -0700 +++ b/doc/python/static-persistence.rst Fri May 11 17:06:55 2012 -0700 @@ -10,9 +10,10 @@ matrix of the complex captured by the filtration with rows and columns sorted with respect to the filtration ordering. - .. method:: pair_simplices() + .. method:: pair_simplices(store_negative = False) - Pairs simplices using the [ELZ02]_ algorithm. + Pairs simplices using the [ELZ02]_ algorithm. `store_negative` indicates + whether to store the negative simplices in the cycles. .. method:: __call__(i) diff -r 3a3dd22a98d9 -r 870865d25958 examples/triangle/triangle.py --- a/examples/triangle/triangle.py Tue May 08 13:07:28 2012 -0700 +++ b/examples/triangle/triangle.py Fri May 11 17:06:55 2012 -0700 @@ -19,7 +19,7 @@ p = StaticPersistence(f) print "Persistence initialized" -p.pair_simplices() +p.pair_simplices(True) print "Simplices paired" smap = p.make_simplex_map(f) diff -r 3a3dd22a98d9 -r 870865d25958 include/topology/persistence-diagram.h --- a/include/topology/persistence-diagram.h Tue May 08 13:07:28 2012 -0700 +++ b/include/topology/persistence-diagram.h Fri May 11 17:06:55 2012 -0700 @@ -32,7 +32,7 @@ Data& data() { return point_.second(); } std::ostream& operator<<(std::ostream& out) const { return (out << x() << " " << y()); } // << " " << data()); } - + struct Visitor { template<class Iterator> @@ -45,17 +45,17 @@ private: boost::compressed_pair<std::pair<RealType, RealType>, Data> point_; - + private: - /* Serialization */ - friend class boost::serialization::access; - - template<class Archive> - void serialize(Archive& ar, version_type ); + /* Serialization */ + friend class boost::serialization::access; + + template<class Archive> + void serialize(Archive& ar, version_type ); }; template<class Data> -std::ostream& operator<<(std::ostream& out, const PDPoint<Data>& point) +std::ostream& operator<<(std::ostream& out, const PDPoint<Data>& point) { return (point.operator<<(out)); } template<class Point, class Iterator, class Evaluator, class Visitor> @@ -71,7 +71,7 @@ /** * Class: PersistenceDiagram * - * Stores birth-death pairs, i.e. points in the extended plane. Each point can also store + * Stores birth-death pairs, i.e. points in the extended plane. Each point can also store * additional information described by `Data_` template parameter. */ template<class Data_ = Empty<> > @@ -85,24 +85,24 @@ PersistenceDiagram() {} - PersistenceDiagram( Dimension dimension ): + PersistenceDiagram( Dimension dimension ): dimension_( dimension ) {} template<class OtherData> PersistenceDiagram(const PersistenceDiagram<OtherData>& other); template<class Iterator, class Evaluator> - PersistenceDiagram(Iterator bg, Iterator end, + PersistenceDiagram(Iterator bg, Iterator end, const Evaluator& eval = Evaluator()); template<class Iterator, class Evaluator, class Visitor> - PersistenceDiagram(Iterator bg, Iterator end, - const Evaluator& eval = Evaluator(), + PersistenceDiagram(Iterator bg, Iterator end, + const Evaluator& eval = Evaluator(), const Visitor& visitor = Visitor()); template<class Iterator, class Evaluator, class Visitor> - void init(Iterator bg, Iterator end, - const Evaluator& eval = Evaluator(), + void init(Iterator bg, Iterator end, + const Evaluator& eval = Evaluator(), const Visitor& visitor = Visitor()); const_iterator begin() const { return points_.begin(); } @@ -110,7 +110,7 @@ size_t size() const { return points_.size(); } void push_back(const Point& point) { points_.push_back(point); } - + std::ostream& operator<<(std::ostream& out) const; Dimension dimension() const { return dimension_; } @@ -118,57 +118,60 @@ private: PointVector points_; Dimension dimension_; - + private: - /* Serialization */ - friend class boost::serialization::access; - - template<class Archive> - void serialize(Archive& ar, version_type ); + /* Serialization */ + friend class boost::serialization::access; + + template<class Archive> + void serialize(Archive& ar, version_type ); }; template<class Data> -std::ostream& operator<<(std::ostream& out, const PersistenceDiagram<Data>& pd) +std::ostream& operator<<(std::ostream& out, const PersistenceDiagram<Data>& pd) { return (pd.operator<<(out)); } // Function: init_diagram_vector() template<class Diagrams, class Iterator, class Evaluator, class DimensionExtractor> void init_diagrams(Diagrams& diagrams, - Iterator bg, Iterator end, - const Evaluator& evaluator = Evaluator(), + Iterator bg, Iterator end, + const Evaluator& evaluator = Evaluator(), const DimensionExtractor& dimension = DimensionExtractor()); template<class Diagrams, class Iterator, class Evaluator, class DimensionExtractor, class Visitor> void init_diagrams(Diagrams& diagrams, - Iterator bg, Iterator end, - const Evaluator& evaluator = Evaluator(), + Iterator bg, Iterator end, + const Evaluator& evaluator = Evaluator(), const DimensionExtractor& dimension = DimensionExtractor(), const Visitor& visitor = Visitor()); -// Class: Linfty +// Class: Linfty // Functor that computes L infinity norm between two points template<class Point1, class Point2> struct Linfty { - RealType operator()(const Point1& p1, const Point2& p2) const { return std::max(std::abs(p1.x() - p2.x()), + RealType operator()(const Point1& p1, const Point2& p2) const { return std::max(std::abs(p1.x() - p2.x()), std::abs(p1.y() - p2.y())); } - + template<class Point> RealType diagonal(const Point& p) const { return std::abs(p.y() - p.x())/2; } }; // Function: bottleneck_distance(dgm1, dgm2) // Computes bottleneck distance between the two diagrams. -template<class Diagram1, - class Diagram2, +template<class Diagram1, + class Diagram2, class Norm> RealType bottleneck_distance(const Diagram1& dgm1, const Diagram2& dgm2, const Norm& norm = Norm()); -template<class Diagram1, +template<class Diagram1, class Diagram2> RealType bottleneck_distance(const Diagram1& dgm1, const Diagram2& dgm2) { return bottleneck_distance(dgm1, dgm2, Linfty<typename Diagram1::Point, typename Diagram2::Point>()); } +template<class Diagram> +RealType wasserstein_distance(const Diagram& dgm1, const Diagram& dgm2, unsigned p); + #include "persistence-diagram.hpp" diff -r 3a3dd22a98d9 -r 870865d25958 include/topology/persistence-diagram.hpp --- a/include/topology/persistence-diagram.hpp Tue May 08 13:07:28 2012 -0700 +++ b/include/topology/persistence-diagram.hpp Fri May 11 17:06:55 2012 -0700 @@ -1,6 +1,8 @@ #include <boost/serialization/vector.hpp> #include <boost/serialization/nvp.hpp> +#include "utilities/munkres/munkres.h" + using boost::serialization::make_nvp; template<class D> @@ -19,7 +21,7 @@ PersistenceDiagram(const PersistenceDiagram<OtherData>& other) { points_.reserve(other.size()); - for (typename PersistenceDiagram<OtherData>::PointVector::const_iterator cur = points_.begin(); + for (typename PersistenceDiagram<OtherData>::PointVector::const_iterator cur = points_.begin(); cur != points_.end(); ++cur) push_back(Point(cur->x(), cur->y())); } @@ -62,10 +64,10 @@ RealType y = Infinity; if (&*(i->pair) != &*i) y = evaluator(&*(i->pair)); - + Point p(x,y); visitor.point(i, p); - + if (x == y) return boost::optional<Point>(); return p; @@ -73,8 +75,8 @@ template<class Diagrams, class Iterator, class Evaluator, class DimensionExtractor> void init_diagrams(Diagrams& diagrams, - Iterator bg, Iterator end, - const Evaluator& evaluator, + Iterator bg, Iterator end, + const Evaluator& evaluator, const DimensionExtractor& dimension) { // FIXME: this is specialized for Diagrams that is std::map @@ -85,8 +87,8 @@ template<class Diagrams, class Iterator, class Evaluator, class DimensionExtractor, class Visitor> void init_diagrams(Diagrams& diagrams, - Iterator bg, Iterator end, - const Evaluator& evaluator, + Iterator bg, Iterator end, + const Evaluator& evaluator, const DimensionExtractor& dimension, const Visitor& visitor) { @@ -114,27 +116,27 @@ template<class D> template<class Archive> -void +void PDPoint<D>:: -serialize(Archive& ar, version_type ) -{ - ar & make_nvp("x", x()); - ar & make_nvp("y", y()); +serialize(Archive& ar, version_type ) +{ + ar & make_nvp("x", x()); + ar & make_nvp("y", y()); ar & make_nvp("data", data()); } template<class D> template<class Archive> -void +void PersistenceDiagram<D>:: -serialize(Archive& ar, version_type ) -{ - ar & make_nvp("points", points_); +serialize(Archive& ar, version_type ) +{ + ar & make_nvp("points", points_); } /** - * Some structures to compute bottleneck distance between two persistence diagrams (in bottleneck_distance() function below) + * Some structures to compute bottleneck distance between two persistence diagrams (in bottleneck_distance() function below) * by setting up bipartite graphs, and finding maximum cardinality matchings in them using Boost Graph Library. */ #include <boost/iterator/counting_iterator.hpp> @@ -148,7 +150,7 @@ Edge(unsigned v1, unsigned v2, RealType d): Parent(v1, v2), distance(d) {} - bool operator<(const Edge& other) const { return distance < other.distance; } + bool operator<(const Edge& other) const { return distance < other.distance; } RealType distance; }; @@ -172,7 +174,7 @@ // FIXME: the matching is being recomputed from scratch every time, this should be fixed if (i2 > last) - do + do { ++last; boost::add_edge(last->first, last->second, g); @@ -238,10 +240,87 @@ // Perform cardinality based binary search typedef boost::counting_iterator<EV_const_iterator> EV_counting_const_iterator; - EV_counting_const_iterator bdistance = std::upper_bound(EV_counting_const_iterator(edges.begin()), - EV_counting_const_iterator(edges.end()), + EV_counting_const_iterator bdistance = std::upper_bound(EV_counting_const_iterator(edges.begin()), + EV_counting_const_iterator(edges.end()), edges.begin(), CardinaliyComparison(max_size, edges.begin())); - + return (*bdistance)->distance; } + +// Wasserstein distance +template<class Diagram> +RealType +wasserstein_distance(const Diagram& dgm1, const Diagram& dgm2, unsigned p) +{ + typedef RealType Distance; + typedef typename Diagram::Point Point; + typedef Linfty<Point, Point> Norm; + + unsigned size = dgm1.size() + dgm2.size(); + Norm norm; + + // Setup the matrix + Matrix<Distance> m(size,size); + for (unsigned i = 0; i < dgm1.size(); ++i) + for (unsigned j = 0; j < dgm2.size(); ++j) + { + const Point& p1 = *(dgm1.begin() + i); + const Point& p2 = *(dgm2.begin() + j); + m(i,j) = pow(norm(p1, p2), p); + m(j + dgm1.size(), i + dgm2.size()) = 0; + } + + for (unsigned i = 0; i < dgm1.size(); ++i) + for (unsigned j = dgm2.size(); j < size; ++j) + { + const Point& p1 = *(dgm1.begin() + i); + m(i,j) = pow(norm.diagonal(p1), p); + } + + for (unsigned j = 0; j < dgm2.size(); ++j) + for (unsigned i = dgm1.size(); i < size; ++i) + { + const Point& p2 = *(dgm2.begin() + j); + m(i,j) = pow(norm.diagonal(p2), p); + } + + // Compute weighted matching + Munkres munkres; + munkres.solve(m); + + // Assume everything is assigned (i.e., that we have a perfect matching) + Distance sum = 0; + for (unsigned i = 0; i < size; i++) + for (unsigned j = 0; j < size; j++) + if (m(i,j) == 0) + { + //std::cout << i << ": " << j << '\n'; + //sum += m[i][j]; + if (i >= dgm1.size()) + { + if (j >= dgm2.size()) + sum += 0; + else + { + const Point& p2 = *(dgm2.begin() + j); + sum += pow(norm.diagonal(p2), p); + } + } else + { + if (j >= dgm2.size()) + { + const Point& p1 = *(dgm1.begin() + i); + sum += pow(norm.diagonal(p1), p); + } else + { + const Point& p1 = *(dgm1.begin() + i); + const Point& p2 = *(dgm2.begin() + j); + sum += pow(norm(p1, p2), p); + } + } + break; + } + + return sum; +} diff -r 3a3dd22a98d9 -r 870865d25958 include/topology/static-persistence.h --- a/include/topology/static-persistence.h Tue May 08 13:07:28 2012 -0700 +++ b/include/topology/static-persistence.h Fri May 11 17:06:55 2012 -0700 @@ -128,7 +128,6 @@ }; OrderModifier modifier() { return OrderModifier(order()); } - protected: // Function: pair_simplices(bg, end) // Compute persistence of the simplices in filtration between bg and end template<class Visitor> @@ -165,6 +164,7 @@ void finished(iterator j) const {} }; + protected: const Order& order() const { return order_; } Order& order() { return order_; } diff -r 3a3dd22a98d9 -r 870865d25958 include/utilities/munkres/matrix.h --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/include/utilities/munkres/matrix.h Fri May 11 17:06:55 2012 -0700 @@ -0,0 +1,56 @@ +/* + * Copyright (c) 2007 John Weaver + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + */ + +#if !defined(_MATRIX_H_) +#define _MATRIX_H_ + +template <class T> +class Matrix { +public: + Matrix(); + Matrix(int rows, int columns); + Matrix(const Matrix<T> &other); + Matrix<T> & operator= (const Matrix<T> &other); + ~Matrix(); + // all operations except product modify the matrix in-place. + void resize(int rows, int columns); + void identity(void); + void clear(void); + T& operator () (int x, int y); + T trace(void); + Matrix<T>& transpose(void); + Matrix<T> product(Matrix<T> &other); + int minsize(void) { + return ((m_rows < m_columns) ? m_rows : m_columns); + } + int columns(void) { + return m_columns; + } + int rows(void) { + return m_rows; + } +private: + T **m_matrix; + int m_rows; + int m_columns; +}; + +#include "matrix.hpp" + +#endif /* !defined(_MATRIX_H_) */ + diff -r 3a3dd22a98d9 -r 870865d25958 include/utilities/munkres/matrix.hpp --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/include/utilities/munkres/matrix.hpp Fri May 11 17:06:55 2012 -0700 @@ -0,0 +1,231 @@ +/* + * Copyright (c) 2007 John Weaver + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + */ + +#include "matrix.h" + +#include <cassert> +#include <cstdlib> +#include <algorithm> + +/*export*/ template <class T> +Matrix<T>::Matrix() { + m_rows = 0; + m_columns = 0; + m_matrix = NULL; +} + +/*export*/ template <class T> +Matrix<T>::Matrix(const Matrix<T> &other) { + if ( other.m_matrix != NULL ) { + // copy arrays + m_matrix = NULL; + resize(other.m_rows, other.m_columns); + for ( int i = 0 ; i < m_rows ; i++ ) + for ( int j = 0 ; j < m_columns ; j++ ) + m_matrix[i][j] = other.m_matrix[i][j]; + } else { + m_matrix = NULL; + m_rows = 0; + m_columns = 0; + } +} + +/*export*/ template <class T> +Matrix<T>::Matrix(int rows, int columns) { + m_matrix = NULL; + resize(rows, columns); +} + +/*export*/ template <class T> +Matrix<T> & +Matrix<T>::operator= (const Matrix<T> &other) { + if ( other.m_matrix != NULL ) { + // copy arrays + resize(other.m_rows, other.m_columns); + for ( int i = 0 ; i < m_rows ; i++ ) + for ( int j = 0 ; j < m_columns ; j++ ) + m_matrix[i][j] = other.m_matrix[i][j]; + } else { + // free arrays + for ( int i = 0 ; i < m_columns ; i++ ) + delete [] m_matrix[i]; + + delete [] m_matrix; + + m_matrix = NULL; + m_rows = 0; + m_columns = 0; + } + + return *this; +} + +/*export*/ template <class T> +Matrix<T>::~Matrix() { + if ( m_matrix != NULL ) { + // free arrays + for ( int i = 0 ; i < m_rows ; i++ ) + delete [] m_matrix[i]; + + delete [] m_matrix; + } + m_matrix = NULL; +} + +/*export*/ template <class T> +void +Matrix<T>::resize(int rows, int columns) { + if ( m_matrix == NULL ) { + // alloc arrays + m_matrix = new T*[rows]; // rows + for ( int i = 0 ; i < rows ; i++ ) + m_matrix[i] = new T[columns]; // columns + + m_rows = rows; + m_columns = columns; + clear(); + } else { + // save array pointer + T **new_matrix; + // alloc new arrays + new_matrix = new T*[rows]; // rows + for ( int i = 0 ; i < rows ; i++ ) { + new_matrix[i] = new T[columns]; // columns + for ( int j = 0 ; j < columns ; j++ ) + new_matrix[i][j] = 0; + } + + // copy data from saved pointer to new arrays + int minrows = std::min<int>(rows, m_rows); + int mincols = std::min<int>(columns, m_columns); + for ( int x = 0 ; x < minrows ; x++ ) + for ( int y = 0 ; y < mincols ; y++ ) + new_matrix[x][y] = m_matrix[x][y]; + + // delete old arrays + if ( m_matrix != NULL ) { + for ( int i = 0 ; i < m_rows ; i++ ) + delete [] m_matrix[i]; + + delete [] m_matrix; + } + + m_matrix = new_matrix; + } + + m_rows = rows; + m_columns = columns; +} + +/*export*/ template <class T> +void +Matrix<T>::identity() { + assert( m_matrix != NULL ); + + clear(); + + int x = std::min<int>(m_rows, m_columns); + for ( int i = 0 ; i < x ; i++ ) + m_matrix[i][i] = 1; +} + +/*export*/ template <class T> +void +Matrix<T>::clear() { + assert( m_matrix != NULL ); + + for ( int i = 0 ; i < m_rows ; i++ ) + for ( int j = 0 ; j < m_columns ; j++ ) + m_matrix[i][j] = 0; +} + +/*export*/ template <class T> +T +Matrix<T>::trace() { + assert( m_matrix != NULL ); + + T value = 0; + + int x = std::min<int>(m_rows, m_columns); + for ( int i = 0 ; i < x ; i++ ) + value += m_matrix[i][i]; + + return value; +} + +/*export*/ template <class T> +Matrix<T>& +Matrix<T>::transpose() { + assert( m_rows > 0 ); + assert( m_columns > 0 ); + + int new_rows = m_columns; + int new_columns = m_rows; + + if ( m_rows != m_columns ) { + // expand matrix + int m = std::max<int>(m_rows, m_columns); + resize(m,m); + } + + for ( int i = 0 ; i < m_rows ; i++ ) { + for ( int j = i+1 ; j < m_columns ; j++ ) { + T tmp = m_matrix[i][j]; + m_matrix[i][j] = m_matrix[j][i]; + m_matrix[j][i] = tmp; + } + } + + if ( new_columns != new_rows ) { + // trim off excess. + resize(new_rows, new_columns); + } + + return *this; +} + +/*export*/ template <class T> +Matrix<T> +Matrix<T>::product(Matrix<T> &other) { + assert( m_matrix != NULL ); + assert( other.m_matrix != NULL ); + assert ( m_columns == other.m_rows ); + + Matrix<T> out(m_rows, other.m_columns); + + for ( int i = 0 ; i < out.m_rows ; i++ ) { + for ( int j = 0 ; j < out.m_columns ; j++ ) { + for ( int x = 0 ; x < m_columns ; x++ ) { + out(i,j) += m_matrix[i][x] * other.m_matrix[x][j]; + } + } + } + + return out; +} + +/*export*/ template <class T> +T& +Matrix<T>::operator ()(int x, int y) { + assert ( x >= 0 ); + assert ( y >= 0 ); + assert ( x < m_rows ); + assert ( y < m_columns ); + assert ( m_matrix != NULL ); + return m_matrix[x][y]; +} diff -r 3a3dd22a98d9 -r 870865d25958 include/utilities/munkres/munkres.cpp --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/include/utilities/munkres/munkres.cpp Fri May 11 17:06:55 2012 -0700 @@ -0,0 +1,359 @@ +/* + * Copyright (c) 2007 John Weaver + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + */ + +#include "munkres.h" + +#include <iostream> +#include <cmath> + +bool +Munkres::find_uncovered_in_matrix(double item, int &row, int &col) { + for ( row = 0 ; row < matrix.rows() ; row++ ) + if ( !row_mask[row] ) + for ( col = 0 ; col < matrix.columns() ; col++ ) + if ( !col_mask[col] ) + if ( matrix(row,col) == item ) + return true; + + return false; +} + +bool +Munkres::pair_in_list(const std::pair<int,int> &needle, const std::list<std::pair<int,int> > &haystack) { + for ( std::list<std::pair<int,int> >::const_iterator i = haystack.begin() ; i != haystack.end() ; i++ ) { + if ( needle == *i ) + return true; + } + + return false; +} + +int +Munkres::step1(void) { + for ( int row = 0 ; row < matrix.rows() ; row++ ) + for ( int col = 0 ; col < matrix.columns() ; col++ ) + if ( matrix(row,col) == 0 ) { + bool isstarred = false; + for ( int nrow = 0 ; nrow < matrix.rows() ; nrow++ ) + if ( mask_matrix(nrow,col) == STAR ) { + isstarred = true; + break; + } + + if ( !isstarred ) { + for ( int ncol = 0 ; ncol < matrix.columns() ; ncol++ ) + if ( mask_matrix(row,ncol) == STAR ) { + isstarred = true; + break; + } + } + + if ( !isstarred ) { + mask_matrix(row,col) = STAR; + } + } + + return 2; +} + +int +Munkres::step2(void) { + int rows = matrix.rows(); + int cols = matrix.columns(); + int covercount = 0; + for ( int row = 0 ; row < rows ; row++ ) + for ( int col = 0 ; col < cols ; col++ ) + if ( mask_matrix(row,col) == STAR ) { + col_mask[col] = true; + covercount++; + } + + int k = matrix.minsize(); + + if ( covercount >= k ) { +#ifdef DEBUG + std::cout << "Final cover count: " << covercount << std::endl; +#endif + return 0; + } + +#ifdef DEBUG + std::cout << "Munkres matrix has " << covercount << " of " << k << " Columns covered:" << std::endl; + for ( int row = 0 ; row < rows ; row++ ) { + for ( int col = 0 ; col < cols ; col++ ) { + std::cout.width(8); + std::cout << matrix(row,col) << ","; + } + std::cout << std::endl; + } + std::cout << std::endl; +#endif + + + return 3; +} + +int +Munkres::step3(void) { + /* + Main Zero Search + + 1. Find an uncovered Z in the distance matrix and prime it. If no such zero exists, go to Step 5 + 2. If No Z* exists in the row of the Z', go to Step 4. + 3. If a Z* exists, cover this row and uncover the column of the Z*. Return to Step 3.1 to find a new Z + */ + if ( find_uncovered_in_matrix(0, saverow, savecol) ) { + mask_matrix(saverow,savecol) = PRIME; // prime it. + } else { + return 5; + } + + for ( int ncol = 0 ; ncol < matrix.columns() ; ncol++ ) + if ( mask_matrix(saverow,ncol) == STAR ) { + row_mask[saverow] = true; //cover this row and + col_mask[ncol] = false; // uncover the column containing the starred zero + return 3; // repeat + } + + return 4; // no starred zero in the row containing this primed zero +} + +int +Munkres::step4(void) { + int rows = matrix.rows(); + int cols = matrix.columns(); + + std::list<std::pair<int,int> > seq; + // use saverow, savecol from step 3. + std::pair<int,int> z0(saverow, savecol); + std::pair<int,int> z1(-1,-1); + std::pair<int,int> z2n(-1,-1); + seq.insert(seq.end(), z0); + int row, col = savecol; + /* + Increment Set of Starred Zeros + + 1. Construct the ``alternating sequence'' of primed and starred zeros: + + Z0 : Unpaired Z' from Step 4.2 + Z1 : The Z* in the column of Z0 + Z[2N] : The Z' in the row of Z[2N-1], if such a zero exists + Z[2N+1] : The Z* in the column of Z[2N] + + The sequence eventually terminates with an unpaired Z' = Z[2N] for some N. + */ + bool madepair; + do { + madepair = false; + for ( row = 0 ; row < rows ; row++ ) + if ( mask_matrix(row,col) == STAR ) { + z1.first = row; + z1.second = col; + if ( pair_in_list(z1, seq) ) + continue; + + madepair = true; + seq.insert(seq.end(), z1); + break; + } + + if ( !madepair ) + break; + + madepair = false; + + for ( col = 0 ; col < cols ; col++ ) + if ( mask_matrix(row,col) == PRIME ) { + z2n.first = row; + z2n.second = col; + if ( pair_in_list(z2n, seq) ) + continue; + madepair = true; + seq.insert(seq.end(), z2n); + break; + } + } while ( madepair ); + + for ( std::list<std::pair<int,int> >::iterator i = seq.begin() ; + i != seq.end() ; + i++ ) { + // 2. Unstar each starred zero of the sequence. + if ( mask_matrix(i->first,i->second) == STAR ) + mask_matrix(i->first,i->second) = NORMAL; + + // 3. Star each primed zero of the sequence, + // thus increasing the number of starred zeros by one. + if ( mask_matrix(i->first,i->second) == PRIME ) + mask_matrix(i->first,i->second) = STAR; + } + + // 4. Erase all primes, uncover all columns and rows, + for ( int row = 0 ; row < mask_matrix.rows() ; row++ ) + for ( int col = 0 ; col < mask_matrix.columns() ; col++ ) + if ( mask_matrix(row,col) == PRIME ) + mask_matrix(row,col) = NORMAL; + + for ( int i = 0 ; i < rows ; i++ ) { + row_mask[i] = false; + } + + for ( int i = 0 ; i < cols ; i++ ) { + col_mask[i] = false; + } + + // and return to Step 2. + return 2; +} + +int +Munkres::step5(void) { + int rows = matrix.rows(); + int cols = matrix.columns(); + /* + New Zero Manufactures + + 1. Let h be the smallest uncovered entry in the (modified) distance matrix. + 2. Add h to all covered rows. + 3. Subtract h from all uncovered columns + 4. Return to Step 3, without altering stars, primes, or covers. + */ + double h = 0; + for ( int row = 0 ; row < rows ; row++ ) { + if ( !row_mask[row] ) { + for ( int col = 0 ; col < cols ; col++ ) { + if ( !col_mask[col] ) { + if ( (h > matrix(row,col) && matrix(row,col) != 0) || h == 0 ) { + h = matrix(row,col); + } + } + } + } + } + + for ( int row = 0 ; row < rows ; row++ ) + if ( row_mask[row] ) + for ( int col = 0 ; col < cols ; col++ ) + matrix(row,col) += h; + + for ( int col = 0 ; col < cols ; col++ ) + if ( !col_mask[col] ) + for ( int row = 0 ; row < rows ; row++ ) + matrix(row,col) -= h; + + return 3; +} + +void +Munkres::solve(Matrix<double> &m) { + // Linear assignment problem solution + // [modifies matrix in-place.] + // matrix(row,col): row major format assumed. + + // Assignments are remaining 0 values + // (extra 0 values are replaced with -1) +#ifdef DEBUG + std::cout << "Munkres input matrix:" << std::endl; + for ( int row = 0 ; row < m.rows() ; row++ ) { + for ( int col = 0 ; col < m.columns() ; col++ ) { + std::cout.width(8); + std::cout << m(row,col) << ","; + } + std::cout << std::endl; + } + std::cout << std::endl; +#endif + + double highValue = 0; + for ( int row = 0 ; row < m.rows() ; row++ ) { + for ( int col = 0 ; col < m.columns() ; col++ ) { + if ( m(row,col) != INFINITY && m(row,col) > highValue ) + highValue = m(row,col); + } + } + highValue++; + + for ( int row = 0 ; row < m.rows() ; row++ ) + for ( int col = 0 ; col < m.columns() ; col++ ) + if ( m(row,col) == INFINITY ) + m(row,col) = highValue; + + bool notdone = true; + int step = 1; + + this->matrix = m; + // STAR == 1 == starred, PRIME == 2 == primed + mask_matrix.resize(matrix.rows(), matrix.columns()); + + row_mask = new bool[matrix.rows()]; + col_mask = new bool[matrix.columns()]; + for ( int i = 0 ; i < matrix.rows() ; i++ ) { + row_mask[i] = false; + } + + for ( int i = 0 ; i < matrix.columns() ; i++ ) { + col_mask[i] = false; + } + + while ( notdone ) { + switch ( step ) { + case 0: + notdone = false; + break; + case 1: + step = step1(); + break; + case 2: + step = step2(); + break; + case 3: + step = step3(); + break; + case 4: + step = step4(); + break; + case 5: + step = step5(); + break; + } + } + + // Store results + for ( int row = 0 ; row < matrix.rows() ; row++ ) + for ( int col = 0 ; col < matrix.columns() ; col++ ) + if ( mask_matrix(row,col) == STAR ) + matrix(row,col) = 0; + else + matrix(row,col) = -1; + +#ifdef DEBUG + std::cout << "Munkres output matrix:" << std::endl; + for ( int row = 0 ; row < matrix.rows() ; row++ ) { + for ( int col = 0 ; col < matrix.columns() ; col++ ) { + std::cout.width(1); + std::cout << matrix(row,col) << ","; + } + std::cout << std::endl; + } + std::cout << std::endl; +#endif + + m = matrix; + + delete [] row_mask; + delete [] col_mask; +} diff -r 3a3dd22a98d9 -r 870865d25958 include/utilities/munkres/munkres.h --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/include/utilities/munkres/munkres.h Fri May 11 17:06:55 2012 -0700 @@ -0,0 +1,52 @@ +/* + * Copyright (c) 2007 John Weaver + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + */ + +#if !defined(_MUNKRES_H_) +#define _MUNKRES_H_ + +#include "matrix.h" + +#include <list> +#include <utility> + +class Munkres { +public: + void solve(Matrix<double> &m); +private: + static const int NORMAL = 0; + static const int STAR = 1; + static const int PRIME = 2; + inline bool find_uncovered_in_matrix(double,int&,int&); + inline bool pair_in_list(const std::pair<int,int> &, const std::list<std::pair<int,int> > &); + int step1(void); + int step2(void); + int step3(void); + int step4(void); + int step5(void); + int step6(void); + Matrix<int> mask_matrix; + Matrix<double> matrix; + bool *row_mask; + bool *col_mask; + int saverow, savecol; +}; + +// DM: This is dangerous, but will do for now +#include "munkres.cpp" + +#endif /* !defined(_MUNKRES_H_) */ diff -r 3a3dd22a98d9 -r 870865d25958 tools/CMakeLists.txt