#include #include #include #include #include #include #include "prettyprint.hpp" //#include class binomial_coeff_table { std::vector > B; int n_max, k_max; public: binomial_coeff_table(int n, int k) { n_max = n; k_max = k; B.resize(n + 1); for( int i = 0; i <= n; i++ ) { B[i].resize(k + 1); for ( int j = 0; j <= std::min(i, k); j++ ) { if (j == 0 || j == i) B[i][j] = 1; else B[i][j] = B[i-1][j-1] + B[i-1][j]; } } } int operator()(int n, int k) const { // std::cout << "B(" << n << "," << k << ")\n"; return B[n][k]; } }; template OutputIterator get_simplex_vertices( int idx, int dim, int n, const binomial_coeff_table& binomial_coeff, OutputIterator out ) { --n; for( int k = dim + 1; k > 0; --k ) { while( binomial_coeff( n , k ) > idx ) { --n; } *out++ = n; idx -= binomial_coeff( n , k ); } return out; } std::vector vertices_of_simplex(int simplex_index, int dim, int n, const binomial_coeff_table& binomial_coeff) { std::vector vertices; get_simplex_vertices( simplex_index, dim, n, binomial_coeff, std::back_inserter(vertices) ); return vertices; } template class rips_filtration_comparator { public: const DistanceMatrix& dist; const int dim; private: std::vector vertices; typedef decltype(dist(0,0)) dist_t; bool reverse; const binomial_coeff_table& binomial_coeff; public: rips_filtration_comparator( const DistanceMatrix& _dist, const int _dim, const binomial_coeff_table& _binomial_coeff // , // bool _reverse = true ): dist(_dist), dim(_dim), vertices(_dim + 1), binomial_coeff(_binomial_coeff) // , // reverse(_reverse) {}; dist_t diam(const int index) { dist_t diam = 0; get_simplex_vertices(index, dim, dist.size(), binomial_coeff, vertices.begin() ); for (int i = 0; i <= dim; ++i) for (int j = i + 1; j <= dim; ++j) { auto d = dist(vertices[i], vertices[j]); diam = std::max(diam, dist(vertices[i], vertices[j])); } return diam; } bool operator()(const int a, const int b) { assert(a < binomial_coeff(dist.size(), dim + 1)); assert(b < binomial_coeff(dist.size(), dim + 1)); dist_t a_diam = 0, b_diam = 0; b_diam = diam(b); get_simplex_vertices(a, dim, dist.size(), binomial_coeff, vertices.begin() ); for (int i = 0; i <= dim; ++i) for (int j = i + 1; j <= dim; ++j) { a_diam = std::max(a_diam, dist(vertices[i], vertices[j])); if (a_diam > b_diam) // (((a_diam < b_diam) && !reverse) || // ((a_diam > b_diam) && reverse)) return true; } return (a_diam == b_diam) && (a > b); // return (a_diam == b_diam) && (((a < b) && !reverse) || ((a > b) && reverse)); } }; template void get_simplex_coboundary( int idx, int dim, int n, const binomial_coeff_table& binomial_coeff, OutputIterator coboundary ) { --n; int modified_idx = idx; for( int k = dim + 1; k >= 0 && n >= 0; --k ) { while( binomial_coeff( n , k ) > idx ) { // std::cout << "binomial_coeff(" << n << ", " << k << ") = " << binomial_coeff( n , k ) << " > " << idx << std::endl; *coboundary++ = modified_idx + binomial_coeff( n , k + 1 ); if (n==0) break; --n; } idx -= binomial_coeff( n , k ); modified_idx -= binomial_coeff( n , k ); modified_idx += binomial_coeff( n , k + 1 ); --n; } return; } class distance_matrix { public: typedef double value_type; std::vector > distances; double operator()(const int a, const int b) const { return distances[a][b]; } size_t size() const { return distances.size(); } }; template class compressed_sparse_matrix { public: std::vector bounds; std::vector entries; size_t size() const { return bounds.size(); } typename std::vector::const_iterator cbegin(size_t index) { assert(index < size()); return index == 0 ? entries.cbegin() : entries.cbegin() + bounds[index - 1]; } typename std::vector::const_iterator cend(size_t index) { assert(index < size()); return entries.cbegin() + bounds[index]; } template void append(Iterator begin, Iterator end) { for (Iterator it = begin; it != end; ++it) { entries.push_back(*it); } bounds.push_back(entries.size()); } template void append(const Collection collection) { append(collection.cbegin(), collection.cend()); } }; template int get_pivot(Heap& column) { if( column.empty() ) return -1; else { int max_element = column.top(); column.pop(); while( !column.empty() && column.top() == max_element ) { column.pop(); if( column.empty() ) return -1; else { max_element = column.top(); column.pop(); } } if( max_element != -1 ) column.push( max_element ); return max_element; } } void print_help_and_exit() { std::cerr << "Usage: " << "ripser " << "[options] input_filename output_filename" << std::endl; std::cerr << std::endl; std::cerr << "Options:" << std::endl; std::cerr << std::endl; std::cerr << "--help -- prints this screen" << std::endl; std::cerr << "--top_dim N -- maximal dimension to compute" << std::endl; std::cerr << "--threshold D -- maximal diameter to compute" << std::endl; exit(-1); } int main( int argc, char** argv ) { if( argc < 3 ) print_help_and_exit(); std::string input_filename = argv[ argc - 2 ]; std::string output_filename = argv[ argc - 1 ]; int dim_max = 2; double threshold = std::numeric_limits::max(); for( int idx = 1; idx < argc - 2; idx++ ) { const std::string option = argv[ idx ]; if( option == "--help" ) { print_help_and_exit(); } else if( option == "--top_dim" ) { idx++; if( idx >= argc - 2 ) print_help_and_exit(); std::string parameter = std::string( argv[ idx ] ); size_t pos_last_digit; dim_max = std::stoll( parameter, &pos_last_digit ); if( pos_last_digit != parameter.size() ) print_help_and_exit(); } else if( option == "--threshold" ) { idx++; if( idx >= argc - 2 ) print_help_and_exit(); std::string parameter = std::string( argv[ idx ] ); size_t pos_last_digit; threshold = std::stod( parameter, &pos_last_digit ); if( pos_last_digit != parameter.size() ) print_help_and_exit(); } else print_help_and_exit(); } std::ifstream input_stream( input_filename.c_str( ), std::ios_base::binary | std::ios_base::in ); if( input_stream.fail( ) ) { std::cerr << "couldn't open file" << input_filename << std::endl; exit(-1); } int64_t magic_number; input_stream.read( (char*)&magic_number, sizeof( int64_t ) ); if( magic_number != 8067171840 ) { std::cerr << input_filename << " is not a Dipha file (magic number: 8067171840)" << std::endl; exit(-1); } int64_t file_type; input_stream.read( (char*)&file_type, sizeof( int64_t ) ); if( file_type != 7 ) { std::cerr << input_filename << " is not a Dipha distance matrix (file type: 7)" << std::endl; exit(-1); } int64_t n; input_stream.read( (char*)&n, sizeof( int64_t ) ); std::cout << "distance matrix with " << n << " points" << std::endl; //std::vector distances = distance_matrix dist; dist.distances = std::vector>(n, std::vector(n));; // std::cout << dist.distances << std::endl; for( int i = 0; i < n; ++i ) { input_stream.read( (char*)&dist.distances[i][0], n * sizeof(int64_t) ); } // dist.distances = { // {0,1,3,4,3,1}, // {1,0,1,3,4,3}, // {3,1,0,1,3,4}, // {4,3,1,0,1,3}, // {3,4,3,1,0,1}, // {1,3,4,3,1,0} // }; // n = dist.size(); assert(dim_max < n - 1); binomial_coeff_table binomial_coeff(n, dim_max + 2); // std::cout << dist (0,1) << std::endl; // // rips_filtration_comparator comp1(dist, 1, binomial_coeff); // rips_filtration_comparator comp2(dist, 2, binomial_coeff); // // std::cout << (comp1(0,1) ? "0<1" : "0>=1") << std::endl; // std::cout << (comp1(1,0) ? "1<0" : "1>=0") << std::endl; // // std::cout << (comp1(0,2) ? "0<2" : "0>=2") << std::endl; // std::cout << (comp1(1,2) ? "1<2" : "1>=2") << std::endl; // // std::vector edges = {0,1,2,3,4,5}; // // std::sort(edges.begin(), edges.end(), comp1); // // std::cout << "sorted edges: " << edges << std::endl; // // // std::vector triangles = {0,1,2,3}; // // std::sort(triangles.begin(), triangles.end(), comp2); // // std::cout << "sorted triangles: " << triangles << std::endl; // // // int dim = 1; // int simplex_index = 2; // // double threshold = 7; // // std::vector vertices; // // get_simplex_vertices( simplex_index, dim, n, binomial_coeff, std::back_inserter(vertices) ); // // // std::cout << "coboundary of simplex " << vertices << ":" << std::endl; // // std::vector coboundary; // get_simplex_coboundary( simplex_index, dim, n, binomial_coeff, std::back_inserter(coboundary) ); // // // for (int coboundary_simplex_index: coboundary) { // std::vector vertices; // // get_simplex_vertices( coboundary_simplex_index, dim + 1, n, binomial_coeff, std::back_inserter(vertices) ); // std::cout << " " << coboundary_simplex_index << " " << vertices << " (" << comp1.diam(coboundary_simplex_index) << ")" << std::endl; // // } // // // compressed_sparse_matrix csm; // // csm.append(std::vector({1,2,3})); // // csm.append(std::vector({5,6,7,8})); // // csm.append(std::vector({10,11})); // // csm.append(std::vector()); // // csm.append(std::vector({2})); // // std::cout << "compressed sparse matrix: " << std::endl; // // for (int i = 0; i < csm.size(); ++i) { // std::cout << " " << std::vector(csm.cbegin(i), csm.cend(i)) << std::endl; // } // // std::cout << "bounds: " << csm.bounds << std::endl; // // std::cout << "entries: " << csm.entries << std::endl; // // // std::priority_queue, rips_filtration_comparator > queue(comp1); // // for (int e: coboundary) queue.push(e); // // std::cout << "pivot of coboundary: " << queue.top() << std::endl; // // std::cout << (comp1(3,6) ? "3<6" : "3>=6") << std::endl; // std::cout << (comp1(0,6) ? "0<6" : "0>=6") << std::endl; // // // // std::vector columns_to_reduce = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9 }; // // std::sort(columns_to_reduce.begin(), columns_to_reduce.end(), comp1); // // std::cout << "sorted 1-simplex columns to reduce: " << columns_to_reduce << std::endl; // // for (int index: columns_to_reduce) { // std::vector vertices; // // get_simplex_vertices( index, 1, n, binomial_coeff, std::back_inserter(vertices) ); // std::cout << " " << index << " " << vertices << " (" << comp1.diam(index) << ")" << std::endl; // } // // // std::sort(columns_to_reduce.begin(), columns_to_reduce.end(), comp2); // // std::cout << "sorted 2-simplex columns to reduce: " << columns_to_reduce << std::endl; // // for (int index: columns_to_reduce) { // std::vector vertices; // // get_simplex_vertices( index, 2, n, binomial_coeff, std::back_inserter(vertices) ); // std::cout << " " << index << " " << vertices << " (" << comp2.diam(index) << ")" << std::endl; // } // // // // // std::vector columns_to_reduce; std::vector coboundary; for (int index = 0; index < n; ++index) { columns_to_reduce.push_back(index); } for (int dim = 0; dim < dim_max; ++dim) { //compressed_sparse_matrix reduction_matrix; rips_filtration_comparator comp(dist, dim + 1, binomial_coeff); std::unordered_map pivot_column_index; //std::vector reduction_column; // std::cout << "reduce columns in dim " << dim << ": " << columns_to_reduce << std::endl; // std::cout << " rows in dim " << dim + 1 << ": " << columns_to_reduce << std::endl; // std::vector rows(binomial_coeff(n, dim + 2)); // for (int simplex_index = 0; simplex_index < binomial_coeff(n, dim + 2); ++simplex_index) { // rows[simplex_index] = simplex_index; // } // std::sort(rows.begin(), rows.end(), comp); // // for (int simplex_index: rows) { // std::vector vertices; // // get_simplex_vertices( simplex_index, dim + 1, n, binomial_coeff, std::back_inserter(vertices) ); // std::cout << " " << simplex_index << " " << vertices << " (" << comp.diam(simplex_index) << ")" << std::endl; // // } for (int index: columns_to_reduce) { //reduction_column.clear(); std::priority_queue, rips_filtration_comparator > working_coboundary(comp); // std::cout << "reduce column " << index << std::endl; int pivot, column = index; do { coboundary.clear(); get_simplex_coboundary( column, dim, n, binomial_coeff, std::back_inserter(coboundary) ); std::vector sorted_coboundary = coboundary; std::sort(sorted_coboundary.begin(), sorted_coboundary.end(), comp); // std::cout << "add " << sorted_coboundary << " to working col" << std::endl; // for (int coboundary_simplex_index: coboundary) { // std::vector vertices; // // get_simplex_vertices( coboundary_simplex_index, dim + 1, n, binomial_coeff, std::back_inserter(vertices) ); // std::cout << " " << coboundary_simplex_index << " " << vertices << " (" << comp.diam(coboundary_simplex_index) << ")" << std::endl; // } for (int e: coboundary) if (comp.diam(e) <= threshold) working_coboundary.push(e); // std::cout << "push " << e << std::endl;} // std::cout << "=" << std::endl; // auto working_coboundary_copy = working_coboundary; // while (!working_coboundary_copy.empty()) { // std::cout << " " << working_coboundary_copy.top() << std::endl; // working_coboundary_copy.pop(); // } // std::cout << "=" << std::endl; pivot = get_pivot(working_coboundary); //add boundary column at index birth to working_coboundary //since the boundary column is not stored explicitly, //add the boundary of the column at index birth in the reduction matrix instead //space-efficient variant: add just the boundary column at index birth instead //this avoids having to store the reduction matrix if (pivot != -1) { // std::cout << "pivot: " << pivot << std::endl; auto pair = pivot_column_index.find(pivot); if (pair == pivot_column_index.end()) { pivot_column_index.insert(std::make_pair(pivot, index)); break; } column = pair->second; } /* coboundary.clear(); get_simplex_coboundary( birth, dim, n, binomial_coeff, std::back_inserter(coboundary) ); for (int e: coboundary) if (comp2.diam(e) <= threshold) working_coboundary.push(e); //space-efficient variant: drop this part (and the reduction_matrix) for (int col = reduction_matrix.cbegin()) { coboundary.clear(); get_simplex_coboundary( col, dim, n, binomial_coeff, std::back_inserter(coboundary) ); for (int e: coboundary) if (comp2.diam(e) <= threshold) working_coboundary.push(e); } */ } while ( pivot != -1 ); // std::cout << std::endl; } std::cout << "dimension " << dim << " pairs:" << std::endl; // std::cout << pivot_column_index << std::endl; rips_filtration_comparator comp_prev(dist, dim, binomial_coeff); for (std::pair pair: pivot_column_index) { double birth = comp_prev.diam(pair.second), death = comp.diam(pair.first); // std::cout << vertices_of_simplex(pair.second, dim, n, binomial_coeff) << "," << // vertices_of_simplex(pair.first, dim + 1, n, binomial_coeff) << std::endl; if (birth != death) std::cout << " [" << birth << "," << death << ")" << std::endl; } if (dim == dim_max - 1) break; int num_simplices = binomial_coeff(n, dim + 2); columns_to_reduce.clear(); // std::cout << "columns to reduce in dim " << dim + 1 << " (" << num_simplices << " total)" << std::endl; for (int index = 0; index < num_simplices; ++index) { // if (comp.diam(index) > threshold) { // std::cout << " " << vertices_of_simplex(index, dim + 1, n, binomial_coeff) << ": " << comp.diam(index) << " above threshold" << std::endl; // } else if (pivot_column_index.find(index) != pivot_column_index.end()) { // std::cout << " " << vertices_of_simplex(index, dim + 1, n, binomial_coeff) << " appears in pair" << std::endl; // } if (comp.diam(index) <= threshold && pivot_column_index.find(index) == pivot_column_index.end()) { columns_to_reduce.push_back(index); } } std::sort(columns_to_reduce.begin(), columns_to_reduce.end(), comp); // std::cout << "sorted " << dim + 1 << "-columns to reduce: " << columns_to_reduce << std::endl; // // for (int index: columns_to_reduce) { // std::vector vertices; // // get_simplex_vertices( index, dim, n, binomial_coeff, std::back_inserter(vertices) ); // std::cout << " " << index << " " << vertices << " (" << comp.diam(index) << ")" << std::endl; // } // // std::cout << std::endl; } }