#include #include #include #include #include #include #include #include #include typedef float value_t; typedef long index_t; #define PRECOMPUTE_DIAMETERS #define PRECOMPUTE_DIAMETERS_IN_TOP_DIMENSION #define USE_BINARY_SEARCH #define USE_EXPONENTIAL_SEARCH #define INDICATE_PROGRESS #define PRINT_PERSISTENCE_PAIRS #define USE_COEFFICIENTS //#define ASSEMBLE_REDUCTION_COLUMN //#define FILE_FORMAT_DIPHA #define FILE_FORMAT_UPPER_TRIANGULAR_CSV //#define FILE_FORMAT_LOWER_TRIANGULAR_CSV class binomial_coeff_table { std::vector > B; index_t n_max, k_max; public: binomial_coeff_table(index_t n, index_t k) { n_max = n; k_max = k; B.resize(n + 1); for( index_t i = 0; i <= n; i++ ) { B[i].resize(k + 1); for ( index_t j = 0; j <= std::min(i, k); j++ ) { if (j == 0 || j == i) B[i][j] = 1; else B[i][j] = B[i-1][j-1] + B[i-1][j]; } } } inline index_t operator()(index_t n, index_t k) const { assert(n <= n_max); assert(k <= k_max); return B[n][k]; } }; template OutputIterator get_simplex_vertices( index_t idx, const index_t dim, index_t n, const binomial_coeff_table& binomial_coeff, OutputIterator out ) { --n; for( index_t k = dim + 1; k > 0; --k ) { #ifdef USE_BINARY_SEARCH if ( binomial_coeff( n , k ) > idx ) { index_t count; #ifdef USE_EXPONENTIAL_SEARCH for (count = 1; (binomial_coeff( n - count , k ) > idx); count = std::min(count << 1, n)); #else count = n; #endif while (count > 0) { index_t i = n; index_t step = count >> 1; i -= step; if (binomial_coeff( i , k ) > idx) { n = --i; count -= step + 1; } else count = step; } } #else while( binomial_coeff( n , k ) > idx ) --n; #endif assert( binomial_coeff( n , k ) <= idx ); assert( binomial_coeff( n + 1, k ) > idx ); *out++ = n; idx -= binomial_coeff( n , k ); } return out; } std::vector vertices_of_simplex(const index_t simplex_index, const index_t dim, const index_t n, const binomial_coeff_table& binomial_coeff) { std::vector vertices; get_simplex_vertices( simplex_index, dim, n, binomial_coeff, std::back_inserter(vertices) ); return vertices; } template class rips_filtration_comparator { public: const DistanceMatrix& dist; const index_t dim; private: mutable std::vector vertices; const binomial_coeff_table& binomial_coeff; public: rips_filtration_comparator( const DistanceMatrix& _dist, const index_t _dim, const binomial_coeff_table& _binomial_coeff ): dist(_dist), dim(_dim), vertices(_dim + 1), binomial_coeff(_binomial_coeff) {}; inline value_t diameter(const index_t index) const { value_t diam = 0; get_simplex_vertices(index, dim, dist.size(), binomial_coeff, vertices.begin() ); for (index_t i = 0; i <= dim; ++i) for (index_t j = 0; j < i; ++j) { diam = std::max(diam, dist(vertices[i], vertices[j])); } return diam; } inline bool operator()(const index_t a, const index_t b) const { assert(a < binomial_coeff(dist.size(), dim + 1)); assert(b < binomial_coeff(dist.size(), dim + 1)); value_t a_diam = 0, b_diam = 0; b_diam = diameter(b); get_simplex_vertices(a, dim, dist.size(), binomial_coeff, vertices.begin() ); for (index_t i = 0; i <= dim; ++i) for (index_t j = i + 1; j <= dim; ++j) { a_diam = std::max(a_diam, dist(vertices[i], vertices[j])); if (a_diam > b_diam) return true; } return (a_diam == b_diam) && (a > b); } }; #ifdef USE_COEFFICIENTS struct entry_t { index_t index; index_t value; entry_t(index_t _index, index_t _value) : index(_index), value(_value) {} entry_t(index_t _index) : index(_index), value(0) {} }; entry_t make_entry(index_t _index, index_t _value) { return entry_t(_index, _value); } index_t get_index(entry_t e) { return e.index; } #else typedef index_t entry_t; index_t get_index(index_t i) { return i; } entry_t make_entry(index_t _index, index_t _value) { return entry_t(_index); } #endif class simplex_coboundary_enumerator { private: index_t idx, modified_idx, dim, n, k; const binomial_coeff_table& binomial_coeff; public: inline simplex_coboundary_enumerator ( index_t _idx, index_t _dim, index_t _n, const binomial_coeff_table& _binomial_coeff): idx(_idx), modified_idx(_idx), dim(_dim), k(dim + 1), n(_n - 1), binomial_coeff(_binomial_coeff) {} inline bool has_next() { while ( (k != -1 && n != -1) && (binomial_coeff( n , k ) <= idx) ) { idx -= binomial_coeff( n , k ); modified_idx -= binomial_coeff( n , k ); modified_idx += binomial_coeff( n , k + 1 ); --n; --k; } return k != -1 && n != -1; } inline entry_t next() { while ( binomial_coeff( n , k ) <= idx ) { idx -= binomial_coeff( n , k ); modified_idx -= binomial_coeff( n , k ); modified_idx += binomial_coeff( n , k + 1 ); --n; } return make_entry( modified_idx + binomial_coeff( n-- , k + 1 ), k & 1 ? 1 : -1 ); } }; template std::vector get_diameters ( const DistanceMatrix& dist, const index_t dim, const std::vector& previous_diameters, const binomial_coeff_table& binomial_coeff ) { index_t n = dist.size(); std::vector diameters(binomial_coeff(n, dim + 1), 0); std::vector coboundary; for (index_t simplex = 0; simplex < previous_diameters.size(); ++simplex) { coboundary.clear(); #ifdef INDICATE_PROGRESS std::cout << "\033[Kpropagating diameter of simplex " << simplex + 1 << "/" << previous_diameters.size() << std::flush << "\r"; #endif simplex_coboundary_enumerator coboundaries(simplex, dim - 1, n, binomial_coeff); while (coboundaries.has_next()) { index_t coface = get_index(coboundaries.next()); diameters[coface] = std::max( diameters[coface], previous_diameters[simplex]); } } #ifdef INDICATE_PROGRESS std::cout << "\033[K"; #endif return diameters; } class rips_filtration_diameter_comparator { private: const std::vector& diameters; const index_t dim; public: std::vector vertices; typedef value_t dist_t; const binomial_coeff_table& binomial_coeff; public: rips_filtration_diameter_comparator( const std::vector& _diameters, const index_t _dim, const binomial_coeff_table& _binomial_coeff ): diameters(_diameters), dim(_dim), binomial_coeff(_binomial_coeff) {} inline value_t diameter(const index_t a) const { assert(a < diameters.size()); return diameters[a]; } inline bool operator()(const index_t a, const index_t b) const { assert(a < diameters.size()); assert(b < diameters.size()); dist_t a_diam = diameters[a], b_diam = diameters[b]; return ((a_diam > b_diam) || ((a_diam == b_diam) && (a > b))); } template inline bool operator()(const Entry& a, const Entry& b) const { return operator()(get_index(a), get_index(b)); } }; class distance_matrix { public: typedef value_t value_type; std::vector > distances; inline value_t operator()(const index_t a, const index_t b) const { return distances[a][b]; } inline size_t size() const { return distances.size(); } }; class compressed_upper_distance_matrix_adapter { public: typedef value_t value_type; std::vector& distances; std::vector rows; index_t n; void init_distances () { distances.resize(n * (n-1) / 2); } void init_rows () { rows.resize(n); value_t* pointer = &distances[0] - 1; for (index_t i = 0; i < n - 1; ++i) { rows[i] = pointer; pointer += n - i - 2; } } compressed_upper_distance_matrix_adapter(std::vector& _distances) : distances(_distances) { n = (1 + std::sqrt(1+ 8 * _distances.size())) / 2; assert( distances.size() == n * (n-1) / 2 ); init_rows(); } inline value_t operator()(const index_t a, const index_t b) const { if (a < b) return rows[a][b]; else if (a > b) return rows[b][a]; else return 0; } inline size_t size() const { return n; } }; class compressed_lower_distance_matrix_adapter { public: typedef value_t value_type; std::vector& distances; std::vector rows; index_t n; void init_distances () { distances.resize(n * (n-1) / 2); } void init_rows () { rows.resize(n); value_t* pointer = &distances[0]; for (index_t i = 1; i < n; ++i) { rows[i] = pointer; pointer += i; } } compressed_lower_distance_matrix_adapter( std::vector& _distances, const index_t _n) : distances(_distances), n(_n) { init_distances(); init_rows(); } compressed_lower_distance_matrix_adapter(std::vector& _distances) : distances(_distances) { n = (1 + std::sqrt(1+ 8 * distances.size())) / 2; assert( distances.size() == n * (n-1) / 2 ); init_rows(); } template compressed_lower_distance_matrix_adapter( std::vector& _distances, const DistanceMatrix& mat) : distances(_distances), n(mat.size()) { init_distances(); init_rows(); for (index_t i = 1; i < n; ++i) { for (index_t j = 0; j < i; ++j) { rows[i][j] = mat(i, j); } } } inline value_t operator()(const index_t i, const index_t j) const { if (i > j) return rows[i][j]; else if (i < j) return rows[j][i]; else return 0; } inline size_t size() const { return n; } }; template inline entry_t pop_pivot(Heap& column) { if( column.empty() ) return entry_t(-1); else { entry_t max_element = column.top(); column.pop(); while( !column.empty() && get_index(column.top()) == get_index(max_element) ) { column.pop(); if( column.empty() ) return entry_t(-1); else { max_element = column.top(); column.pop(); } } return max_element; } } template inline entry_t get_pivot(Heap& column) { entry_t max_element = pop_pivot(column); if( get_index(max_element) != -1 ) column.push( max_element ); return max_element; } template void assemble_columns_to_reduce ( std::vector& columns_to_reduce, std::unordered_map& pivot_column_index, const Comparator& comp, index_t dim, index_t n, value_t threshold, const binomial_coeff_table& binomial_coeff ) { index_t num_simplices = binomial_coeff(n, dim + 2); columns_to_reduce.clear(); for (index_t index = 0; index < num_simplices; ++index) { if (comp.diameter(index) <= threshold && pivot_column_index.find(index) == pivot_column_index.end()) { columns_to_reduce.push_back(index); } } std::sort(columns_to_reduce.begin(), columns_to_reduce.end(), comp); } template void compute_pairs( std::vector& columns_to_reduce, std::unordered_map& pivot_column_index, const ComparatorCofaces& comp, const Comparator& comp_prev, index_t dim, index_t n, value_t threshold, const binomial_coeff_table& binomial_coeff ) { std::cout << "persistence intervals in dim " << dim << ":" << std::endl; for (index_t i = 0; i < columns_to_reduce.size(); ++i) { index_t index = columns_to_reduce[i]; #ifdef ASSEMBLE_REDUCTION_COLUMN std::priority_queue, decltype(comp) > reduction_column(comp); #endif std::priority_queue, decltype(comp) > working_coboundary(comp); #ifdef INDICATE_PROGRESS std::cout << "\033[K" << "reducing column " << i + 1 << "/" << columns_to_reduce.size() << " (diameter " << comp_prev.diameter(index) << ")" << std::flush << "\r"; #endif index_t pivot, column = index; std::vector coboundary; do { #ifdef ASSEMBLE_REDUCTION_COLUMN reduction_column.push( column ); #endif simplex_coboundary_enumerator coboundaries(column, dim, n, binomial_coeff); while (coboundaries.has_next()) { entry_t coface = coboundaries.next(); index_t coface_index = get_index(coface); if (comp.diameter(coface_index) <= threshold) working_coboundary.push(coface); } pivot = get_index(get_pivot(working_coboundary)); if (pivot != -1) { auto pair = pivot_column_index.find(pivot); if (pair == pivot_column_index.end()) { pivot_column_index.insert(std::make_pair(pivot, index)); #ifdef PRINT_PERSISTENCE_PAIRS value_t birth = comp_prev.diameter(index), death = comp.diameter(pivot); if (birth != death) std::cout << "\033[K" << " [" << birth << "," << death << ")" << std::endl << std::flush; #endif break; } column = pair->second; } } while ( pivot != -1 ); #ifdef PRINT_PERSISTENCE_PAIRS if ( pivot == -1 ) { value_t birth = comp_prev.diameter(index); std::cout << "\033[K" << " [" << birth << ", )" << std::endl << std::flush; } #endif } std::cout << "\033[K"; } void print_usage_and_exit(int exit_code) { std::cerr << "Usage: " << "ripser " << "[options] filename" << std::endl; std::cerr << std::endl; std::cerr << "Options:" << std::endl; std::cerr << std::endl; std::cerr << " --help print this screen" << std::endl; std::cerr << " --top_dim compute persistent homology up to dimension " << std::endl; std::cerr << " --threshold compute Rips complexes up to diameter " << std::endl; exit(exit_code); } int main( int argc, char** argv ) { if( argc < 2 ) print_usage_and_exit(-1); const char *filename = nullptr; index_t dim_max = 1; value_t threshold = std::numeric_limits::max(); for( index_t i = 1; i < argc; ++i ) { const std::string arg(argv[ i ]); if( arg == "--help" ) { print_usage_and_exit(0); } else if( arg == "--top_dim" ) { std::string parameter = std::string( argv[ ++i ] ); size_t next_pos; dim_max = std::stol( parameter, &next_pos ); if( next_pos != parameter.size() ) print_usage_and_exit( -1 ); } else if( arg == "--threshold" ) { std::string parameter = std::string( argv[ ++i ] ); size_t next_pos; threshold = std::stof( parameter, &next_pos ); if( next_pos != parameter.size() ) print_usage_and_exit( -1 ); } else { if (filename) { print_usage_and_exit( -1 ); } filename = argv[i]; } } std::ifstream input_stream( filename, std::ios_base::binary | std::ios_base::in ); if( input_stream.fail( ) ) { std::cerr << "couldn't open file" << filename << std::endl; exit(-1); } std::vector> diameters(dim_max + 2); #ifdef FILE_FORMAT_DIPHA int64_t magic_number; input_stream.read( reinterpret_cast(&magic_number), sizeof( int64_t ) ); if( magic_number != 8067171840 ) { std::cerr << filename << " is not a Dipha file (magic number: 8067171840)" << std::endl; exit(-1); } int64_t file_type; input_stream >> file_type; if( file_type != 7 ) { std::cerr << filename << " is not a Dipha distance matrix (file type: 7)" << std::endl; exit(-1); } int64_t n; input_stream.read( reinterpret_cast(&n), sizeof( int64_t ) ); distance_matrix dist_full; dist_full.distances = std::vector>(n, std::vector(n)); for( int i = 0; i < n; ++i ) { for( int j = 0; j < n; ++j ) { double val; input_stream.read( reinterpret_cast(&val), n * sizeof(double) ); dist_full.distances[i][j] = val; } } std::cout << "distance matrix with " << n << " points" << std::endl; compressed_lower_distance_matrix_adapter dist(diameters[1], dist_full); std::cout << "distance matrix transformed to lower triangular form" << std::endl; #endif #ifdef FILE_FORMAT_UPPER_TRIANGULAR_CSV std::vector distances; std::string value_string; while(std::getline(input_stream, value_string, ',')) distances.push_back(std::stod(value_string)); compressed_upper_distance_matrix_adapter dist_upper(distances); index_t n = dist_upper.size(); std::cout << "distance matrix with " << n << " points" << std::endl; compressed_lower_distance_matrix_adapter dist(diameters[1], dist_upper); std::cout << "distance matrix transformed to lower triangular form" << std::endl; #endif #ifdef FILE_FORMAT_LOWER_TRIANGULAR_CSV std::vector distances; std::string value_string; while(std::getline(input_stream, value_string, ',')) distances.push_back(std::stod(value_string)); compressed_lower_distance_matrix dist(std::move(distances)); index_t n = dist.size(); std::cout << "distance matrix with " << n << " points" << std::endl; #endif auto result = std::minmax_element(dist.distances.begin(), dist.distances.end()); std::cout << "value range: [" << *result.first << "," << *result.second << "]" << std::endl; assert(dim_max < n - 2); binomial_coeff_table binomial_coeff(n, dim_max + 2); std::vector columns_to_reduce; for (index_t index = n; index-- > 0; ) { columns_to_reduce.push_back(index); } index_t dim = 0; { rips_filtration_diameter_comparator comp(diameters[1], dim + 1, binomial_coeff); rips_filtration_comparator comp_prev(dist, dim, binomial_coeff); std::unordered_map pivot_column_index; compute_pairs( columns_to_reduce, pivot_column_index, comp, comp_prev, dim, n, threshold, binomial_coeff ); assemble_columns_to_reduce( columns_to_reduce, pivot_column_index, comp, dim, n, threshold, binomial_coeff ); } #ifdef PRECOMPUTE_DIAMETERS_IN_TOP_DIMENSION for (dim = 1; dim <= dim_max; ++dim) { #else for (dim = 1; dim < dim_max; ++dim) { #endif #ifdef PRECOMPUTE_DIAMETERS std::cout << "precomputing " << dim + 1 << "-simplex diameters" << std::endl; diameters[dim + 1] = get_diameters( dist, dim + 1, diameters[dim], binomial_coeff ); rips_filtration_diameter_comparator comp(diameters[dim + 1], dim + 1, binomial_coeff); rips_filtration_diameter_comparator comp_prev(diameters[dim], dim, binomial_coeff); #else rips_filtration_comparator comp(dist, dim + 1, binomial_coeff); rips_filtration_comparator comp_prev(dist, dim, binomial_coeff); #endif std::unordered_map pivot_column_index; compute_pairs( columns_to_reduce, pivot_column_index, comp, comp_prev, dim, n, threshold, binomial_coeff ); assemble_columns_to_reduce( columns_to_reduce, pivot_column_index, comp, dim, n, threshold, binomial_coeff ); // if ( dim > 1 ) // diameters[dim] = std::vector(); } #ifdef PRECOMPUTE_DIAMETERS #ifndef PRECOMPUTE_DIAMETERS_IN_TOP_DIMENSION { dim = dim_max; rips_filtration_diameter_comparator comp_prev(diameters[dim], dim, binomial_coeff); rips_filtration_comparator comp(dist, dim + 1, binomial_coeff); std::unordered_map pivot_column_index; compute_pairs( columns_to_reduce, pivot_column_index, comp, comp_prev, dim, n, threshold, binomial_coeff ); } #endif #endif }