/*    This file is part of the Gudhi Library. The Gudhi library
 *    (Geometric Understanding in Higher Dimensions) is a generic C++
 *    library for computational topology.
 *
 *    Author(s):       Pawel Dlotko
 *
 *    Copyright (C) 2015  INRIA (France)
 *
 *    This program is free software: you can redistribute it and/or modify
 *    it under the terms of the GNU General Public License as published by
 *    the Free Software Foundation, either version 3 of the License, or
 *    (at your option) any later version.
 *
 *    This program is distributed in the hope that it will be useful,
 *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *    GNU General Public License for more details.
 *
 *    You should have received a copy of the GNU General Public License
 *    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef Read_Persitence_From_File_H
#define Read_Persitence_From_File_H

#include <unistd.h>

#include <algorithm>
#include <cctype>
#include <cstddef>
#include <fstream>
#include <iostream>
#include <sstream>
#include <string>
#include <utility>
#include <vector>

namespace Gudhi {
namespace Gudhi_stat {

namespace read_persistence_internal {

/**
 * Opens `filename` for reading into `in`.
 * If the file does not exist, or exists but cannot be opened, a diagnostic is written to std::cerr
 * and `error_message` is thrown (as a `const char*`, which is what callers of the readers below catch).
 **/
inline void open_file_or_throw(std::ifstream& in, const char* filename, const char* error_message) {
  const bool file_exists = (access(filename, F_OK) != -1);
  if (file_exists) {
    in.open(filename);
  }
  if (!file_exists || !in.is_open()) {
    std::cerr << "The file : " << filename << " do not exist. The program will now terminate \n";
    throw error_message;
  }
}

/**
 * Counts the entries of a data line: the leading numbers that can be read as doubles, plus one
 * if the line contains the string 'inf'.
 **/
inline int count_entries_in_line(const std::string& line) {
  const std::string::size_type inf_position = line.find("inf");
  // Only the text in front of 'inf' is parsed: some standard libraries read "inf" as a number and
  // some do not, and the token must be counted exactly once either way.
  std::istringstream numbers(line.substr(0, inf_position));
  int count = 0;
  double number = 0;
  // The entries are read as doubles: reading them as integers stops at the first decimal point
  // and under-counts lines such as "0.5 1.5".
  while (numbers >> number) {
    ++count;
  }
  if (inf_position != std::string::npos) {
    ++count;
  }
  return count;
}

}  // namespace read_persistence_internal

/**
 * This procedure reads birth-death data from a file. Empty lines and lines starting with '#' are ignored.
 * A line may contain the string 'inf' or 'Inf' to mark an infinite interval. If the second parameter is -1
 * (the default), such lines are ignored. Otherwise the first number of the line is taken as birth and the
 * death is substituted by the value of the second parameter.
 * If the begin of an interval is greater than its end, the two numbers are swapped.
 * Lines from which the required numbers cannot be read are skipped.
 * Throws a `const char*` message if the file does not exist or cannot be opened.
 **/
inline std::vector< std::pair< double, double > > read_persistence_file_that_may_contain_inf_string(
    const char* filename, double what_to_substitute_for_infinite_bar = -1) {
  std::ifstream in;
  read_persistence_internal::open_file_or_throw(
      in, filename,
      "The file from which you are trying to read do not exist. The program will now terminate \n");

  std::vector< std::pair< double, double > > barcode;
  std::string line;
  // Looping on getline itself (instead of on !in.eof()) guarantees termination when a read fails.
  while (std::getline(in, line)) {
    if (line.empty() || line[0] == '#') continue;

    std::istringstream lineSS(line);
    double beginn = 0;
    double endd = 0;
    const bool is_infinite =
        (line.find("inf") != std::string::npos) || (line.find("Inf") != std::string::npos);
    if (is_infinite) {
      if (what_to_substitute_for_infinite_bar == -1) continue;
      if (!(lineSS >> beginn)) continue;
      endd = what_to_substitute_for_infinite_bar;
    } else if (!(lineSS >> beginn >> endd)) {
      continue;
    }

    if (beginn > endd) std::swap(beginn, endd);
    barcode.push_back(std::make_pair(beginn, endd));
  }
  return barcode;
}  // read_persistence_file_that_may_contain_inf_string

/**
 * This procedure reads names of files which are stored in a file, one name per line.
 * All white spaces are removed from every line. Lines which are then empty, or which start with '#',
 * are ignored.
 * Throws a `const char*` message if the file does not exist or cannot be opened.
 **/
inline std::vector< std::string > readFileNames(const char* filenameWithFilenames) {
  std::ifstream in;
  read_persistence_internal::open_file_or_throw(
      in, filenameWithFilenames,
      "The file from which you are trying to read do not exist. The program will now terminate \n");

  std::vector< std::string > result;
  std::string line;
  while (std::getline(in, line)) {
    // std::isspace must be given a value representable as unsigned char, hence the parameter type.
    line.erase(std::remove_if(line.begin(), line.end(),
                              [](unsigned char c) { return std::isspace(c) != 0; }),
               line.end());
    if (line.empty() || line[0] == '#') continue;
    result.push_back(line);
  }
  return result;
}  // readFileNames

/**
 * This method reads persistence from a standalone file. The format of the file is as follows:
 * in every line there are two numbers which denote birth and death of a persistence interval.
 * Empty lines and lines starting with '#' are ignored. Symbols like 'inf' are not allowed; lines from
 * which two numbers cannot be read are skipped.
 * Intervals with birth equal to death are skipped.
 * If the begin of an interval is greater than its end, the two numbers are swapped.
 * Throws a `const char*` message if the file does not exist or cannot be opened.
 **/
inline std::vector< std::pair< double, double > > read_standard_persistence_file(const char* filename) {
  std::ifstream in;
  read_persistence_internal::open_file_or_throw(
      in, filename,
      "The file from which you are trying to read the persistence landscape do not exist. The program will now terminate \n");

  std::vector< std::pair< double, double > > barcode;
  std::string line;
  while (std::getline(in, line)) {
    if (line.empty() || line[0] == '#') continue;

    std::istringstream lineSS(line);
    double beginn = 0;
    double endd = 0;
    if (!(lineSS >> beginn >> endd)) continue;
    if (beginn == endd) continue;

    if (beginn > endd) std::swap(beginn, endd);
    barcode.push_back(std::make_pair(beginn, endd));
  }
  return barcode;
}  // read_standard_persistence_file

/**
 * This procedure reads a Gudhi style file. Each line of a Gudhi style file consists of:
 * a number p indicating the field Z_p over which the class is nontrivial,
 * the dimension of the persistence class,
 * the birth and the death time of the class.
 * The death time may be infinite, in which case the string 'inf' is used. Such lines are ignored when the
 * third parameter is -1 (the default); otherwise the death time is substituted by the third parameter.
 * Empty lines and lines starting with '#' are ignored, and lines from which the required numbers cannot
 * be read are skipped.
 * If the begin of an interval is greater than its end, the two numbers are swapped.
 * Note that this procedure reads persistence in a single dimension: only intervals whose dimension is
 * equal to the second parameter are returned.
 * Throws a `const char*` message if the file does not exist or cannot be opened.
 **/
inline std::vector< std::pair< double, double > > read_gudhi_persistence_file_in_one_dimension(
    const char* filename, size_t dimension = 0, double what_to_substitute_for_infinite_bar = -1) {
  std::ifstream in;
  read_persistence_internal::open_file_or_throw(
      in, filename,
      "The file from which you are trying to read the persistence landscape do not exist. The program will now terminate \n");

  std::vector< std::pair< double, double > > barcode;
  std::string line;
  while (std::getline(in, line)) {
    if (line.empty() || line[0] == '#') continue;

    const bool is_infinite = (line.find("inf") != std::string::npos);
    if (is_infinite && what_to_substitute_for_infinite_bar == -1) continue;

    std::istringstream lineSS(line);
    double field = 0;
    double dim = 0;
    double beginn = 0;
    double endd = what_to_substitute_for_infinite_bar;
    if (!(lineSS >> field >> dim >> beginn)) continue;
    if (!is_infinite && !(lineSS >> endd)) continue;

    if (dim != static_cast<double>(dimension)) continue;
    if (beginn > endd) std::swap(beginn, endd);
    barcode.push_back(std::make_pair(beginn, endd));
  }
  return barcode;
}  // read_gudhi_persistence_file_in_one_dimension

/**
 * This procedure reads a file line by line and returns, for every line, the vector of the leading numbers
 * of that line. Reading of a line stops at the first token which is not a number. Lines which do not
 * start with a number (in particular empty lines) do not contribute to the result.
 * Throws a `const char*` message if the file does not exist or cannot be opened.
 **/
inline std::vector< std::vector< double > > read_numbers_from_file_line_by_line(const char* filename) {
  std::ifstream in;
  read_persistence_internal::open_file_or_throw(
      in, filename,
      "The file from which you are trying to read the persistence landscape do not exist. The program will now terminate \n");

  std::vector< std::vector< double > > result;
  std::string line;
  while (std::getline(in, line)) {
    std::istringstream ss(line);
    std::vector< double > this_line;
    double number = 0;
    // A value is stored only after a successful extraction, so trailing white spaces do not
    // produce spurious entries.
    while (ss >> number) {
      this_line.push_back(number);
    }
    if (!this_line.empty()) result.push_back(this_line);
  }
  return result;
}  // read_numbers_from_file_line_by_line

/**
 * Universal procedure to read files with persistence. It ignores empty lines and the lines starting
 * with # (treats them as comments).
 * It reads the first line which is not a comment and counts the numerical entries in it (the string 'inf'
 * counts as an entry). The procedure assumes that every other line in the file which is not a comment
 * has the same number of entries.
 * If there are two entries per line, they are assumed to be birth/death coordinates.
 * If there are three entries per line, they are assumed to be: dimension and birth/death coordinates.
 * If there are four entries per line, they are assumed to be: the characteristic of the field over which
 * persistence was computed, dimension and birth/death coordinates.
 * Any other number of entries makes the procedure throw a `const char*` message.
 *
 * Lines containing 'inf' are ignored when what_to_substitute_for_infinite_bar is -1 (the default);
 * otherwise the death time is substituted by that value. Lines from which the required numbers cannot be
 * read are skipped. If the begin of an interval is greater than its end, the two numbers are swapped.
 *
 * When the file has a dimension column, only the intervals whose dimension is equal to the `dimension`
 * parameter are returned (this includes the default value -1, which is compared like any other value).
 * When there are two entries per line, all the intervals are returned.
 *
 * Throws a `const char*` message if the file does not exist or cannot be opened.
 * The procedure returns a vector of persistence pairs.
 **/
inline std::vector< std::pair< double, double > > read_persistence_intervals_in_one_dimension_from_file(
    std::string const& filename, int dimension = -1, double what_to_substitute_for_infinite_bar = -1) {
  std::ifstream in;
  read_persistence_internal::open_file_or_throw(
      in, filename.c_str(),
      "The file from which you are trying to read the persistence landscape do not exist. The program will now terminate \n");

  std::vector< std::pair< double, double > > barcode;
  int number_of_entries_per_line = -1;
  std::string line;
  while (std::getline(in, line)) {
    if (line.empty() || line[0] == '#') continue;

    if (number_of_entries_per_line == -1) {
      // The first data line determines the layout of the whole file.
      number_of_entries_per_line = read_persistence_internal::count_entries_in_line(line);
      if ((number_of_entries_per_line < 2) || (number_of_entries_per_line > 4)) {
        std::cerr << "The input file you have provided have wrong number of numerical entries per line. The program will now terminate. \n";
        throw "The input file you have provided have wrong number of numerical entries per line. The program will now terminate. \n";
      }
    }

    const bool is_infinite = (line.find("inf") != std::string::npos);
    if (is_infinite && what_to_substitute_for_infinite_bar == -1) continue;

    std::istringstream lineSS(line);
    double field = 0;
    // Without a dimension column every line is considered to be in the requested dimension.
    double dim = dimension;
    double beginn = 0;
    double endd = what_to_substitute_for_infinite_bar;
    if (number_of_entries_per_line == 4) lineSS >> field;
    if (number_of_entries_per_line >= 3) lineSS >> dim;
    // If one of the extractions above failed, the stream is in a failed state and this one fails too.
    if (!(lineSS >> beginn)) continue;
    if (!is_infinite && !(lineSS >> endd)) continue;

    if (dim != dimension) continue;
    if (beginn > endd) std::swap(beginn, endd);
    barcode.push_back(std::make_pair(beginn, endd));
  }
  return barcode;
}  // read_persistence_intervals_in_one_dimension_from_file

}  // namespace Gudhi_stat
}  // namespace Gudhi

#endif