From fd404406e6b65d6d2e195ee91d693068e50fbff7 Mon Sep 17 00:00:00 2001 From: Giovanni Bussi <giovanni.bussi@gmail.com> Date: Wed, 8 Jan 2014 10:10:57 +0100 Subject: [PATCH] Implementation of zlib Files with gz extension are transparently compressed and decompressed. Closes #17 --- src/config/Config.cpp.in | 9 ++++++ src/config/Config.h | 2 ++ src/core/CLToolMain.cpp | 2 ++ src/tools/FileBase.cpp | 57 +++++++++++++++++++++++---------- src/tools/FileBase.h | 8 ++++- src/tools/IFile.cpp | 23 ++++++++++++-- src/tools/OFile.cpp | 68 +++++++++++++++++++++++++++++++++++++--- src/tools/OFile.h | 2 ++ 8 files changed, 146 insertions(+), 25 deletions(-) diff --git a/src/config/Config.cpp.in b/src/config/Config.cpp.in index 4c326f277..5c850d41a 100644 --- a/src/config/Config.cpp.in +++ b/src/config/Config.cpp.in @@ -86,6 +86,15 @@ bool hasMolfile(){ #endif } +bool hasZlib(){ +#if __PLUMED_HAS_ZLIB + return true; +#else + return false; +#endif +} + + } diff --git a/src/config/Config.h b/src/config/Config.h index 81d7fc78b..c1f36f63f 100644 --- a/src/config/Config.h +++ b/src/config/Config.h @@ -45,6 +45,8 @@ bool hasCregex(); bool hasMolfile(); +bool hasZlib(); + } } diff --git a/src/core/CLToolMain.cpp b/src/core/CLToolMain.cpp index 1d2fa942c..790e04dfa 100644 --- a/src/core/CLToolMain.cpp +++ b/src/core/CLToolMain.cpp @@ -128,6 +128,8 @@ int CLToolMain::run(int argc, char **argv,FILE*in,FILE*out,Communicator& pc){ return (config::hasDlopen()?0:1); } else if(a=="--has-molfile"){ return (config::hasMolfile()?0:1); + } else if(a=="--has-zlib"){ + return (config::hasZlib()?0:1); } else if(a=="--is-installed"){ return (config::isInstalled()?0:1); } else if(a=="--no-mpi"){ diff --git a/src/tools/FileBase.cpp b/src/tools/FileBase.cpp index 7dd31845e..0df6860be 100644 --- a/src/tools/FileBase.cpp +++ b/src/tools/FileBase.cpp @@ -32,6 +32,10 @@ #include <iostream> #include <string> +#ifdef __PLUMED_HAS_ZLIB +#include <zlib.h> +#endif + namespace PLMD{ void FileBase::test(){ @@ -69,11 +73,7 @@ FileBase& FileBase::link(FILE*fp){ } FileBase& FileBase::flush(){ - fflush(fp); - if(heavyFlush){ - fclose(fp); - fp=std::fopen(const_cast<char*>(path.c_str()),"a"); - } + if(fp) fflush(fp); return *this; } @@ -102,16 +102,17 @@ FileBase& FileBase::open(const std::string& path,const std::string& mode){ eof=false; err=false; fp=NULL; - if(plumed){ - this->path=path+plumed->getSuffix(); - fp=std::fopen(const_cast<char*>(this->path.c_str()),const_cast<char*>(mode.c_str())); - } - if(!fp){ - this->path=path; - fp=std::fopen(const_cast<char*>(this->path.c_str()),const_cast<char*>(mode.c_str())); + gzfp=NULL; + bool do_exist=FileExist(path); + fp=std::fopen(const_cast<char*>(this->path.c_str()),const_cast<char*>(mode.c_str())); + if(Tools::extension(this->path)=="gz"){ +#ifdef __PLUMED_HAS_ZLIB + gzfp=(void*)gzopen(const_cast<char*>(this->path.c_str()),const_cast<char*>(mode.c_str())); +#else + plumed_merror("trying to use a gz file without zlib being linked"); +#endif } if(plumed) plumed->insertFile(*this); - plumed_massert(fp,"file " + path + "cannot be found"); return *this; } @@ -120,7 +121,7 @@ bool FileBase::FileExist(const std::string& path){ FILE *ff=NULL; bool do_exist=false; if(plumed){ - this->path=path+plumed->getSuffix(); + this->path=appendSuffix(path,plumed->getSuffix()); ff=std::fopen(const_cast<char*>(this->path.c_str()),"r"); } if(!ff){ @@ -142,12 +143,17 @@ void FileBase::close(){ plumed_assert(!cloned); eof=false; err=false; - std::fclose(fp); + if(fp) std::fclose(fp); +#ifdef __PLUMED_HAS_ZLIB + if(gzfp) gzclose(gzFile(gzfp)); +#endif fp=NULL; + gzfp=NULL; } FileBase::FileBase(): fp(NULL), + gzfp(NULL), comm(NULL), plumed(NULL), action(NULL), @@ -161,11 +167,30 @@ FileBase::FileBase(): FileBase::~FileBase() { if(plumed) plumed->eraseFile(*this); - if(!cloned && fp) fclose(fp); + if(!cloned && fp) fclose(fp); +#ifdef __PLUMED_HAS_ZLIB + if(!cloned && gzfp) gzclose(gzFile(gzfp)); +#endif } FileBase::operator bool()const{ return !eof; } +std::string FileBase::appendSuffix(const std::string&path,const std::string&suffix){ + std::string ret=path; + std::string ext=Tools::extension(path); + if(ext=="gz"){ + int l=path.length()-3; + plumed_assert(l>=0); + ret=ret.substr(0,l); + } + ret+=suffix; + if(ext=="gz")ret+=".gz"; + return ret; +} + + + + } diff --git a/src/tools/FileBase.h b/src/tools/FileBase.h index 0ab890fe1..2cbd3b499 100644 --- a/src/tools/FileBase.h +++ b/src/tools/FileBase.h @@ -55,6 +55,8 @@ protected: /// file pointer FILE* fp; +/// zip file pointer. + void* gzfp; /// communicator. NULL if not set Communicator* comm; /// pointer to main plumed object. NULL if not linked @@ -75,6 +77,10 @@ protected: std::string path; /// Set to true if you want flush to be heavy (close/reopen) bool heavyFlush; +/// Append suffix. +/// It appends the desired suffix to the string. Notice that +/// it conserves a possible ".gz" suffix. + static std::string appendSuffix(const std::string&path,const std::string&suffix); public: /// Link to an already open filed FileBase& link(FILE*); @@ -87,7 +93,7 @@ public: /// Automatically links also the corresponding PlumedMain and Communicator. FileBase& link(Action&); /// Flushes the file to disk - FileBase& flush(); + virtual FileBase& flush(); /// Closes the file /// Should be used only for explicitely opened files. void close(); diff --git a/src/tools/IFile.cpp b/src/tools/IFile.cpp index 00e9ca30b..fc95ecfe3 100644 --- a/src/tools/IFile.cpp +++ b/src/tools/IFile.cpp @@ -31,15 +31,29 @@ #include <iostream> #include <string> +#ifdef __PLUMED_HAS_ZLIB +#include <zlib.h> +#endif namespace PLMD{ size_t IFile::llread(char*ptr,size_t s){ plumed_assert(fp); size_t r; - r=fread(ptr,1,s,fp); - if(feof(fp)) eof=true; - if(ferror(fp)) err=true; + if(gzfp){ +#ifdef __PLUMED_HAS_ZLIB + int rr=gzread(gzFile(gzfp),ptr,s); + if(rr==0) eof=true; + if(rr<0) err=true; + r=rr; +#else + plumed_merror("trying to use a gz file without zlib being linked"); +#endif + } else { + r=fread(ptr,1,s,fp); + if(feof(fp)) eof=true; + if(ferror(fp)) err=true; + } return r; } @@ -193,6 +207,9 @@ void IFile::reset(bool reset){ eof = reset; err = reset; if(!reset) clearerr(fp); +#ifdef __PLUMED_HAS_ZLIB + if(!reset && gzfp) gzclearerr(gzFile(gzfp)); +#endif return; } diff --git a/src/tools/OFile.cpp b/src/tools/OFile.cpp index 55f6ac6a9..8d8ce53b3 100644 --- a/src/tools/OFile.cpp +++ b/src/tools/OFile.cpp @@ -34,6 +34,10 @@ #include <cstdlib> #include <cerrno> +#ifdef __PLUMED_HAS_ZLIB +#include <zlib.h> +#endif + namespace PLMD{ size_t OFile::llwrite(const char*ptr,size_t s){ @@ -41,7 +45,15 @@ size_t OFile::llwrite(const char*ptr,size_t s){ if(linked) return linked->llwrite(ptr,s); if(! (comm && comm->Get_rank()>0)){ if(!fp) plumed_merror("writing on uninitilized File"); - r=fwrite(ptr,1,s,fp); + if(gzfp){ +#ifdef __PLUMED_HAS_ZLIB + r=gzwrite(gzFile(gzfp),ptr,s); +#else + plumed_merror("trying to use a gz file without zlib being linked"); +#endif + } else { + r=fwrite(ptr,1,s,fp); + } } if(comm) comm->Bcast(r,0); return r; @@ -70,6 +82,7 @@ OFile::~OFile(){ OFile& OFile::link(OFile&l){ fp=NULL; + gzfp=NULL; linked=&l; return *this; } @@ -222,7 +235,7 @@ void OFile::setBackupString( const std::string& str ){ void OFile::backupAllFiles( const std::string& str ){ plumed_assert( backstring!="bck" && plumed && !plumed->getRestart() ); size_t found=str.find_last_of("/\\"); - std::string filename = str + plumed->getSuffix(); + std::string filename = appendSuffix(str,plumed->getSuffix()); std::string directory=filename.substr(0,found+1); std::string file=filename.substr(found+1); if( FileExist(filename) ) backupFile("bck", filename); @@ -266,16 +279,31 @@ OFile& OFile::open(const std::string&path){ eof=false; err=false; fp=NULL; + gzfp=NULL; this->path=path; if(plumed){ - this->path+=plumed->getSuffix(); + this->path=appendSuffix(path,plumed->getSuffix()); } if(plumed && plumed->getRestart()){ fp=std::fopen(const_cast<char*>(this->path.c_str()),"a"); + if(Tools::extension(this->path)=="gz"){ +#ifdef __PLUMED_HAS_ZLIB + gzfp=(void*)gzopen(const_cast<char*>(this->path.c_str()),"a9"); +#else + plumed_merror("trying to use a gz file without zlib being linked"); +#endif + } } else { backupFile( backstring, this->path ); if(comm)comm->Barrier(); fp=std::fopen(const_cast<char*>(this->path.c_str()),"w"); + if(Tools::extension(this->path)=="gz"){ +#ifdef __PLUMED_HAS_ZLIB + gzfp=(void*)gzopen(const_cast<char*>(this->path.c_str()),"w9"); +#else + plumed_merror("trying to use a gz file without zlib being linked"); +#endif + } } if(plumed) plumed->insertFile(*this); return *this; @@ -286,8 +314,38 @@ OFile& OFile::rewind(){ // the reason is that normal rewind does not work when in append mode plumed_assert(fp); clearFields(); - fclose(fp); - fp=std::fopen(const_cast<char*>(path.c_str()),"w"); + if(gzfp){ +#ifdef __PLUMED_HAS_ZLIB + gzclose((gzFile)gzfp); + gzfp=(void*)gzopen(const_cast<char*>(this->path.c_str()),"w9"); +#endif + } else { + fclose(fp); + fp=std::fopen(const_cast<char*>(path.c_str()),"w"); + } + return *this; +} + +FileBase& OFile::flush(){ + if(heavyFlush){ + if(gzfp){ +#ifdef __PLUMED_HAS_ZLIB + gzclose(gzFile(gzfp)); + gzfp=(void*)gzopen(const_cast<char*>(path.c_str()),"a"); +#endif + } else{ + fclose(fp); + fp=std::fopen(const_cast<char*>(path.c_str()),"a"); + } + } else { + FileBase::flush(); + // if(gzfp) gzflush(gzFile(gzfp),Z_FINISH); + // for some reason flushing with Z_FINISH has problems on linux + // I thus use this (incomplete) flush +#ifdef __PLUMED_HAS_ZLIB + if(gzfp) gzflush(gzFile(gzfp),Z_FULL_FLUSH); +#endif + } return *this; } diff --git a/src/tools/OFile.h b/src/tools/OFile.h index cad69614b..7ae4ffc0a 100644 --- a/src/tools/OFile.h +++ b/src/tools/OFile.h @@ -186,6 +186,8 @@ this method can be used to clean the field list. friend OFile& operator<<(OFile&,const T &); /// Rewind a file OFile&rewind(); +/// Flush a file + virtual FileBase&flush(); }; /// Write using << syntax -- GitLab