/* * Dataset.hpp, part of LatAnalyze 3 * * Copyright (C) 2013 - 2014 Antonin Portelli * * LatAnalyze 3 is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * LatAnalyze 3 is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with LatAnalyze 3. If not, see . */ #ifndef Latan_Dataset_hpp_ #define Latan_Dataset_hpp_ #include #include #include #include #include #include BEGIN_NAMESPACE /****************************************************************************** * Dataset class * ******************************************************************************/ template class Dataset: public StatArray { private: typedef StatArray Base; public: // constructor using Base::Base; Dataset(void); Dataset(const std::string &listFileName, const std::string &dataName); template Dataset(const Eigen::EigenBase &dataset); // destructor virtual ~Dataset(void); // IO void load(const std::string &listFileName, const std::string &dataName); // resampling Sample bootstrapMean(const unsigned int nSample, RandGen& generator); private: // mean from pointer vector for resampling void ptVectorMean(T &m, const std::vector &v); private: FileType file_; }; /****************************************************************************** * Dataset template implementation * ******************************************************************************/ // constructor ///////////////////////////////////////////////////////////////// template Dataset::Dataset(void) {} template Dataset::Dataset(const std::string &listFileName, const std::string &dataName) { load(listFileName, dataName); } // destructor ////////////////////////////////////////////////////////////////// template Dataset::~Dataset(void) {} // IO ////////////////////////////////////////////////////////////////////////// template void Dataset::load(const std::string &listFileName, const std::string &dataName) { std::ifstream listFile; char dataFileNameBuf[MAX_PATH_LENGTH]; std::vector dataFileName; listFile.open(listFileName, std::ios::in); while (!listFile.eof()) { listFile.getline(dataFileNameBuf, MAX_PATH_LENGTH); if (!std::string(dataFileNameBuf).empty()) { dataFileName.push_back(dataFileNameBuf); } } listFile.close(); this->resize(dataFileName.size()); for (unsigned int i = 0; i < dataFileName.size(); ++i) { file_.open(dataFileName[i], File::Mode::read); (*this)[i] = file_.template read(dataName); file_.close(); } } // resampling ////////////////////////////////////////////////////////////////// template Sample Dataset::bootstrapMean(const unsigned int nSample, RandGen& generator) { unsigned int nData = this->size(); std::vector data(nData); Sample s(nSample); for (unsigned int j = 0; j < nData; ++j) { data[j] = &((*this)[j]); } ptVectorMean(s[central], data); for (unsigned int i = 0; i < nSample; ++i) { for (unsigned int j = 0; j < nData; ++j) { data[j] = &((*this)[generator.discreteUniform(nData)]); } ptVectorMean(s[i], data); } return s; } template void Dataset::ptVectorMean(T &m, const std::vector &v) { if (v.size()) { m = *(v[0]); for (unsigned int i = 1; i < v.size(); ++i) { m += *(v[i]); } m /= static_cast(v.size()); } } END_NAMESPACE #endif // Latan_Dataset_hpp_