/* * Dataset.hpp, part of LatAnalyze 3 * * Copyright (C) 2013 - 2014 Antonin Portelli * * LatAnalyze 3 is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * LatAnalyze 3 is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with LatAnalyze 3. If not, see . */ #ifndef Latan_Dataset_hpp_ #define Latan_Dataset_hpp_ #include #include #include #include #include #include BEGIN_NAMESPACE /****************************************************************************** * Dataset class * ******************************************************************************/ template class Dataset: public StatArray { public: // constructors Dataset(void) = default; Dataset(const Index size); template Dataset(const std::string &listFileName, const std::string &dataName); EIGEN_EXPR_CTOR(Dataset, Dataset, StatArray, ArrayExpr) // destructor virtual ~Dataset(void) = default; // IO template void load(const std::string &listFileName, const std::string &dataName); // resampling Sample bootstrapMean(const Index nSample, RandGen& generator); private: // mean from pointer vector for resampling void ptVectorMean(T &m, const std::vector &v); }; /****************************************************************************** * Dataset template implementation * ******************************************************************************/ // constructors //////////////////////////////////////////////////////////////// template Dataset::Dataset(const Index size) : StatArray(size) {} template template Dataset::Dataset(const std::string &listFileName, const std::string &dataName) { load(listFileName, dataName); } // IO ////////////////////////////////////////////////////////////////////////// template template void Dataset::load(const std::string &listFileName, const std::string &dataName) { FileType file; std::ifstream listFile; char dataFileNameBuf[MAX_PATH_LENGTH]; std::vector dataFileName; listFile.open(listFileName, std::ios::in); while (!listFile.eof()) { listFile.getline(dataFileNameBuf, MAX_PATH_LENGTH); if (!std::string(dataFileNameBuf).empty()) { dataFileName.push_back(dataFileNameBuf); } } listFile.close(); this->resize(dataFileName.size()); for (Index i = 0; i < static_cast(dataFileName.size()); ++i) { file.open(dataFileName[i], File::Mode::read); (*this)[i] = file.template read(dataName); file.close(); } } // resampling ////////////////////////////////////////////////////////////////// template Sample Dataset::bootstrapMean(const Index nSample, RandGen& generator) { Index nData = this->size(); std::vector data(nData); Sample s(nSample); for (Index j = 0; j < nData; ++j) { data[j] = &((*this)[j]); } ptVectorMean(s[central], data); for (Index i = 0; i < nSample; ++i) { for (Index j = 0; j < nData; ++j) { data[j] = &((*this)[generator.discreteUniform(nData)]); } ptVectorMean(s[i], data); } return s; } template void Dataset::ptVectorMean(T &m, const std::vector &v) { if (v.size()) { m = *(v[0]); for (unsigned int i = 1; i < v.size(); ++i) { m += *(v[i]); } m /= static_cast(v.size()); } } END_NAMESPACE #endif // Latan_Dataset_hpp_