1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115
|
/***********************************************/
/**
* @file loopFileLines.h
*
* @brief Loop over lines of a text file.
*
* @author Torsten Mayer-Guerr
* @date 2023-05-31
*
*/
/***********************************************/
#ifndef __GROOPS_LOOPFILELINES__
#define __GROOPS_LOOPFILELINES__
// Latex documentation
#ifdef DOCSTRING_Loop
static const char *docstringLoopFileLines = R"(
\subsection{FileLines}
Loop over lines of a text file.
)";
#endif
/***********************************************/
#include "base/import.h"
#include "inputOutput/file.h"
#include "classes/loop/loop.h"
#include <unordered_set>
/***** CLASS ***********************************/
/** @brief Loop over lines of a text file.
* @ingroup loopGroup
* @see Loop */
class LoopFileLines : public Loop
{
std::string nameLine, nameIndex, nameCount;
std::vector<std::string> lines;
public:
LoopFileLines(Config &config);
UInt count() const override {return lines.size();}
Bool iteration(VariableList &varList) override;
};
/***********************************************/
/***** Inlines *********************************/
/***********************************************/
inline LoopFileLines::LoopFileLines(Config &config)
{
try
{
std::vector<FileName> fileNames;
UInt startIndex;
UInt countElements = MAX_UINT;
Bool sort;
Bool removeDuplicates;
readConfig(config, "inputfile", fileNames, Config::MUSTSET, "", "simple ASCII file with lines");
readConfig(config, "sort", sort, Config::DEFAULT, "0", "sort lines alphabetically (ascending)");
readConfig(config, "removeDuplicates", removeDuplicates, Config::DEFAULT, "0", "remove duplicate lines (order is preserved)");
readConfig(config, "startIndex", startIndex, Config::DEFAULT, "0", "start at element startIndex (counting from 0)");
readConfig(config, "count", countElements, Config::OPTIONAL, "", "use number of lines only (default: use all)");
readConfig(config, "variableLoopLine", nameLine, Config::OPTIONAL, "loopLine", "name of the variable to be replaced");
readConfig(config, "variableLoopIndex", nameIndex, Config::OPTIONAL, "", "variable with index of current iteration (starts with zero)");
readConfig(config, "variableLoopCount", nameCount, Config::OPTIONAL, "", "variable with total number of iterations");
readConfigCondition(config);
if(isCreateSchema(config)) return;
for(auto &fileName : fileNames)
{
InFile file(fileName);
std::string line;
while(std::getline(file, line))
lines.push_back(line);
}
if(sort)
std::sort(lines.begin(), lines.end());
if(removeDuplicates)
{
std::unordered_set<std::string> set;
lines.erase(std::copy_if(lines.begin(), lines.end(), lines.begin(), [&set](auto &s) {return set.insert(s).second;}), lines.end());
}
lines.erase(lines.begin(), lines.begin()+std::min(startIndex, lines.size()));
lines.erase(lines.begin()+std::min(countElements, lines.size()), lines.end());
}
catch(std::exception &e)
{
GROOPS_RETHROW(e)
}
}
/***********************************************/
inline Bool LoopFileLines::iteration(VariableList &varList)
{
if(index() >= count())
return FALSE;
if(!nameLine.empty()) varList.setVariable(nameLine, lines.at(index()));
if(!nameIndex.empty()) varList.setVariable(nameIndex, index());
if(!nameCount.empty()) varList.setVariable(nameCount, count());
return checkCondition(varList);
}
/***********************************************/
#endif
|