1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189
|
/*
* Copyright 2009- ECMWF.
*
* This software is licensed under the terms of the Apache Licence version 2.0
* which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
* In applying this licence, ECMWF does not waive the privileges and immunities
* granted to it by virtue of its status as an intergovernmental organisation
* nor does it submit to any jurisdiction.
*/
#include <iostream>
#include <string>
#include <vector>
#include "ecflow/attribute/Variable.hpp"
#include "ecflow/core/File.hpp"
#include "ecflow/core/Log.hpp"
#include "ecflow/core/Str.hpp"
#include "ecflow/node/Defs.hpp"
#include "ecflow/node/JobProfiler.hpp"
#include "ecflow/node/Jobs.hpp"
#include "ecflow/node/JobsParam.hpp"
#include "ecflow/node/Task.hpp"
using namespace std;
using namespace ecf;
// #define DEBUG 1
// This relies on Pyext/samples/TestJobGenPerf.py to make any defs amenable
// for this test program.
//
// The defs is in /var/tmp/ma0/ECFLOW_TEST/TestJobGenPerf
//
// Timing for /var/tmp/ma0/DEFS/metabuilder.def
// First/base point: real:10.15 user: 5.58 sys: 1.62
// After ECFLOW-846: real: 4.46 user: 3.72 sys: 0.74 # Only open/close include file once
// After ECFLOW-864: real: 4.36 user: 3.68 sys: 0.68 # minimise stat calls
//
// strace -c ./Base/bin/gcc-4.8/release/perf_job_gen ./metabuilder.def
//
// % time seconds usecs/call calls errors syscall
// ------ ----------- ----------- --------- --------- ----------------
// Before ECFLOW-864: 22.77 0.001159 0 132329 50737 stat
// After ECFLOW-864: 21.35 0.001097 0 125644 50737 stat
//
//
// After ECFLOW-1244:
// - cacheing of stat of include files
// - re-arranging EcfFile data member for hotness
// - re-arrange search for generation variables, most common first
// - replace ecffile_->countEcfMicro _. EcfFile::countEcfMicro(..) remove reference since function is static
//
// time Base/bin/gcc-5.3.0/release/perf_job_gen ./metabuilder.def : submitted 5808 out of 7941( fastest of 10 attempts)
// - ECFLOW-1244: real: 2.84s user: 2.41s sys: 0.40s
//
// perf stat -r 10 -d Base/bin/gcc-5.3.0/release/perf_job_gen ./metabuilder.def
// Performance counter stats for 'Base/bin/gcc-5.3.0/release/perf_job_gen ./metabuilder.def' (10 runs):
//
// 2908.895909 task-clock (msec) # 0.933 CPUs utilized ( +- 1.02% )
// 89 context-switches # 0.031 K/sec ( +- 7.13% )
// 2 cpu-migrations # 0.001 K/sec ( +- 25.00% )
// 11,500 page-faults # 0.004 M/sec ( +- 0.03% )
// 10,900,694,824 cycles # 3.747 GHz ( +- 0.93% ) (37.44%)
// 4,810,738,973 stalled-cycles-frontend # 44.13% frontend cycles idle ( +- 2.34% ) (49.98%)
// <not supported> stalled-cycles-backend
// 13,845,775,843 instructions # 1.27 insns per cycle
// # 0.35 stalled cycles per insn ( +- 0.03% ) (62.51%)
// 3,777,695,721 branches # 1298.670 M/sec ( +- 0.05% ) (62.56%)
// 107,367,375 branch-misses # 2.84% of all branches ( +- 0.15% ) (62.70%)
// 3,410,593,440 L1-dcache-loads # 1172.470 M/sec ( +- 0.09% ) (49.60%)
// 260,536,494 L1-dcache-load-misses # 7.64% of all L1-dcache hits ( +- 0.13% ) (24.94%)
// 101,191,979 LLC-loads # 34.787 M/sec ( +- 0.20% ) (24.90%)
// <not supported> LLC-load-misses
//
// 3.118979324 seconds time elapsed ( +- 2.80% )
int main(int argc, char* argv[]) {
if (argc != 2) {
cout << "TestJobGenPerf.cpp --> " << argv[0] << "\n";
cout << "Expect single argument which is path to a defs file\n";
return 1;
}
// delete the log file if it exists.
std::string log_path = File::test_data("Base/test/TestJobGenPerf.log", "Base");
fs::remove(log_path);
std::string path = argv[1];
#ifdef DEBUG
cout << "Loading file " << path << " log file " << log_path << "\n";
#endif
Defs defs;
std::string errorMsg, warningMsg;
if (!defs.restore(path, errorMsg, warningMsg)) {
cout << errorMsg << "\n";
cout << warningMsg << "\n";
return 1;
}
// std::vector<std::string> suites_to_remove;
// suites_to_remove.push_back("codes_ui");
// suites_to_remove.push_back("libemos_test");
// suites_to_remove.push_back("metview");
// suites_to_remove.push_back("ecflow");
// suites_to_remove.push_back("mir_bundle");
// #ifdef DEBUG
// cout << "remove dodgy suites, these are based on localhost\n";
// #endif
// for(size_t i = 0; i < suites_to_remove.size(); ++i) {
// suite_ptr suite = defs.findSuite(suites_to_remove[i]);
// if (suite) suite->remove();
// }
// cout << defs ;
// exit(0);
// Check number of tasks, if the submitted output below is too low
std::vector<Task*> tasks;
defs.getAllTasks(tasks);
// #ifdef DEBUG
// cout << "Total number of tasks: " << tasks.size() << "\n";
// cout << "begin-all\n";
// #endif
defs.beginAll();
// #ifdef DEBUG
// cout << "Free all dependencies, free suspended time and trigger dependencies\n";
// #endif
std::vector<node_ptr> all_nodes;
defs.get_all_nodes(all_nodes);
for (size_t i = 0; i < all_nodes.size(); ++i) {
if (all_nodes[i]->isSuspended()) {
all_nodes[i]->resume();
}
all_nodes[i]->freeTrigger();
all_nodes[i]->freeHoldingDateDependencies();
all_nodes[i]->freeHoldingTimeDependencies();
const std::vector<InLimit>& inlimits = all_nodes[i]->inlimits();
for (const auto& inlim : inlimits) {
all_nodes[i]->deleteInlimit(inlim.name());
}
if (all_nodes[i]->state() == NState::COMPLETE && all_nodes[i]->isTask()) {
all_nodes[i]->set_state(NState::QUEUED);
}
}
// Create a new log, file, place after begin to avoid queued state
TestLog test_log(log_path); // will create log file, and destroy log and remove file at end of scope
// This controls the log output when job generation > submitJobsInterval
JobProfiler::set_task_threshold(100); // 100ms where 1000ms is one second
JobsParam jobParam(20 /*submitJobsInterval*/, true /*createJobs*/, false /* spawn jobs */);
Jobs job(&defs);
if (!job.generate(jobParam)) {
cout << " generate failed: " << jobParam.getErrorMsg();
}
cout << "submitted " << jobParam.submitted().size() << " out of " << tasks.size() << "\n";
if (jobParam.submitted().size() != tasks.size()) {
for (size_t i = 0; i < tasks.size(); i++) {
if (tasks[i]->state() != NState::SUBMITTED &&
tasks[i]->findVariable("ECF_DUMMY_TASK") == Variable::EMPTY()) {
// We are NOT a dummy task
cout << "task " << tasks[i]->absNodePath() << " state: " << NState::toString(tasks[i]->state()) << "\n";
Node* parent = tasks[i]->parent();
while (parent) {
cout << " node " << parent->absNodePath() << " state: " << NState::toString(parent->state())
<< "\n";
parent = parent->parent();
}
std::vector<std::string> theReasonWhy;
tasks[i]->bottom_up_why(theReasonWhy, false /*html tags*/);
for (const auto& r : theReasonWhy) {
cout << " Reason: " << r << "\n";
}
}
}
}
return 0;
}
|