refactor(GridFire): updated outputs
This commit is contained in:
@@ -15,11 +15,15 @@
|
||||
|
||||
#include "quill/Logger.h"
|
||||
#include "quill/Backend.h"
|
||||
#include "nlohmann/json.hpp"
|
||||
|
||||
#include <clocale>
|
||||
|
||||
#include <sys/utsname.h>
|
||||
|
||||
#include "gridfire/reaction/reaclib.h"
|
||||
#include "gridfire/utils/gf_omp.h"
|
||||
#include "gridfire/utils/config.h"
|
||||
|
||||
gridfire::NetIn init(const double temp, const double rho, const double tMax) {
|
||||
std::setlocale(LC_ALL, "");
|
||||
@@ -63,97 +67,157 @@ int main() {
|
||||
std::println("Scratch Blob State: {}", *construct.scratch_blob);
|
||||
|
||||
|
||||
constexpr size_t runs = 10;
|
||||
auto startTime = std::chrono::high_resolution_clock::now();
|
||||
constexpr size_t runs = 100;
|
||||
nlohmann::json results;
|
||||
nlohmann::json metadata;
|
||||
|
||||
// arrays to store timings
|
||||
std::array<std::chrono::duration<double>, runs> setup_times;
|
||||
std::array<std::chrono::duration<double>, runs> eval_times;
|
||||
std::array<NetOut, runs> serial_results;
|
||||
for (size_t i = 0; i < runs; ++i) {
|
||||
auto start_setup_time = std::chrono::high_resolution_clock::now();
|
||||
solver::PointSolverContext solverCtx(*construct.scratch_blob);
|
||||
solverCtx.set_stdout_logging(false);
|
||||
solver::PointSolver solver(construct.engine);
|
||||
auto end_setup_time = std::chrono::high_resolution_clock::now();
|
||||
std::chrono::duration<double> setup_elapsed = end_setup_time - start_setup_time;
|
||||
setup_times[i] = setup_elapsed;
|
||||
const auto now = std::chrono::system_clock::now();
|
||||
std::string now_str = std::format("{:%Y-%m-%d %H:%M:%S}", now);
|
||||
|
||||
auto start_eval_time = std::chrono::high_resolution_clock::now();
|
||||
const NetOut netOut = solver.evaluate(solverCtx, netIn);
|
||||
auto end_eval_time = std::chrono::high_resolution_clock::now();
|
||||
serial_results[i] = netOut;
|
||||
std::chrono::duration<double> eval_elapsed = end_eval_time - start_eval_time;
|
||||
eval_times[i] = eval_elapsed;
|
||||
}
|
||||
auto endTime = std::chrono::high_resolution_clock::now();
|
||||
std::chrono::duration<double> elapsed = endTime - startTime;
|
||||
std::println("");
|
||||
metadata["Datetime"] = now_str;
|
||||
metadata["GF_Version"] = version::toString();
|
||||
|
||||
// Summarize serial timings
|
||||
double total_setup_time = 0.0;
|
||||
double total_eval_time = 0.0;
|
||||
for (size_t i = 0; i < runs; ++i) {
|
||||
total_setup_time += setup_times[i].count();
|
||||
total_eval_time += eval_times[i].count();
|
||||
}
|
||||
std::println("Average Setup Time over {} runs: {:.6f} seconds", runs, total_setup_time / runs);
|
||||
std::println("Average Evaluation Time over {} runs: {:.6f} seconds", runs, total_eval_time / runs);
|
||||
std::println("Total Time for {} runs: {:.6f} seconds", runs, elapsed.count());
|
||||
|
||||
|
||||
std::array<NetOut, runs> parallelResults;
|
||||
std::array<std::chrono::duration<double>, runs> setupTimes;
|
||||
std::array<std::chrono::duration<double>, runs> evalTimes;
|
||||
std::array<std::unique_ptr<gridfire::engine::scratch::StateBlob>, runs> workspaces;
|
||||
for (size_t i = 0; i < runs; ++i) {
|
||||
workspaces[i] = construct.scratch_blob->clone_structure();
|
||||
utsname buffer{};
|
||||
if (uname(&buffer) == 0) {
|
||||
std::string osName = buffer.sysname;
|
||||
#ifdef __APPLE__
|
||||
if (osName == "Darwin") osName = "macOS";
|
||||
#endif
|
||||
metadata["OS"] = osName;
|
||||
metadata["OS Version"] = buffer.release;
|
||||
metadata["Architecture"] = buffer.machine;
|
||||
} else {
|
||||
metadata["OS"] = "Unknown";
|
||||
}
|
||||
|
||||
#if defined(__clang__)
|
||||
metadata["Compiler"] = "Clang " __clang_version__;
|
||||
#elif defined(__GNUC__)
|
||||
metadata["Compiler"] = "GCC " __VERSION__;
|
||||
#else
|
||||
metadata["Compiler"] = "Unknown";
|
||||
#endif
|
||||
|
||||
// Parallel runs
|
||||
startTime = std::chrono::high_resolution_clock::now();
|
||||
metadata["Threads"] = omp_get_max_threads();
|
||||
metadata["Runs"] = runs;
|
||||
metadata["Temperature"] = temp;
|
||||
metadata["Density"] = rho;
|
||||
metadata["tMax_per_run_s"] = tMax;
|
||||
|
||||
GF_OMP(parallel for, for (size_t i = 0; i < runs; ++i)) {
|
||||
auto start_setup_time = std::chrono::high_resolution_clock::now();
|
||||
solver::PointSolverContext solverCtx(*construct.scratch_blob);
|
||||
solverCtx.set_stdout_logging(false);
|
||||
solver::PointSolver solver(construct.engine);
|
||||
auto end_setup_time = std::chrono::high_resolution_clock::now();
|
||||
std::chrono::duration<double> setup_elapsed = end_setup_time - start_setup_time;
|
||||
setupTimes[i] = setup_elapsed;
|
||||
auto start_eval_time = std::chrono::high_resolution_clock::now();
|
||||
parallelResults[i] = solver.evaluate(solverCtx, netIn);
|
||||
auto end_eval_time = std::chrono::high_resolution_clock::now();
|
||||
std::chrono::duration<double> eval_elapsed = end_eval_time - start_eval_time;
|
||||
evalTimes[i] = eval_elapsed;
|
||||
}
|
||||
endTime = std::chrono::high_resolution_clock::now();
|
||||
elapsed = endTime - startTime;
|
||||
std::println("");
|
||||
results["Metadata"] = metadata;
|
||||
|
||||
// Summarize parallel timings
|
||||
total_setup_time = 0.0;
|
||||
total_eval_time = 0.0;
|
||||
for (size_t i = 0; i < runs; ++i) {
|
||||
total_setup_time += setupTimes[i].count();
|
||||
total_eval_time += evalTimes[i].count();
|
||||
for (size_t rID = 0; rID < runs; rID++) {
|
||||
nlohmann::json run_result;
|
||||
nlohmann::json run_metadata;
|
||||
run_metadata["num_zones"] = rID;
|
||||
run_result["metadata"] = run_metadata;
|
||||
|
||||
|
||||
auto startTime = std::chrono::high_resolution_clock::now();
|
||||
|
||||
// arrays to store timings
|
||||
std::array<std::chrono::duration<double>, runs> setup_times{};
|
||||
std::array<std::chrono::duration<double>, runs> eval_times{};
|
||||
std::array<NetOut, runs> serial_results;
|
||||
for (size_t i = 0; i < rID; ++i) {
|
||||
auto start_setup_time = std::chrono::high_resolution_clock::now();
|
||||
solver::PointSolverContext solverCtx(*construct.scratch_blob);
|
||||
solverCtx.set_stdout_logging(false);
|
||||
solver::PointSolver solver(construct.engine);
|
||||
auto end_setup_time = std::chrono::high_resolution_clock::now();
|
||||
std::chrono::duration<double> setup_elapsed = end_setup_time - start_setup_time;
|
||||
setup_times[i] = setup_elapsed;
|
||||
|
||||
auto start_eval_time = std::chrono::high_resolution_clock::now();
|
||||
const NetOut netOut = solver.evaluate(solverCtx, netIn);
|
||||
auto end_eval_time = std::chrono::high_resolution_clock::now();
|
||||
serial_results[i] = netOut;
|
||||
std::chrono::duration<double> eval_elapsed = end_eval_time - start_eval_time;
|
||||
eval_times[i] = eval_elapsed;
|
||||
}
|
||||
auto endTime = std::chrono::high_resolution_clock::now();
|
||||
std::chrono::duration<double> elapsed = endTime - startTime;
|
||||
std::println("");
|
||||
|
||||
nlohmann::json point_solver_time_results;
|
||||
point_solver_time_results["total_time_s"] = elapsed.count();
|
||||
run_result["Serial"] = point_solver_time_results;
|
||||
|
||||
// Summarize serial timings
|
||||
double total_setup_time = 0.0;
|
||||
double total_eval_time = 0.0;
|
||||
for (size_t i = 0; i < rID; ++i) {
|
||||
total_setup_time += setup_times[i].count();
|
||||
total_eval_time += eval_times[i].count();
|
||||
}
|
||||
std::println("Average Setup Time over {} runs: {:.6f} seconds", runs, total_setup_time / runs);
|
||||
std::println("Average Evaluation Time over {} runs: {:.6f} seconds", runs, total_eval_time / runs);
|
||||
std::println("Total Time for {} runs: {:.6f} seconds", runs, elapsed.count());
|
||||
|
||||
|
||||
std::array<NetOut, runs> parallelResults;
|
||||
std::array<std::chrono::duration<double>, runs> setupTimes;
|
||||
std::array<std::chrono::duration<double>, runs> evalTimes;
|
||||
std::array<std::unique_ptr<gridfire::engine::scratch::StateBlob>, runs> workspaces;
|
||||
for (size_t i = 0; i < rID; ++i) {
|
||||
workspaces[i] = construct.scratch_blob->clone_structure();
|
||||
}
|
||||
|
||||
|
||||
// Parallel runs
|
||||
startTime = std::chrono::high_resolution_clock::now();
|
||||
|
||||
GF_OMP(parallel for, for (size_t i = 0; i < rID; ++i)) {
|
||||
auto start_setup_time = std::chrono::high_resolution_clock::now();
|
||||
solver::PointSolverContext solverCtx(*construct.scratch_blob);
|
||||
solverCtx.set_stdout_logging(false);
|
||||
solver::PointSolver solver(construct.engine);
|
||||
auto end_setup_time = std::chrono::high_resolution_clock::now();
|
||||
std::chrono::duration<double> setup_elapsed = end_setup_time - start_setup_time;
|
||||
setupTimes[i] = setup_elapsed;
|
||||
auto start_eval_time = std::chrono::high_resolution_clock::now();
|
||||
parallelResults[i] = solver.evaluate(solverCtx, netIn);
|
||||
auto end_eval_time = std::chrono::high_resolution_clock::now();
|
||||
std::chrono::duration<double> eval_elapsed = end_eval_time - start_eval_time;
|
||||
evalTimes[i] = eval_elapsed;
|
||||
}
|
||||
endTime = std::chrono::high_resolution_clock::now();
|
||||
elapsed = endTime - startTime;
|
||||
std::println("");
|
||||
|
||||
nlohmann::json grid_solver_results;
|
||||
grid_solver_results["total_time_s"] = elapsed.count();
|
||||
run_result["Parallel"] = grid_solver_results;
|
||||
|
||||
// Summarize parallel timings
|
||||
total_setup_time = 0.0;
|
||||
total_eval_time = 0.0;
|
||||
for (size_t i = 0; i < runs; ++i) {
|
||||
total_setup_time += setupTimes[i].count();
|
||||
total_eval_time += evalTimes[i].count();
|
||||
}
|
||||
|
||||
std::println("Average Parallel Setup Time over {} runs: {:.6f} seconds", runs, total_setup_time / runs);
|
||||
std::println("Average Parallel Evaluation Time over {} runs: {:.6f} seconds", runs, total_eval_time / runs);
|
||||
std::println("Total Parallel Time for {} runs: {:.6f} seconds", runs, elapsed.count());
|
||||
|
||||
std::println("========== Summary ==========");
|
||||
std::println("Serial Runs:");
|
||||
std::println(" Average Setup Time: {:.6f} seconds", total_setup_time / runs);
|
||||
std::println(" Average Evaluation Time: {:.6f} seconds", total_eval_time / runs);
|
||||
std::println("Parallel Runs:");
|
||||
std::println(" Average Setup Time: {:.6f} seconds", total_setup_time / runs);
|
||||
std::println(" Average Evaluation Time: {:.6f} seconds", total_eval_time / runs);
|
||||
std::println("Difference:");
|
||||
std::println(" Setup Time Difference: {:.6f} seconds", (total_setup_time / runs) - (total_setup_time / runs));
|
||||
std::println(" Evaluation Time Difference: {:.6f} seconds", (total_eval_time / runs) - (total_eval_time / runs));
|
||||
std::println(" Setup Time Fractional Difference: {:.2f}%", ((total_setup_time / runs) - (total_setup_time / runs)) / (total_setup_time / runs) * 100.0);
|
||||
std::println(" Evaluation Time Fractional Difference: {:.2f}%", ((total_eval_time / runs) - (total_eval_time / runs)) / (total_eval_time / runs) * 100.0);
|
||||
|
||||
results[std::format("Run_{}", rID)] = run_result;
|
||||
}
|
||||
|
||||
std::println("Average Parallel Setup Time over {} runs: {:.6f} seconds", runs, total_setup_time / runs);
|
||||
std::println("Average Parallel Evaluation Time over {} runs: {:.6f} seconds", runs, total_eval_time / runs);
|
||||
std::println("Total Parallel Time for {} runs: {:.6f} seconds", runs, elapsed.count());
|
||||
|
||||
std::println("========== Summary ==========");
|
||||
std::println("Serial Runs:");
|
||||
std::println(" Average Setup Time: {:.6f} seconds", total_setup_time / runs);
|
||||
std::println(" Average Evaluation Time: {:.6f} seconds", total_eval_time / runs);
|
||||
std::println("Parallel Runs:");
|
||||
std::println(" Average Setup Time: {:.6f} seconds", total_setup_time / runs);
|
||||
std::println(" Average Evaluation Time: {:.6f} seconds", total_eval_time / runs);
|
||||
std::println("Difference:");
|
||||
std::println(" Setup Time Difference: {:.6f} seconds", (total_setup_time / runs) - (total_setup_time / runs));
|
||||
std::println(" Evaluation Time Difference: {:.6f} seconds", (total_eval_time / runs) - (total_eval_time / runs));
|
||||
std::println(" Setup Time Fractional Difference: {:.2f}%", ((total_setup_time / runs) - (total_setup_time / runs)) / (total_setup_time / runs) * 100.0);
|
||||
std::println(" Evaluation Time Fractional Difference: {:.2f}%", ((total_eval_time / runs) - (total_eval_time / runs)) / (total_eval_time / runs) * 100.0);
|
||||
}
|
||||
std::ofstream o("gf_single_zone_solver_benchmark_results.json");
|
||||
o << std::setw(4) << results << std::endl;
|
||||
o.close();
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user