1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129
|
/* ************************************************************************
* Copyright (C) 2018-2020 Advanced Micro Devices, Inc. All rights Reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to deal
* in the Software without restriction, including without limitation the rights
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
* THE SOFTWARE.
*
* ************************************************************************ */
#include "common.hpp"
#include <iostream>
#include <mpi.h>
#include <rocalution/rocalution.hpp>
#define ValueType double
using namespace rocalution;
int main(int argc, char* argv[])
{
// Initialize MPI
MPI_Init(&argc, &argv);
MPI_Comm comm = MPI_COMM_WORLD;
int rank;
int num_procs;
MPI_Comm_rank(comm, &rank);
MPI_Comm_size(comm, &num_procs);
if(argc < 2)
{
std::cerr << argv[0] << " <global_matrix>" << std::endl;
return -1;
}
// Disable OpenMP thread affinity
set_omp_affinity_rocalution(false);
// Initialize platform with rank and # of accelerator devices in the node
init_rocalution(rank, 2);
// Disable OpenMP
set_omp_threads_rocalution(1);
// Print platform
info_rocalution();
// Load undistributed matrix
LocalMatrix<ValueType> lmat;
lmat.ReadFileMTX(argv[1]);
// Global structures
ParallelManager manager;
GlobalMatrix<ValueType> mat;
// Distribute matrix - lmat will be destroyed
distribute_matrix(&comm, &lmat, &mat, &manager);
// rocALUTION vectors
GlobalVector<ValueType> rhs(manager);
GlobalVector<ValueType> x(manager);
GlobalVector<ValueType> e(manager);
// Move structures to accelerator, if available
mat.MoveToAccelerator();
rhs.MoveToAccelerator();
x.MoveToAccelerator();
e.MoveToAccelerator();
// Allocate memory
rhs.Allocate("rhs", mat.GetM());
x.Allocate("x", mat.GetN());
e.Allocate("sol", mat.GetN());
e.Ones();
mat.Apply(e, &rhs);
x.Zeros();
CG<GlobalMatrix<double>, GlobalVector<double>, double> ls;
Jacobi<GlobalMatrix<double>, GlobalVector<double>, double> p;
ls.SetPreconditioner(p);
ls.SetOperator(mat);
ls.Build();
ls.Verbose(1);
mat.Info();
double time = rocalution_time();
ls.Solve(rhs, &x);
time = rocalution_time() - time;
if(rank == 0)
{
std::cout << "Solving: " << time / 1e6 << " sec" << std::endl;
}
e.ScaleAdd(-1.0, x);
double nrm2 = e.Norm();
if(rank == 0)
{
std::cout << "||e - x||_2 = " << nrm2 << std::endl;
}
ls.Clear();
stop_rocalution();
MPI_Finalize();
return 0;
}
|