Fix number of tuples group-and-sort
This commit is contained in:
parent
78580c5edb
commit
5aa10f31ad
71
atrip.org
71
atrip.org
@ -1503,6 +1503,7 @@ using PartialTuple = std::array<size_t, 2>;
|
|||||||
using ABCTuples = std::vector<ABCTuple>;
|
using ABCTuples = std::vector<ABCTuple>;
|
||||||
|
|
||||||
constexpr ABCTuple FAKE_TUPLE = {0, 0, 0};
|
constexpr ABCTuple FAKE_TUPLE = {0, 0, 0};
|
||||||
|
constexpr ABCTuple INVALID_TUPLE = {1, 1, 1};
|
||||||
#+end_src
|
#+end_src
|
||||||
|
|
||||||
*** Distributing the tuples
|
*** Distributing the tuples
|
||||||
@ -1733,22 +1734,17 @@ namespace group_and_sort {
|
|||||||
**** Utils
|
**** Utils
|
||||||
|
|
||||||
#+begin_src c++ :tangle (atrip-tuples-h)
|
#+begin_src c++ :tangle (atrip-tuples-h)
|
||||||
|
|
||||||
// Provides the node on which the slice-element is found
|
// Provides the node on which the slice-element is found
|
||||||
// Right now we distribute the slices in a round robin fashion
|
// Right now we distribute the slices in a round robin fashion
|
||||||
// over the different nodes (NOTE: not mpi ranks but nodes)
|
// over the different nodes (NOTE: not mpi ranks but nodes)
|
||||||
inline
|
inline
|
||||||
size_t isOnNode(size_t tuple, size_t nodes) { return tuple % nodes; }
|
size_t isOnNode(size_t tuple, size_t nNodes) { return tuple % nNodes; }
|
||||||
|
|
||||||
|
|
||||||
struct Info {
|
|
||||||
size_t nNodes;
|
|
||||||
size_t nodeId;
|
|
||||||
};
|
|
||||||
|
|
||||||
|
|
||||||
// return the node (or all nodes) where the elements of this
|
// return the node (or all nodes) where the elements of this
|
||||||
// tuple are located
|
// tuple are located
|
||||||
std::vector<size_t> getTupleNodes(ABCTuple t, size_t nNodes) {
|
std::vector<size_t> getTupleNodes(ABCTuple const& t, size_t nNodes) {
|
||||||
std::vector<size_t>
|
std::vector<size_t>
|
||||||
nTuple = { isOnNode(t[0], nNodes)
|
nTuple = { isOnNode(t[0], nNodes)
|
||||||
, isOnNode(t[1], nNodes)
|
, isOnNode(t[1], nNodes)
|
||||||
@ -1756,6 +1752,12 @@ std::vector<size_t> getTupleNodes(ABCTuple t, size_t nNodes) {
|
|||||||
};
|
};
|
||||||
return unique(nTuple);
|
return unique(nTuple);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
struct Info {
|
||||||
|
size_t nNodes;
|
||||||
|
size_t nodeId;
|
||||||
|
};
|
||||||
|
|
||||||
#+end_src
|
#+end_src
|
||||||
|
|
||||||
**** Distribution
|
**** Distribution
|
||||||
@ -1781,27 +1783,33 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
if (info.nodeId == 0)
|
if (info.nodeId == 0)
|
||||||
std::cout << "\tGoing through all "
|
std::cout << "\tGoing through all "
|
||||||
<< allTuples.size()
|
<< allTuples.size()
|
||||||
<< " tuples\n";
|
<< " tuples in "
|
||||||
|
<< nNodes
|
||||||
|
<< " nodes\n";
|
||||||
|
|
||||||
// build container-n-d's
|
// build container-n-d's
|
||||||
for (auto const& t: allTuples) {
|
for (auto const& t: allTuples) {
|
||||||
// on which node(s) are the tuple elements located...
|
// on which node(s) are the tuple elements located...
|
||||||
// put them into the right container
|
// put them into the right container
|
||||||
auto const _nodes = getTupleNodes(t, nNodes);
|
auto const _nodes = getTupleNodes(t, nNodes);
|
||||||
|
|
||||||
switch (_nodes.size()) {
|
switch (_nodes.size()) {
|
||||||
case 1:
|
case 1:
|
||||||
container1d[_nodes[0]].push_back(t);
|
container1d[_nodes[0]].push_back(t);
|
||||||
|
break;
|
||||||
case 2:
|
case 2:
|
||||||
container2d[ _nodes[0]
|
container2d[ _nodes[0]
|
||||||
+ _nodes[1] * nNodes
|
+ _nodes[1] * nNodes
|
||||||
].push_back(t);
|
].push_back(t);
|
||||||
|
break;
|
||||||
case 3:
|
case 3:
|
||||||
container3d[ _nodes[0]
|
container3d[ _nodes[0]
|
||||||
+ _nodes[1] * nNodes
|
+ _nodes[1] * nNodes
|
||||||
+ _nodes[2] * nNodes * nNodes
|
+ _nodes[2] * nNodes * nNodes
|
||||||
].push_back(t);
|
].push_back(t);
|
||||||
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (info.nodeId == 0)
|
if (info.nodeId == 0)
|
||||||
@ -1809,9 +1817,9 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
// DISTRIBUTE 1-d containers
|
// DISTRIBUTE 1-d containers
|
||||||
// every tuple which is only located at one node belongs to this node
|
// every tuple which is only located at one node belongs to this node
|
||||||
{
|
{
|
||||||
auto const& _tuplesVec = container1d[info.nodeId];
|
auto const& _tuples = container1d[info.nodeId];
|
||||||
nodeTuples.resize(_tuplesVec.size());
|
nodeTuples.resize(_tuples.size(), INVALID_TUPLE);
|
||||||
std::copy(_tuplesVec.begin(), _tuplesVec.end(), nodeTuples.begin());
|
std::copy(_tuples.begin(), _tuples.end(), nodeTuples.begin());
|
||||||
}
|
}
|
||||||
|
|
||||||
if (info.nodeId == 0)
|
if (info.nodeId == 0)
|
||||||
@ -1820,12 +1828,12 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
//the tuples which are located at two nodes are half/half given to these nodes
|
//the tuples which are located at two nodes are half/half given to these nodes
|
||||||
for (size_t yx = 0; yx < container2d.size(); yx++) {
|
for (size_t yx = 0; yx < container2d.size(); yx++) {
|
||||||
|
|
||||||
auto const& _tuplesVec = container2d[yx];
|
auto const& _tuples = container2d[yx];
|
||||||
const
|
const
|
||||||
size_t idx = yx % nNodes
|
size_t idx = yx % nNodes
|
||||||
// remember: yx = idy * nNodes + idx
|
// remember: yx = idy * nNodes + idx
|
||||||
, idy = yx / nNodes
|
, idy = yx / nNodes
|
||||||
, n_half = _tuplesVec.size() / 2
|
, n_half = _tuples.size() / 2
|
||||||
, size = nodeTuples.size()
|
, size = nodeTuples.size()
|
||||||
;
|
;
|
||||||
|
|
||||||
@ -1835,16 +1843,16 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
nend = n_half;
|
nend = n_half;
|
||||||
} else if (info.nodeId == idy) {
|
} else if (info.nodeId == idy) {
|
||||||
nbeg = 1 * n_half;
|
nbeg = 1 * n_half;
|
||||||
nend = _tuplesVec.size();
|
nend = _tuples.size();
|
||||||
} else {
|
} else {
|
||||||
// either idx or idy is my node
|
// either idx or idy is my node
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
|
|
||||||
size_t const nextra = nend - nbeg;
|
size_t const nextra = nend - nbeg;
|
||||||
nodeTuples.resize(size + nextra);
|
nodeTuples.resize(size + nextra, INVALID_TUPLE);
|
||||||
std::copy(_tuplesVec.begin() + nbeg,
|
std::copy(_tuples.begin() + nbeg,
|
||||||
_tuplesVec.begin() + nend,
|
_tuples.begin() + nend,
|
||||||
nodeTuples.begin() + size);
|
nodeTuples.begin() + size);
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -1853,14 +1861,14 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
std::cout << "\tBuilding 3-d containers\n";
|
std::cout << "\tBuilding 3-d containers\n";
|
||||||
// DISTRIBUTE 3-d containers
|
// DISTRIBUTE 3-d containers
|
||||||
for (size_t zyx = 0; zyx < container3d.size(); zyx++) {
|
for (size_t zyx = 0; zyx < container3d.size(); zyx++) {
|
||||||
auto const& _tuplesVec = container3d[zyx];
|
auto const& _tuples = container3d[zyx];
|
||||||
|
|
||||||
const
|
const
|
||||||
size_t idx = zyx % nNodes
|
size_t idx = zyx % nNodes
|
||||||
, idy = (zyx / nNodes) % nNodes
|
, idy = (zyx / nNodes) % nNodes
|
||||||
// remember: zyx = idx + idy * nNodes + idz * nNodes^2
|
// remember: zyx = idx + idy * nNodes + idz * nNodes^2
|
||||||
, idz = zyx / nNodes / nNodes
|
, idz = zyx / nNodes / nNodes
|
||||||
, n_third = _tuplesVec.size() / 3
|
, n_third = _tuples.size() / 3
|
||||||
, size = nodeTuples.size()
|
, size = nodeTuples.size()
|
||||||
;
|
;
|
||||||
|
|
||||||
@ -1870,19 +1878,19 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
nend = 1 * n_third;
|
nend = 1 * n_third;
|
||||||
} else if (info.nodeId == idy) {
|
} else if (info.nodeId == idy) {
|
||||||
nbeg = 1 * n_third;
|
nbeg = 1 * n_third;
|
||||||
nend = 2 * nextra;
|
nend = 2 * n_third;
|
||||||
} else if (info.nodeId == idz) {
|
} else if (info.nodeId == idz) {
|
||||||
nbeg = 2 * n_third;
|
nbeg = 2 * n_third;
|
||||||
nend = _tuplesVec.size();
|
nend = _tuples.size();
|
||||||
} else {
|
} else {
|
||||||
// either idx or idy or idz is my node
|
// either idx or idy or idz is my node
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
|
|
||||||
size_t const nextra = nend - nbeg;
|
size_t const nextra = nend - nbeg;
|
||||||
nodeTuples.resize(size + nextra);
|
nodeTuples.resize(size + nextra, INVALID_TUPLE);
|
||||||
std::copy(_tuplesVec.begin() + nbeg,
|
std::copy(_tuples.begin() + nbeg,
|
||||||
_tuplesVec.begin() + nend,
|
_tuples.begin() + nend,
|
||||||
nodeTuples.begin() + size);
|
nodeTuples.begin() + size);
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -1926,6 +1934,16 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
// we bring the tuples abc back in the order a<b<c
|
// we bring the tuples abc back in the order a<b<c
|
||||||
for (auto &t: nodeTuples) std::sort(t.begin(), t.end());
|
for (auto &t: nodeTuples) std::sort(t.begin(), t.end());
|
||||||
|
|
||||||
|
#if ATRIP_DEBUG > 1
|
||||||
|
if (info.nodeId == 0)
|
||||||
|
std::cout << "checking for validity of " << nodeTuples.size() << std::endl;
|
||||||
|
const bool anyInvalid
|
||||||
|
= std::any_of(nodeTuples.begin(),
|
||||||
|
nodeTuples.end(),
|
||||||
|
[](ABCTuple const& t) { return t == INVALID_TUPLE; });
|
||||||
|
if (anyInvalid) throw "Some tuple is invalid in group-and-sort algorithm";
|
||||||
|
#endif
|
||||||
|
|
||||||
return nodeTuples;
|
return nodeTuples;
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -2850,6 +2868,7 @@ Atrip::Output Atrip::run(Atrip::Input const& in) {
|
|||||||
const size_t Nv = in.ea->lens[0];
|
const size_t Nv = in.ea->lens[0];
|
||||||
LOG(0,"Atrip") << "No: " << No << "\n";
|
LOG(0,"Atrip") << "No: " << No << "\n";
|
||||||
LOG(0,"Atrip") << "Nv: " << Nv << "\n";
|
LOG(0,"Atrip") << "Nv: " << Nv << "\n";
|
||||||
|
LOG(0,"Atrip") << "np: " << np << "\n";
|
||||||
|
|
||||||
// allocate the three scratches, see piecuch
|
// allocate the three scratches, see piecuch
|
||||||
std::vector<double> Tijk(No*No*No) // doubles only (see piecuch)
|
std::vector<double> Tijk(No*No*No) // doubles only (see piecuch)
|
||||||
|
|||||||
@ -27,6 +27,7 @@ using PartialTuple = std::array<size_t, 2>;
|
|||||||
using ABCTuples = std::vector<ABCTuple>;
|
using ABCTuples = std::vector<ABCTuple>;
|
||||||
|
|
||||||
constexpr ABCTuple FAKE_TUPLE = {0, 0, 0};
|
constexpr ABCTuple FAKE_TUPLE = {0, 0, 0};
|
||||||
|
constexpr ABCTuple INVALID_TUPLE = {1, 1, 1};
|
||||||
// Tuples types:1 ends here
|
// Tuples types:1 ends here
|
||||||
|
|
||||||
// [[file:~/atrip/atrip.org::*Distributing%20the%20tuples][Distributing the tuples:1]]
|
// [[file:~/atrip/atrip.org::*Distributing%20the%20tuples][Distributing the tuples:1]]
|
||||||
@ -86,11 +87,11 @@ struct RankInfo {
|
|||||||
};
|
};
|
||||||
|
|
||||||
template <typename A>
|
template <typename A>
|
||||||
std::vector<A> unique(std::vector<A> const &xs) {
|
A unique(A const &xs) {
|
||||||
auto result = xs;
|
auto result = xs;
|
||||||
std::sort(result.begin(), result.end());
|
std::sort(std::begin(result), std::end(result));
|
||||||
auto const& last = std::unique(result.begin(), result.end());
|
auto const& last = std::unique(std::begin(result), std::end(result));
|
||||||
result.erase(last, result.end());
|
result.erase(last, std::end(result));
|
||||||
return result;
|
return result;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -207,29 +208,25 @@ namespace group_and_sort {
|
|||||||
// Provides the node on which the slice-element is found
|
// Provides the node on which the slice-element is found
|
||||||
// Right now we distribute the slices in a round robin fashion
|
// Right now we distribute the slices in a round robin fashion
|
||||||
// over the different nodes (NOTE: not mpi ranks but nodes)
|
// over the different nodes (NOTE: not mpi ranks but nodes)
|
||||||
size_t isOnNode(size_t tuple, size_t nodes) { return tuple % nodes; }
|
inline
|
||||||
|
size_t isOnNode(size_t tuple, size_t nNodes) { return tuple % nNodes; }
|
||||||
|
|
||||||
|
|
||||||
|
// return the node (or all nodes) where the elements of this
|
||||||
|
// tuple are located
|
||||||
|
std::vector<size_t> getTupleNodes(ABCTuple const& t, size_t nNodes) {
|
||||||
|
std::vector<size_t>
|
||||||
|
nTuple = { isOnNode(t[0], nNodes)
|
||||||
|
, isOnNode(t[1], nNodes)
|
||||||
|
, isOnNode(t[2], nNodes)
|
||||||
|
};
|
||||||
|
return unique(nTuple);
|
||||||
|
}
|
||||||
|
|
||||||
struct Info {
|
struct Info {
|
||||||
size_t nNodes;
|
size_t nNodes;
|
||||||
size_t nodeId;
|
size_t nodeId;
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
||||||
// return the node (or all nodes) where the elements of this
|
|
||||||
// tuple are located
|
|
||||||
std::vector<size_t> getTupleNodes(ABCTuple t, size_t nNodes) {
|
|
||||||
std::vector<size_t> result;
|
|
||||||
ABCTuple nTuple = { isOnNode(t[0], nNodes)
|
|
||||||
, isOnNode(t[1], nNodes)
|
|
||||||
, isOnNode(t[2], nNodes)
|
|
||||||
};
|
|
||||||
std::sort(nTuple.begin(), nTuple.end());
|
|
||||||
ABCTuple::iterator it = std::unique(nTuple.begin(), nTuple.end());
|
|
||||||
result.resize(it - nTuple.begin());
|
|
||||||
std::copy(nTuple.begin(), it, result.begin());
|
|
||||||
return result;
|
|
||||||
}
|
|
||||||
// Utils:1 ends here
|
// Utils:1 ends here
|
||||||
|
|
||||||
// [[file:~/atrip/atrip.org::*Distribution][Distribution:1]]
|
// [[file:~/atrip/atrip.org::*Distribution][Distribution:1]]
|
||||||
@ -238,28 +235,42 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
ABCTuples nodeTuples;
|
ABCTuples nodeTuples;
|
||||||
size_t const nNodes(info.nNodes);
|
size_t const nNodes(info.nNodes);
|
||||||
|
|
||||||
std::map< size_t /* nodeId */, ABCTuples >
|
std::vector<ABCTuples>
|
||||||
container1d, container2d, container3d;
|
container1d(nNodes)
|
||||||
|
, container2d(nNodes * nNodes)
|
||||||
|
, container3d(nNodes * nNodes * nNodes)
|
||||||
|
;
|
||||||
|
|
||||||
|
if (info.nodeId == 0)
|
||||||
|
std::cout << "\tGoing through all "
|
||||||
|
<< allTuples.size()
|
||||||
|
<< " tuples in "
|
||||||
|
<< nNodes
|
||||||
|
<< " nodes\n";
|
||||||
|
|
||||||
// build container-n-d's
|
// build container-n-d's
|
||||||
for (auto const& t: allTuples) {
|
for (auto const& t: allTuples) {
|
||||||
// on which node(s) are the tuple elements located...
|
// on which node(s) are the tuple elements located...
|
||||||
// put them into the right container
|
// put them into the right container
|
||||||
auto const _nodes = getTupleNodes(t, nNodes);
|
auto const _nodes = getTupleNodes(t, nNodes);
|
||||||
|
|
||||||
switch (_nodes.size()) {
|
switch (_nodes.size()) {
|
||||||
case 1:
|
case 1:
|
||||||
container1d[_nodes[0]].push_back(t);
|
container1d[_nodes[0]].push_back(t);
|
||||||
|
break;
|
||||||
case 2:
|
case 2:
|
||||||
container2d[ _nodes[0]
|
container2d[ _nodes[0]
|
||||||
+ nNodes * _nodes[1]
|
+ _nodes[1] * nNodes
|
||||||
].push_back(t);
|
].push_back(t);
|
||||||
|
break;
|
||||||
case 3:
|
case 3:
|
||||||
container3d[ _nodes[0]
|
container3d[ _nodes[0]
|
||||||
+ nNodes * _nodes[1]
|
+ _nodes[1] * nNodes
|
||||||
+ nNodes * nNodes * _nodes[2]
|
+ _nodes[2] * nNodes * nNodes
|
||||||
].push_back(t);
|
].push_back(t);
|
||||||
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (info.nodeId == 0)
|
if (info.nodeId == 0)
|
||||||
@ -267,43 +278,42 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
// DISTRIBUTE 1-d containers
|
// DISTRIBUTE 1-d containers
|
||||||
// every tuple which is only located at one node belongs to this node
|
// every tuple which is only located at one node belongs to this node
|
||||||
{
|
{
|
||||||
auto const& _tuplesVec = container1d[info.nodeId];
|
auto const& _tuples = container1d[info.nodeId];
|
||||||
nodeTuples.resize(_tuplesVec.size());
|
nodeTuples.resize(_tuples.size(), INVALID_TUPLE);
|
||||||
std::copy(_tuplesVec.begin(), _tuplesVec.end(), nodeTuples.begin());
|
std::copy(_tuples.begin(), _tuples.end(), nodeTuples.begin());
|
||||||
}
|
}
|
||||||
|
|
||||||
if (info.nodeId == 0)
|
if (info.nodeId == 0)
|
||||||
std::cout << "\tBuilding 2-d containers\n";
|
std::cout << "\tBuilding 2-d containers\n";
|
||||||
// DISTRIBUTE 2-d containers
|
// DISTRIBUTE 2-d containers
|
||||||
//the tuples which are located at two nodes are half/half given to these nodes
|
//the tuples which are located at two nodes are half/half given to these nodes
|
||||||
for (auto const& m: container2d) {
|
for (size_t yx = 0; yx < container2d.size(); yx++) {
|
||||||
|
|
||||||
auto const& _tuplesVec = m.second;
|
auto const& _tuples = container2d[yx];
|
||||||
const
|
const
|
||||||
size_t idx = m.first % nNodes
|
size_t idx = yx % nNodes
|
||||||
// remember: m.first = idy * nNodes + idx
|
// remember: yx = idy * nNodes + idx
|
||||||
, idy = m.first / nNodes
|
, idy = yx / nNodes
|
||||||
, n_half = _tuplesVec.size() / 2
|
, n_half = _tuples.size() / 2
|
||||||
, size = nodeTuples.size()
|
, size = nodeTuples.size()
|
||||||
;
|
;
|
||||||
|
|
||||||
size_t nextra, nbegin, nend;
|
size_t nbeg, nend;
|
||||||
if (info.nodeId == idx) {
|
if (info.nodeId == idx) {
|
||||||
nextra = n_half;
|
nbeg = 0 * n_half;
|
||||||
nbegin = 0 * n_half;
|
|
||||||
nend = n_half;
|
nend = n_half;
|
||||||
} else if (info.nodeId == idy) {
|
} else if (info.nodeId == idy) {
|
||||||
nextra = _tuplesVec.size() - n_half;
|
nbeg = 1 * n_half;
|
||||||
nbegin = 1 * n_half;
|
nend = _tuples.size();
|
||||||
nend = _tuplesVec.size();
|
|
||||||
} else {
|
} else {
|
||||||
// either idx or idy is my node
|
// either idx or idy is my node
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
|
|
||||||
nodeTuples.resize(size + nextra);
|
size_t const nextra = nend - nbeg;
|
||||||
std::copy(_tuplesVec.begin() + nbegin,
|
nodeTuples.resize(size + nextra, INVALID_TUPLE);
|
||||||
_tuplesVec.begin() + nend,
|
std::copy(_tuples.begin() + nbeg,
|
||||||
|
_tuples.begin() + nend,
|
||||||
nodeTuples.begin() + size);
|
nodeTuples.begin() + size);
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -311,39 +321,37 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
if (info.nodeId == 0)
|
if (info.nodeId == 0)
|
||||||
std::cout << "\tBuilding 3-d containers\n";
|
std::cout << "\tBuilding 3-d containers\n";
|
||||||
// DISTRIBUTE 3-d containers
|
// DISTRIBUTE 3-d containers
|
||||||
for (auto const& m: container3d){
|
for (size_t zyx = 0; zyx < container3d.size(); zyx++) {
|
||||||
auto const& _tuplesVec = m.second;
|
auto const& _tuples = container3d[zyx];
|
||||||
|
|
||||||
const
|
const
|
||||||
size_t idx = m.first % nNodes
|
size_t idx = zyx % nNodes
|
||||||
, idy = (m.first / nNodes) % nNodes
|
, idy = (zyx / nNodes) % nNodes
|
||||||
// remember: m.first = idx + idy * nNodes + idz * nNodes^2
|
// remember: zyx = idx + idy * nNodes + idz * nNodes^2
|
||||||
, idz = m.first / nNodes / nNodes
|
, idz = zyx / nNodes / nNodes
|
||||||
, n_third = _tuplesVec.size() / 3
|
, n_third = _tuples.size() / 3
|
||||||
, size = nodeTuples.size()
|
, size = nodeTuples.size()
|
||||||
;
|
;
|
||||||
|
|
||||||
size_t nextra, nbegin, nend;
|
size_t nbeg, nend;
|
||||||
if (info.nodeId == idx) {
|
if (info.nodeId == idx) {
|
||||||
nextra = n_third;
|
nbeg = 0 * n_third;
|
||||||
nbegin = 0 * n_third;
|
nend = 1 * n_third;
|
||||||
nend = nextra;
|
|
||||||
} else if (info.nodeId == idy) {
|
} else if (info.nodeId == idy) {
|
||||||
nextra = n_third;
|
nbeg = 1 * n_third;
|
||||||
nbegin = 1 * n_third;
|
nend = 2 * n_third;
|
||||||
nend = 2 * nextra;
|
|
||||||
} else if (info.nodeId == idz) {
|
} else if (info.nodeId == idz) {
|
||||||
nextra = _tuplesVec.size() - 2 * n_third;
|
nbeg = 2 * n_third;
|
||||||
nbegin = 2 * n_third;
|
nend = _tuples.size();
|
||||||
nend = _tuplesVec.size();
|
|
||||||
} else {
|
} else {
|
||||||
// either idx or idy or idz is my node
|
// either idx or idy or idz is my node
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
|
|
||||||
nodeTuples.resize(size + nextra);
|
size_t const nextra = nend - nbeg;
|
||||||
std::copy(_tuplesVec.begin() + nbegin,
|
nodeTuples.resize(size + nextra, INVALID_TUPLE);
|
||||||
_tuplesVec.begin() + nend,
|
std::copy(_tuples.begin() + nbeg,
|
||||||
|
_tuples.begin() + nend,
|
||||||
nodeTuples.begin() + size);
|
nodeTuples.begin() + size);
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -387,6 +395,16 @@ ABCTuples specialDistribution(Info const& info, ABCTuples const& allTuples) {
|
|||||||
// we bring the tuples abc back in the order a<b<c
|
// we bring the tuples abc back in the order a<b<c
|
||||||
for (auto &t: nodeTuples) std::sort(t.begin(), t.end());
|
for (auto &t: nodeTuples) std::sort(t.begin(), t.end());
|
||||||
|
|
||||||
|
#if ATRIP_DEBUG > 1
|
||||||
|
if (info.nodeId == 0)
|
||||||
|
std::cout << "checking for validity of " << nodeTuples.size() << std::endl;
|
||||||
|
const bool anyInvalid
|
||||||
|
= std::any_of(nodeTuples.begin(),
|
||||||
|
nodeTuples.end(),
|
||||||
|
[](ABCTuple const& t) { return t == INVALID_TUPLE; });
|
||||||
|
if (anyInvalid) throw "Some tuple is invalid in group-and-sort algorithm";
|
||||||
|
#endif
|
||||||
|
|
||||||
return nodeTuples;
|
return nodeTuples;
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -497,8 +515,6 @@ if (computeDistribution) {
|
|||||||
// Main:4 ends here
|
// Main:4 ends here
|
||||||
|
|
||||||
// [[file:~/atrip/atrip.org::*Main][Main:5]]
|
// [[file:~/atrip/atrip.org::*Main][Main:5]]
|
||||||
LOG(1,"Atrip") << "scattering tuples \n";
|
|
||||||
|
|
||||||
return result;
|
return result;
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|||||||
@ -33,6 +33,7 @@ Atrip::Output Atrip::run(Atrip::Input const& in) {
|
|||||||
const size_t Nv = in.ea->lens[0];
|
const size_t Nv = in.ea->lens[0];
|
||||||
LOG(0,"Atrip") << "No: " << No << "\n";
|
LOG(0,"Atrip") << "No: " << No << "\n";
|
||||||
LOG(0,"Atrip") << "Nv: " << Nv << "\n";
|
LOG(0,"Atrip") << "Nv: " << Nv << "\n";
|
||||||
|
LOG(0,"Atrip") << "np: " << np << "\n";
|
||||||
|
|
||||||
// allocate the three scratches, see piecuch
|
// allocate the three scratches, see piecuch
|
||||||
std::vector<double> Tijk(No*No*No) // doubles only (see piecuch)
|
std::vector<double> Tijk(No*No*No) // doubles only (see piecuch)
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user