AUTH's THMMY "Parallel and distributed systems" course assignments.
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

distsort.hpp 12 KiB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328
  1. /*!
  2. * \file
  3. * \brief Distributed sort implementation header
  4. *
  5. * \author
  6. * Christos Choutouridis AEM:8997
  7. * <cchoutou@ece.auth.gr>
  8. */
  9. #ifndef DISTBITONIC_H_
  10. #define DISTBITONIC_H_
  11. #include <vector>
  12. #include <algorithm>
  13. #include <cmath>
  14. #include <cstdint>
  15. #if !defined DEBUG
  16. #define NDEBUG
  17. #endif
  18. #include <cassert>
  19. #include "utils.hpp"
  20. #include "config.h"
  21. /*!
  22. * Enumerator for the different versions of the sorting method
  23. */
  24. enum class SortMode {
  25. Bubbletonic, //!< The v0.5 of the algorithm where we use a bubble-sort like approach
  26. Bitonic //!< The v1.0 of the algorithm where we use the bitonic data-exchange approach
  27. };
  28. /*
  29. * ============================== Sort utilities ==============================
  30. */
  31. /*!
  32. * The primary function template of ascending(). It is DISABLED since , it is explicitly specialized
  33. * for each of the \c SortMode
  34. */
  35. template <SortMode Mode> inline bool ascending(mpi_id_t, [[maybe_unused]] size_t) noexcept = delete;
  36. /*!
  37. * Returns the ascending or descending configuration of the node's sequence based on
  38. * the current node (MPI process) and the depth of the sorting network
  39. *
  40. * @param node [mpi_id_t] The current node (MPI process)
  41. * @return [bool] True if we need ascending configuration, false otherwise
  42. */
  43. template <> inline
  44. bool ascending<SortMode::Bubbletonic>(mpi_id_t node, [[maybe_unused]] size_t depth) noexcept {
  45. return (node % 2) == 0;
  46. }
  47. /*!
  48. * Returns the ascending or descending configuration of the node's sequence based on
  49. * the current node (MPI process) and the depth of the sorting network
  50. *
  51. * @param node [mpi_id_t] The current node (MPI process)
  52. * @param depth [size_t] The total depth of the sorting network (same for each step for a given network)
  53. * @return [bool] True if we need ascending configuration, false otherwise
  54. */
  55. template <> inline
  56. bool ascending<SortMode::Bitonic>(mpi_id_t node, size_t depth) noexcept {
  57. return !(node & (1 << depth));
  58. }
  59. /*!
  60. * The primary function template of partner(). It is DISABLED since , it is explicitly specialized
  61. * for each of the \c SortMode
  62. */
  63. template <SortMode Mode> inline mpi_id_t partner(mpi_id_t, size_t) noexcept = delete;
  64. /*!
  65. * Returns the node's partner for data exchange during the sorting network iterations
  66. * of Bubbletonic
  67. *
  68. * @param node [mpi_id_t] The current node
  69. * @param step [size_t] The step of the sorting network
  70. * @return [mpi_id_t] The node id of the partner for data exchange
  71. */
  72. template <> inline
  73. mpi_id_t partner<SortMode::Bubbletonic>(mpi_id_t node, size_t step) noexcept {
  74. //return (node % 2 == step % 2) ? node + 1 : node - 1;
  75. return (((node+step) % 2) == 0) ? node + 1 : node - 1;
  76. }
  77. /*!
  78. * Returns the node's partner for data exchange during the sorting network iterations
  79. * of Bitonic
  80. *
  81. * @param node [mpi_id_t] The current node
  82. * @param step [size_t] The step of the sorting network
  83. * @return [mpi_id_t] The node id of the partner for data exchange
  84. */
  85. template <> inline
  86. mpi_id_t partner<SortMode::Bitonic>(mpi_id_t node, size_t step) noexcept {
  87. return (node ^ (1 << step));
  88. }
  89. /*!
  90. * The primary function template of keepSmall(). It is DISABLED since , it is explicitly specialized
  91. * for each of the \c SortMode
  92. */
  93. template<SortMode Mode> inline bool keepSmall(mpi_id_t, mpi_id_t, [[maybe_unused]] size_t) = delete;
  94. /*!
  95. * Predicate to check if a node keeps the small numbers during the bubbletonic sort network exchange.
  96. *
  97. * @param node [mpi_id_t] The node for which we check
  98. * @param partner [mpi_id_t] The partner of the data exchange
  99. * @return [bool] True if the node should keep the small values, false otherwise
  100. */
  101. template <> inline
  102. bool keepSmall<SortMode::Bubbletonic>(mpi_id_t node, mpi_id_t partner, [[maybe_unused]] size_t depth) {
  103. if (node == partner)
  104. throw std::runtime_error("(keepSmall) Node and Partner can not be the same\n");
  105. return (node < partner);
  106. }
  107. /*!
  108. * Predicate to check if a node keeps the small numbers during the bitonic sort network exchange.
  109. *
  110. * @param node [mpi_id_t] The node for which we check
  111. * @param partner [mpi_id_t] The partner of the data exchange
  112. * @param depth [size_t] The total depth of the sorting network (same for each step for a given network)
  113. * @return [bool] True if the node should keep the small values, false otherwise
  114. */
  115. template <> inline
  116. bool keepSmall<SortMode::Bitonic>(mpi_id_t node, mpi_id_t partner, size_t depth) {
  117. if (node == partner)
  118. throw std::runtime_error("(keepSmall) Node and Partner can not be the same\n");
  119. return ascending<SortMode::Bitonic>(node, depth) == (node < partner);
  120. }
  121. /*!
  122. * Predicate to check if the node is active in the current iteration of the bubbletonic
  123. * sort exchange.
  124. *
  125. * @param node [mpi_id_t] The node to check
  126. * @param nodes [size_t] The total number of nodes
  127. * @return [bool] True if the node is active, false otherwise
  128. */
  129. bool isActive(mpi_id_t node, size_t nodes);
  130. /*
  131. * ============================== Data utilities ==============================
  132. */
  133. /*!
  134. * Sort a range using the build-in O(Nlog(N)) algorithm
  135. *
  136. * @tparam RangeT A range type with random access iterator
  137. *
  138. * @param data [RangeT] The data to be sorted
  139. * @param ascending [bool] Flag to indicate the sorting order
  140. */
  141. template<typename RangeT>
  142. void fullSort(RangeT& data, bool ascending) noexcept {
  143. // Use introsort from stdlib++ here, unless ...
  144. if (ascending)
  145. std::sort(data.begin(), data.end(), std::less<>());
  146. else
  147. std::sort(data.begin(), data.end(), std::greater<>());
  148. }
  149. /*!
  150. * Core functionality of sort for shadowed buffer types using
  151. * the "elbow sort" algorithm.
  152. *
  153. * @note:
  154. * This algorithm can not work "in place".
  155. * We use the active buffer as source and the shadow as target.
  156. * At the end we switch which buffer is active and which is the shadow.
  157. * @note
  158. * This is the core functionality. Use the elbowSort() function instead
  159. *
  160. * @tparam ShadowedT A Shadowed buffer type with random access iterator.
  161. * @tparam CompT A Comparison type for binary operation comparisons
  162. *
  163. * @param data [ShadowedT] The data to sort
  164. * @param ascending [bool] Flag to indicate the sorting order
  165. * @param comp [CompT] The binary operator object
  166. */
  167. template<typename ShadowedT, typename CompT>
  168. void elbowSortCore(ShadowedT& data, bool ascending, CompT comp) noexcept {
  169. auto& active = data.getActive(); // Get the source vector (the data to sort)
  170. auto& shadow = data.getShadow(); // Get the target vector (the sorted data)
  171. size_t N = data.size(); // The total size is the same or both vectors
  172. size_t left = std::distance(
  173. active.begin(),
  174. (ascending) ?
  175. std::min_element(active.begin(), active.end()) :
  176. std::max_element(active.begin(), active.end())
  177. ); // start 'left' from elbow of the bitonic
  178. size_t right = (left == N-1) ? 0 : left + 1;
  179. // Walk in opposite directions from elbow and insert-sort to target vector
  180. for (size_t i = 0 ; i<N ; ++i) {
  181. if (comp(active[left], active[right])) {
  182. shadow[i] = active[left];
  183. left = (left == 0) ? N-1 : left -1; // cycle decrease
  184. }
  185. else {
  186. shadow[i] = active[right];
  187. right = (right + 1) % N; // cycle increase
  188. }
  189. }
  190. data.switch_active(); // Switch active-shadow buffers
  191. }
  192. /*!
  193. * Sort a shadowed buffer using the "elbow sort" algorithm.
  194. *
  195. * @tparam ShadowedT A Shadowed buffer type with random access iterator.
  196. *
  197. * @param data [ShadowedT] The data to sort
  198. * @param ascending [bool] Flag to indicate the sorting order
  199. */
  200. template<typename ShadowedT>
  201. void elbowSort(ShadowedT& data, bool ascending) noexcept {
  202. if (ascending)
  203. elbowSortCore(data, ascending, std::less<>());
  204. else
  205. elbowSortCore(data, ascending, std::greater<>());
  206. }
  207. /*!
  208. * Takes two sorted sequences where one is in increasing and the other is in decreasing order
  209. * and selects either the larger or the smaller items in one-to-one comparison between them.
  210. * The result is a bitonic sequence.
  211. *
  212. * @tparam RangeT A range type with random access iterator
  213. *
  214. * @param local [RangeT] Reference to the local sequence
  215. * @param remote [const RangeT] Reference to the remote sequence (copied locally by MPI)
  216. * @param keepSmall [bool] Flag to indicate if we keep the small items in local sequence
  217. */
  218. template<typename RangeT>
  219. void minmax(RangeT& local, const RangeT& remote, bool keepSmall) noexcept {
  220. using value_t = typename RangeT::value_type;
  221. std::transform(
  222. local.begin(), local.end(),
  223. remote.begin(),
  224. local.begin(),
  225. [&keepSmall](const value_t& a, const value_t& b){
  226. return (keepSmall) ? std::min(a, b) : std::max(a, b);
  227. });
  228. }
  229. /*
  230. * ============================== Sort algorithms ==============================
  231. */
  232. /*!
  233. * A distributed version of the Bubbletonic sort algorithm.
  234. *
  235. * @note
  236. * Each MPI process should run an instance of this function.
  237. *
  238. * @tparam ShadowedT A Shadowed buffer type with random access iterator.
  239. *
  240. * @param data [ShadowedT] The local to MPI process data to sort
  241. * @param Processes [mpi_id_t] The total number of MPI processes
  242. */
  243. template<typename ShadowedT>
  244. void distBubbletonic(ShadowedT& data, mpi_id_t Processes, mpi_id_t rank) {
  245. // Initially sort to create a half part of a bitonic sequence
  246. fullSort(data, ascending<SortMode::Bubbletonic>(rank, 0));
  247. // Sort network (O(N) iterations)
  248. for (size_t step = 0; step < static_cast<size_t>(Processes); ++step) {
  249. // Find out exchange configuration
  250. auto part = partner<SortMode::Bubbletonic>(rank, step);
  251. auto ks = keepSmall<SortMode::Bubbletonic>(rank, part, Processes);
  252. if ( isActive(rank, Processes) &&
  253. isActive(part, Processes) ) {
  254. // Exchange with partner, keep nim-or-max and sort - O(N)
  255. mpi.exchange(part, data.getActive(), data.getShadow(), step);
  256. minmax(data.getActive(), data.getShadow(), ks);
  257. elbowSort(data, ascending<SortMode::Bubbletonic>(rank, Processes));
  258. }
  259. }
  260. // Invert if the node was descending.
  261. if (!ascending<SortMode::Bubbletonic>(rank, 0))
  262. elbowSort(data, true);
  263. }
  264. /*!
  265. * A distributed version of the Bitonic sort algorithm.
  266. *
  267. * @note
  268. * Each MPI process should run an instance of this function.
  269. *
  270. * @tparam ShadowedT A Shadowed buffer type with random access iterator.
  271. *
  272. * @param data [ShadowedT] The local to MPI process data to sort
  273. * @param Processes [mpi_id_t] The total number of MPI processes
  274. */
  275. template<typename ShadowedT>
  276. void distBitonic(ShadowedT& data, mpi_id_t Processes, mpi_id_t rank) {
  277. // Initially sort to create a half part of a bitonic sequence
  278. fullSort(data, ascending<SortMode::Bitonic>(rank, 0));
  279. // Run through sort network using elbow-sort ( O(LogN * LogN) iterations )
  280. auto p = static_cast<uint32_t>(std::log2(Processes));
  281. for (size_t depth = 1; depth <= p; ++depth) {
  282. for (size_t step = depth; step > 0;) {
  283. --step;
  284. // Find out exchange configuration
  285. auto part = partner<SortMode::Bitonic>(rank, step);
  286. auto ks = keepSmall<SortMode::Bitonic>(rank, part, depth);
  287. // Exchange with partner, keep nim-or-max
  288. mpi.exchange(part, data.getActive(), data.getShadow(), (depth << 8) | step);
  289. minmax(data.getActive(), data.getShadow(), ks);
  290. }
  291. // sort - O(N)
  292. elbowSort (data, ascending<SortMode::Bitonic>(rank, depth));
  293. }
  294. }
  295. #endif //DISTBITONIC_H_