Introduction

TNL offers several parallel algorithms for sorting arrays (or vectors), as well as sorting based on user-defined swapping. The latter is more general but also less efficient.

Sorting of arrays and vectors

The sorting of arrays and vectors is accessible via the following functions:

TNL::Algorithms::ascendingSort for sorting the elements of an array in ascending order,
TNL::Algorithms::descendingSort for sorting the elements of an array in descending order,
TNL::Algorithms::sort for sorting with a user-defined ordering.

The following example demonstrates the use of ascending and descending sort:

#include <iostream>
#include <TNL/Containers/Array.h>
#include <TNL/Algorithms/sort.h>
 
using namespace TNL;
using namespace TNL::Containers;
using namespace TNL::Algorithms;
 
/***
 * Fills `array` with pseudo-random integers and prints it, then sorts it in
 * ascending and in descending order, printing the array after each sort.
 *
 * The random values are generated in an auxiliary array by a host-side
 * parallelFor and transferred to `array` by assignment.
 *
 * \tparam ArrayT type of the array to be sorted.
 * \param array array which is overwritten with the random values and sorted in place.
 */
template< typename ArrayT >
void
sort( ArrayT& array )
{
   const int size = 10;

   /****
    * Fill the array with random integers from the range [0, 2 * size).
    * The generator is re-seeded with the same value on every call.
    *
    * NOTE(review): std::rand is not guaranteed to be thread-safe; if the
    * host parallelFor executes this lambda on several threads, the order of
    * the generated values may not be reproducible - confirm.
    */
   Array< int > aux_array( size );
   std::srand( size + 2021 );
   parallelFor< Devices::Host >( 0,
                                 size,
                                 [ & ]( int i )
                                 {
                                    aux_array[ i ] = std::rand() % ( 2 * size );
                                 } );
   array = aux_array;

   std::cout << "Random array: " << array << std::endl;

   /****
    * Sort the array in ascending order.
    */
   ascendingSort( array );
   std::cout << "Array sorted in ascending order:" << array << std::endl;

   /****
    * Sort the array in descending order.
    */
   descendingSort( array );
   std::cout << "Array sorted in descending order:" << array << std::endl;
}
 
int
main( int argc, char* argv[] )
{
   /***
    * Firstly, test the sorting on CPU.
    */
   std::cout << "Sorting on CPU ... " << std::endl;
   Array< int, Devices::Host > host_array;
   sort( host_array );
 
#ifdef __CUDACC__
   /***
    * And then also on GPU.
    */
   std::cout << "Sorting on GPU ... " << std::endl;
   Array< int, Devices::Cuda > cuda_array;
   sort( cuda_array );
#endif
   return EXIT_SUCCESS;
}

Here we create an array with a random sequence of integers using the parallelFor function, and then we sort the array in ascending order using ascendingSort and in descending order using descendingSort.

The result looks as follows:

Sorting on CPU ... 
Random array: [ 5, 1, 15, 5, 0, 11, 2, 14, 14, 8 ]
Array sorted in ascending order:[ 0, 1, 2, 5, 5, 8, 11, 14, 14, 15 ]
Array sorted in descending order:[ 15, 14, 14, 11, 8, 5, 5, 2, 1, 0 ]
Sorting on GPU ... 
Random array: [ 5, 1, 15, 5, 0, 11, 2, 14, 14, 8 ]
Array sorted in ascending order:[ 0, 1, 2, 5, 5, 8, 11, 14, 14, 15 ]
Array sorted in descending order:[ 15, 14, 14, 11, 8, 5, 5, 2, 1, 0 ]

The following example demonstrates how to achieve the same result with a user-defined ordering:

#include <iostream>
#include <TNL/Containers/Array.h>
#include <TNL/Algorithms/sort.h>
 
using namespace TNL;
using namespace TNL::Containers;
using namespace TNL::Algorithms;
 
/***
 * Fills `array` with pseudo-random integers and prints it, then sorts it in
 * ascending and in descending order using user-defined comparison lambdas,
 * printing the array after each sort.
 *
 * The random values are generated in an auxiliary array by a host-side
 * parallelFor and transferred to `array` by assignment.
 *
 * \tparam ArrayT type of the array to be sorted.
 * \param array array which is overwritten with the random values and sorted in place.
 */
template< typename ArrayT >
void
sort( ArrayT& array )
{
   const int size = 10;

   /****
    * Fill the array with random integers from the range [0, 2 * size).
    * The generator is re-seeded with the same value on every call.
    *
    * NOTE(review): std::rand is not guaranteed to be thread-safe; if the
    * host parallelFor executes this lambda on several threads, the order of
    * the generated values may not be reproducible - confirm.
    */
   Array< int > aux_array( size );
   std::srand( size + 2021 );
   parallelFor< Devices::Host >( 0,
                                 size,
                                 [ & ]( int i )
                                 {
                                    aux_array[ i ] = std::rand() % ( 2 * size );
                                 } );
   array = aux_array;

   std::cout << "Random array: " << array << std::endl;

   /****
    * Sort the array in ascending order: the comparison lambda returns true
    * when the first argument is smaller than the second one.
    */
   sort( array,
         [] __cuda_callable__( int a, int b )
         {
            return a < b;
         } );
   std::cout << "Array sorted in ascending order:" << array << std::endl;

   /****
    * Sort the array in descending order: the comparison lambda returns true
    * when the first argument is greater than the second one.
    */
   sort( array,
         [] __cuda_callable__( int a, int b )
         {
            return a > b;
         } );
   std::cout << "Array sorted in descending order:" << array << std::endl;
}
 
int
main( int argc, char* argv[] )
{
   /***
    * Firstly, test the sorting on CPU.
    */
   std::cout << "Sorting on CPU ... " << std::endl;
   Array< int, Devices::Host > host_array;
   sort( host_array );
 
#ifdef __CUDACC__
   /***
    * And then also on GPU.
    */
   std::cout << "Sorting on GPU ... " << std::endl;
   Array< int, Devices::Cuda > cuda_array;
   sort( cuda_array );
#endif
   return EXIT_SUCCESS;
}

The result looks as follows:

Sorting on CPU ... 
Random array: [ 5, 1, 15, 5, 0, 11, 2, 14, 14, 8 ]
Array sorted in ascending order:[ 0, 1, 2, 5, 5, 8, 11, 14, 14, 15 ]
Array sorted in descending order:[ 15, 14, 14, 11, 8, 5, 5, 2, 1, 0 ]
Sorting on GPU ... 
Random array: [ 5, 1, 15, 5, 0, 11, 2, 14, 14, 8 ]
Array sorted in ascending order:[ 0, 1, 2, 5, 5, 8, 11, 14, 14, 15 ]
Array sorted in descending order:[ 15, 14, 14, 11, 8, 5, 5, 2, 1, 0 ]

In the same way, one can also sort TNL::Containers::ArrayView, TNL::Containers::Vector and TNL::Containers::VectorView.

Sorting with user-defined swapping

#include <iostream>
#include <TNL/Containers/Array.h>
#include <TNL/Algorithms/sort.h>
 
using namespace TNL;
using namespace TNL::Containers;
using namespace TNL::Algorithms;
 
/***
 * Fills `array` with pseudo-random integers, creates a second array `index`
 * holding the element positions, and sorts `array` in ascending order using
 * the variant of sort which takes a range of indexes, a comparison lambda
 * and a swapping lambda. The swapping lambda swaps the elements of both
 * arrays, so `index` is permuted together with `array`. Both arrays are
 * printed before and after the sorting.
 *
 * \tparam ArrayT type of the array to be sorted; it is used for the index array too.
 * \param array array which is overwritten with the random values and sorted in place.
 */
template< typename ArrayT >
void
sort( ArrayT& array )
{
   const int size = 10;

   /****
    * Fill the array with random integers from the range [0, 2 * size).
    * The generator is re-seeded with the same value on every call.
    *
    * NOTE(review): std::rand is not guaranteed to be thread-safe; if the
    * host parallelFor executes this lambda on several threads, the order of
    * the generated values may not be reproducible - confirm.
    */
   Array< int > aux_array( size );
   std::srand( size + 2021 );
   parallelFor< Devices::Host >( 0,
                                 size,
                                 [ & ]( int i )
                                 {
                                    aux_array[ i ] = std::rand() % ( 2 * size );
                                 } );
   array = aux_array;

   /***
    * Prepare a second array holding the positions of the elements,
    * i.e. index[ i ] == i.
    */
   ArrayT index( size );
   index.forAllElements(
      [] __cuda_callable__( int idx, int& value )
      {
         value = idx;
      } );
   std::cout << "Random array:     " << array << std::endl;
   std::cout << "Index array:      " << index << std::endl;

   /***
    * Sort the array `array` and apply the same permutation on the array `index`.
    * The lambda functions capture views of the arrays by value.
    */
   auto array_view = array.getView();
   auto index_view = index.getView();
   sort< typename ArrayT::DeviceType,   // device on which the sorting will be performed
         typename ArrayT::IndexType >(  // type used for indexing
      0,
      size,                                              // range of indexes
      [ = ] __cuda_callable__( int i, int j ) -> bool {  // comparison lambda function
         return array_view[ i ] < array_view[ j ];
      },
      [ = ] __cuda_callable__( int i, int j ) mutable {  // lambda function for swapping of elements
         TNL::swap( array_view[ i ], array_view[ j ] );
         TNL::swap( index_view[ i ], index_view[ j ] );
      } );
   std::cout << "Sorted array:      " << array << std::endl;
   std::cout << "Index:             " << index << std::endl;
}
 
int
main( int argc, char* argv[] )
{
   /***
    * Firstly, test the sorting on CPU.
    */
   std::cout << "Sorting on CPU ... " << std::endl;
   Array< int, Devices::Host > host_array;
   sort( host_array );
 
#ifdef __CUDACC__
   /***
    * And then also on GPU.
    */
   std::cout << "Sorting on GPU ... " << std::endl;
   Array< int, Devices::Cuda > cuda_array;
   sort( cuda_array );
#endif
   return EXIT_SUCCESS;
}

In this example, we fill the array `array` with random numbers and the array `index` with the positions of the elements, i.e. index[ i ] = i. We want to sort the array `array` and permute the array `index` correspondingly. This is achieved by calling a variant of the sort function which does not accept an array-like data structure, but only a range of indexes and two lambda functions. The first lambda function defines the ordering of the elements by comparing the elements of the array `array`. The second lambda function is responsible for swapping the elements. Note that we swap not only the elements of the array `array`, but also the elements of the array `index`.

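Note that the values 5 and 14 each occur twice in the array, so the relative order of their positions in the index array is not determined by the comparison and differs between the CPU and GPU runs below. The result looks as follows: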

Sorting on CPU ... 
Random array:     [ 5, 1, 15, 5, 0, 11, 2, 14, 14, 8 ]
Index array:      [ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9 ]
Sorted array:      [ 0, 1, 2, 5, 5, 8, 11, 14, 14, 15 ]
Index:             [ 4, 1, 6, 3, 0, 9, 5, 8, 7, 2 ]
Sorting on GPU ... 
Random array:     [ 5, 1, 15, 5, 0, 11, 2, 14, 14, 8 ]
Index array:      [ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9 ]
Sorted array:      [ 0, 1, 2, 5, 5, 8, 11, 14, 14, 15 ]
Index:             [ 4, 1, 6, 0, 3, 9, 5, 7, 8, 2 ]

Table of Contents

Introduction

Sorting of arrays and vectors

Sorting with user-defined swapping