[764b4b2] | 1 | // |
---|
[2e457d8] | 2 | // Cforall Version 1.0.0 Copyright (C) 2017 University of Waterloo |
---|
| 3 | // |
---|
[90449e4] | 4 | // The contents of this file are covered under the licence agreement in the |
---|
| 5 | // file "LICENCE" distributed with Cforall. |
---|
[764b4b2] | 6 | // |
---|
[90449e4] | 7 | // quickSort.c -- In-place concurrent quick-sort: threads are created to partition to a specific depth, then sequential |
---|
| 8 | // recursive-calls are used to sort each partition. |
---|
[764b4b2] | 9 | // |
---|
[90449e4] | 10 | // Author : Peter A. Buhr |
---|
| 11 | // Created On : Wed Dec 6 12:15:52 2017 |
---|
| 12 | // Last Modified By : Peter A. Buhr |
---|
[921cd82] | 13 | // Last Modified On : Wed Feb 12 18:24:47 2020 |
---|
| 14 | // Update Count : 177 |
---|
[764b4b2] | 15 | // |
---|
[90449e4] | 16 | |
---|
[73abe95] | 17 | #include <fstream.hfa> |
---|
| 18 | #include <stdlib.hfa> |
---|
| 19 | #include <kernel.hfa> |
---|
| 20 | #include <thread.hfa> |
---|
[90449e4] | 21 | #include <string.h> // strcmp |
---|
| 22 | |
---|
| 23 | thread Quicksort { |
---|
[f0322e20] | 24 | int * values; // communication variables |
---|
[90449e4] | 25 | int low, high, depth; |
---|
| 26 | }; |
---|
| 27 | |
---|
// Public constructor: sort values[0..size] using up to `depth` levels of thread creation.
// Despite its name, `size` is stored as the inclusive upper index; callers in this file pass
// (number of elements - 1).
void ?{}( Quicksort & qs, int values[], int size, int depth ) {
	qs.values = values;
	qs.low = 0;
	qs.high = size;
	qs.depth = depth;
} // Quicksort
---|
| 31 | |
---|
// Thread body: sorts qs.values[qs.low..qs.high] (inclusive bounds) in place. The first qs.depth
// partition levels hand each half to a new Quicksort thread; below that the halves are sorted by
// ordinary recursive calls.
void main( Quicksort & qs ) {							// thread starts here
	// nested routines: information hiding

	// Internal constructor used when a partition step creates threads for a sub-range.
	void ?{}( Quicksort & qs, int values[], int low, int high, int depth ) {
		qs.[values, low, high, depth] = [values, low, high, depth];
	} // Quicksort

	// Sort values[low..high]; depth > 0 means both halves are given to new threads.
	void sort( int values[], int low, int high, int depth ) {
		//verify();										// check for stack overflow due to recursion

		if ( low >= high ) return;						// fewer than 2 elements => nothing to partition

		int pivot = values[low + ( high - low ) / 2];	// value of the middle element
		int left = low;									// scans upward from the low end
		int right = high;								// scans downward from the high end

		// partition: move values < pivot before the crossing point and values > pivot after it;
		// low < high here, so the body always executes at least once
		while ( left <= right ) {
			while ( values[left] < pivot ) left += 1;
			while ( pivot < values[right] ) right -= 1;
			if ( left <= right ) {
				swap( values[left], values[right] );	// interchange values
				left += 1;
				right -= 1;
			} // if
		} // while

		// restrict number of tasks to slightly greater than number of processors
		if ( depth > 0 ) {
			Quicksort lqs = { values, low, right, depth - 1 }; // concurrently sort lower half
			Quicksort rqs = { values, left, high, depth - 1 }; // concurrently sort upper half
		} else {
			sort( values, low, right, 0 );				// sequentially sort lower half
			sort( values, left, high, 0 );				// sequentially sort upper half
		} // if
	} // sort

	sort( qs.values, qs.low, qs.high, qs.depth );
} // main
---|
| 83 | |
---|
| 84 | |
---|
// Convert the C string nptr (base 10) to an int.
//   val  : receives the converted value; left unchanged when false is returned
//   nptr : NUL-terminated string to convert
// Returns true only when the string is non-empty, is consumed entirely by the conversion, and
// the value fits in an int.
bool convert( int & val, const char * nptr ) {			// convert C string to integer
	char * eptr;
	// Convert at the widest signed width so an out-of-range value can be detected instead of
	// being silently truncated to int.
	long long int wide = strto( nptr, &eptr, 10 );
	if ( *nptr == '\0' || *eptr != '\0' ) return false;	// empty string or extra characters
	if ( wide != (int)wide ) return false;				// does not round-trip => outside int range
	val = (int)wide;									// do not change val on false
	return true;
} // convert
---|
| 91 | |
---|
// Print the command-line synopsis on sout and terminate the program with EXIT_FAILURE.
// The synopsis lists the forms the argument parser in this file accepts: no arguments, an input
// file name optionally followed by an output file name, or "-t size [ depth ]". There is no "-s"
// flag: the first non-"-t" argument is itself taken as the input file name.
void usage( char * argv[] ) {
	sout | "Usage:" | argv[0] | "( [ unsorted-file [ sorted-file ] ] | -t size (>= 0) [ depth (>= 0) ] )";
	exit( EXIT_FAILURE );								// TERMINATE!
} // usage
---|
| 96 | |
---|
[edb6f79] | 97 | |
---|
// Program entry point. Two modes:
//   * sort mode (default): repeatedly read "count v1 ... vcount" lists from the input, echo each
//     unsorted list, sort it with a single Quicksort thread (depth 0), and print the sorted list.
//     Input/output default to sin/sout; argv[1] / argv[2] name replacement files.
//   * timing mode ("-t size [ depth ]"): build a nearly-descending array of `size` values, sort it
//     with `depth` levels of thread creation on 2^depth-1 additional processors, print nothing.
// Any malformed command line goes through usage(), which terminates the program.
int main( int argc, char * argv[] ) {
	ifstream & unsortedfile = sin;
	ofstream & sortedfile = sout;						// default value
	int depth = 0, size = 0;

	if ( argc != 1 ) {									// do not use defaults
		if ( argc < 2 || argc > 4 ) usage( argv );		// wrong number of options
		if ( strcmp( argv[1], "-t" ) == 0 ) {			// timing ?
			if ( argc < 3 ) usage( argv );				// size is mandatory, otherwise it is never set
			&unsortedfile = (ifstream *)0;				// no input
			choose ( argc ) {
			  case 4:
				if ( ! convert( depth, argv[3] ) || depth < 0 ) usage( argv );
				fallthrough;
			  case 3:
				if ( ! convert( size, argv[2] ) || size < 0 ) usage( argv );
			} // choose
		} else {										// sort file
			if ( argc > 3 ) usage( argv );				// at most an input and an output file name
			// Open the input first so a bad input name cannot leave behind a freshly created
			// (or truncated) output file.
			&unsortedfile = new( (const char *)argv[1] ); // open the input file
			if ( fail( unsortedfile ) ) {
				serr | "Error! Could not open unsorted input file \"" | argv[1] | "\"";
				usage( argv );
			} // if
			if ( argc == 3 ) {
				&sortedfile = new( (const char *)argv[2] ); // open the output file
				if ( fail( sortedfile ) ) {
					serr | "Error! Could not open sorted output file \"" | argv[2] | "\"";
					usage( argv );
				} // if
			} // if
		} // if
	} // if
	sortedfile | nlOff;									// turn off auto newline

	enum { ValuesPerLine = 22 };						// number of values printed per line

	if ( &unsortedfile ) {								// generate output ?
		for () {
			unsortedfile | size;						// read number of elements in the list
			if ( eof( unsortedfile ) ) break;
			if ( size < 0 ) {							// a negative count must not reach alloc
				serr | "Error! Negative number of elements" | size | "in unsorted input";
				exit( EXIT_FAILURE );
			} // if
			int * values = alloc( size );				// values to be sorted, too large to put on stack
			for ( counter; size ) {						// read unsorted numbers
				unsortedfile | values[counter];
				if ( counter != 0 && counter % ValuesPerLine == 0 ) sortedfile | nl | " ";
				sortedfile | values[counter];
				if ( counter < size - 1 && (counter + 1) % ValuesPerLine != 0 ) sortedfile | ' ';
			} // for
			sortedfile | nl;
			if ( size > 0 ) {							// values to sort ?
				Quicksort QS = { values, size - 1, 0 };	// sort values
			} // wait until sort tasks terminate
			for ( counter; size ) {						// print sorted list
				if ( counter != 0 && counter % ValuesPerLine == 0 ) sortedfile | nl | " ";
				sortedfile | values[counter];
				if ( counter < size - 1 && (counter + 1) % ValuesPerLine != 0 ) sortedfile | ' ';
			} // for
			sortedfile | nl | nl;

			delete( values );
		} // for
		if ( &unsortedfile != &sin ) delete( &unsortedfile ); // close input/output files
		if ( &sortedfile != &sout ) delete( &sortedfile );
	} else {
		// NOTE(review): depth has no upper bound, so a large value makes 1 << depth overflow and
		// requests an enormous processor array; consider capping it.
		processor processors[ (1 << depth) - 1 ] __attribute__(( unused )); // create 2^depth-1 kernel threads

		int * values = alloc( size );					// values to be sorted, too large to put on stack
		for ( counter; size ) {							// generate unsorted numbers
			values[counter] = size - counter;			// descending values
		} // for
		if ( size > 0 ) {								// rand() % 0 is undefined
			for ( i; 200 ) {							// random shuffle a few values
				swap( values[rand() % size], values[rand() % size] );
			} // for
		} // if
		{
			Quicksort QS = { values, size - 1, depth };	// sort values
		} // wait until sort tasks terminate

		// for ( counter; size - 1 ) {					// check sorting
		// 	if ( values[counter] > values[counter + 1] ) abort();
		// } // for

		delete( values );
	} // if
} // main
---|
| 183 | |
---|
[fdf4efb] | 184 | // for depth in 0 1 2 3 4 5 ; do echo "sort 500000000 values with ${depth} depth" ; time -f "%Uu %Ss %E %Mkb" a.out -t 500000000 ${depth} ; done |
---|
| 185 | |
---|
[90449e4] | 186 | // Local Variables: // |
---|
| 187 | // tab-width: 4 // |
---|
[f8cd310] | 188 | // compile-command: "cfa quickSort.cfa" // |
---|
[90449e4] | 189 | // End: // |
---|