#include <algorithm>
#include <chrono>
#include <cstdlib>										// getenv, exit, EXIT_FAILURE
#include <cstring>										// strcmp
#include <iostream>
#include <locale>
#include <stdexcept>									// logic_error, runtime_error
#include <string>										// stoi
using namespace std;
using namespace chrono;
#include <uActor.h>
---|
| 7 | |
---|
// Matrix dimensions and processor count; main may override these defaults from the command line.
// X is xr rows by xc columns, Y is xc rows by yc columns, and the product Z is xr rows by yc columns.
unsigned int xr = 3'072;
unsigned int xc = 3'072;
unsigned int yc = 3'072;
unsigned int Processors = 1;
---|
| 9 | |
---|
| 10 | struct WorkMsg : public uActor::Message { // derived message |
---|
| 11 | int * Z; |
---|
| 12 | const int * const X, * const * Y; |
---|
| 13 | WorkMsg( int Z[], const int X[], const int * const Y[] ) : |
---|
| 14 | Message( uActor::Finished ), Z( Z ), X( X ), Y( Y ) {} // one-shot |
---|
| 15 | }; // WorkMsg |
---|
| 16 | |
---|
// Instant at which main begins sending work messages; read again after the actor system stops.
std::chrono::steady_clock::time_point starttime;
---|
| 18 | |
---|
| 19 | _Actor MatrixMult { |
---|
| 20 | Allocation receive( Message & msg ) { |
---|
| 21 | Case ( WorkMsg, msg ) { |
---|
| 22 | int * z = msg_d->Z; // optimizations |
---|
| 23 | const int * const x = msg_d->X, * const * y = msg_d->Y; |
---|
| 24 | for ( unsigned int i = 0; i < yc; i += 1 ) { // multiply X_row by Y_col and sum products |
---|
| 25 | z[i] = 0; |
---|
| 26 | for ( unsigned int j = 0; j < xc; j += 1 ) { |
---|
| 27 | z[i] += x[j] * y[j][i]; |
---|
| 28 | } // for |
---|
| 29 | } // for |
---|
| 30 | } // Case |
---|
| 31 | |
---|
| 32 | return Finished; |
---|
| 33 | } // MatrixMult:::receive |
---|
| 34 | }; // MatrixMult |
---|
| 35 | |
---|
| 36 | int main( int argc, char * argv[] ) { |
---|
| 37 | locale loc( getenv("LANG") ); |
---|
| 38 | cout.imbue( loc ); |
---|
| 39 | |
---|
| 40 | switch ( argc ) { |
---|
| 41 | case 5: |
---|
| 42 | if ( strcmp( argv[4], "d" ) != 0 ) { // default ? |
---|
| 43 | Processors = stoi( argv[4] ); |
---|
| 44 | if ( Processors < 1 ) goto Usage; |
---|
| 45 | } // if |
---|
| 46 | case 4: |
---|
| 47 | if ( strcmp( argv[3], "d" ) != 0 ) { // default ? |
---|
| 48 | xr = stoi( argv[3] ); |
---|
| 49 | if ( xr < 1 ) goto Usage; |
---|
| 50 | } // if |
---|
| 51 | case 3: |
---|
| 52 | if ( strcmp( argv[2], "d" ) != 0 ) { // default ? |
---|
| 53 | xc = stoi( argv[2] ); |
---|
| 54 | if ( xc < 1 ) goto Usage; |
---|
| 55 | } // if |
---|
| 56 | case 2: |
---|
| 57 | if ( strcmp( argv[1], "d" ) != 0 ) { // default ? |
---|
| 58 | yc = stoi( argv[1] ); |
---|
| 59 | if ( yc < 1 ) goto Usage; |
---|
| 60 | } // if |
---|
| 61 | case 1: // use defaults |
---|
| 62 | break; |
---|
| 63 | default: |
---|
| 64 | Usage: |
---|
| 65 | cerr << "Usage: " << argv[0] |
---|
| 66 | << " [ yc (> 0) | 'd' (default " << yc |
---|
| 67 | << ") ] [ xc (> 0) | 'd' (default " << xc |
---|
| 68 | << ") ] [ xr (> 0) | 'd' (default " << xr |
---|
| 69 | << ") ] [ processors (> 0) | 'd' (default " << Processors |
---|
| 70 | << ") ]" << endl; |
---|
| 71 | exit( EXIT_FAILURE ); |
---|
| 72 | } // switch |
---|
| 73 | |
---|
| 74 | unsigned int r, c; |
---|
| 75 | int * Z[xr], * X[xr], * Y[xc]; |
---|
| 76 | |
---|
| 77 | for ( r = 0; r < xr; r += 1 ) { // create/initialize X matrix |
---|
| 78 | X[r] = new int[xc]; |
---|
| 79 | for ( c = 0; c < xc; c += 1 ) { |
---|
| 80 | X[r][c] = r * c % 37; // for timing |
---|
| 81 | } // for |
---|
| 82 | } // for |
---|
| 83 | for ( r = 0; r < xc; r += 1 ) { // create/initialize Y matrix |
---|
| 84 | Y[r] = new int[yc]; |
---|
| 85 | for ( c = 0; c < yc; c += 1 ) { |
---|
| 86 | Y[r][c] = r * c % 37; // for timing |
---|
| 87 | } // for |
---|
| 88 | } // for |
---|
| 89 | for ( r = 0; r < xr; r += 1 ) { // create Z matrix |
---|
| 90 | Z[r] = new int[yc]; |
---|
| 91 | } // for |
---|
| 92 | |
---|
| 93 | uExecutor * executor = new uExecutor( Processors, Processors, Processors == 1 ? 1 : Processors * 32, true, 0 ); |
---|
| 94 | uActor::start( executor ); // start actor system |
---|
| 95 | uNoCtor<MatrixMult> * multiply = new uNoCtor<MatrixMult>[xr]; |
---|
| 96 | uNoCtor<WorkMsg> * workMsg = new uNoCtor<WorkMsg>[xr]; |
---|
| 97 | |
---|
| 98 | for ( unsigned int r = 0; r < xr; r += 1 ) { |
---|
| 99 | multiply[r].ctor(); |
---|
| 100 | workMsg[r].ctor( Z[r], X[r], (const int * const *)Y ); |
---|
| 101 | } // for |
---|
| 102 | |
---|
| 103 | starttime = steady_clock::now(); |
---|
| 104 | for ( unsigned int r = 0; r < xr; r += 1 ) { |
---|
| 105 | *multiply[r] | *workMsg[r]; |
---|
| 106 | } // for |
---|
| 107 | |
---|
| 108 | uActor::stop(); // wait for all actors to terminate |
---|
| 109 | |
---|
| 110 | cout << (steady_clock::now() - starttime).count() / 1'000'000'000.0 << endl; |
---|
| 111 | |
---|
| 112 | for ( r = 0; r < xr; r += 1 ) { // deallocate X and Z matrices |
---|
| 113 | delete [] X[r]; |
---|
| 114 | delete [] Z[r]; |
---|
| 115 | } // for |
---|
| 116 | for ( r = 0; r < xc; r += 1 ) { // deallocate Y matrix |
---|
| 117 | delete [] Y[r]; |
---|
| 118 | } // for |
---|
| 119 | |
---|
| 120 | // malloc_stats(); |
---|
| 121 | } // main |
---|
| 122 | |
---|
| 123 | // /usr/bin/time -f "%Uu %Ss %Er %Mkb" a.out |
---|
| 124 | |
---|
| 125 | // Local Variables: // |
---|
| 126 | // compile-command: "u++-work -g -Wall -Wextra -O3 -nodebug -DNDEBUG -multi uC++Matrix.cc" // |
---|
| 127 | // End: // |
---|