#include <stdlib.h>
#include <stdio.h>
#include <inttypes.h>
#include <time.h>
#include <mpi.h>
/* For MPI versions older than 3, map the 64-bit integer datatype names onto
 * the long-based MPI datatypes.
 * NOTE(review): this presumably relies on long being 64 bits wide -- confirm
 * for the target platforms. */
#if MPI_VERSION < 3
#define OTF2_MPI_UINT64_T MPI_UNSIGNED_LONG
#define OTF2_MPI_INT64_T MPI_LONG
#endif
/*
 * Return the current MPI wall-clock reading as a whole number of
 * nanoseconds.
 *
 * MPI_Wtime() reports seconds as a double; the value is scaled by 1e9 and
 * truncated toward zero by the conversion to uint64_t.
 *
 * The return type is spelled out explicitly: without it the function would
 * fall back to an implicit int return, which is not valid since C99 and
 * would narrow the nanosecond count.
 */
uint64_t
get_time( void )
{
    const double nanoseconds = MPI_Wtime() * 1e9;
    return ( uint64_t )nanoseconds;
}
/* Flush hook that performs no work: its body is empty.
 * NOTE(review): no return type or return statement is visible here, and
 * `bool` needs <stdbool.h> (or an equivalent definition) to be in scope --
 * confirm against the complete definition. */
pre_flush( void* userData,
void* callerData,
bool final )
{
}
/* Flush hook that returns the current value of get_time().
 * NOTE(review): the parameter list is cut off after userData and no return
 * type is visible in this view -- confirm against the complete definition. */
post_flush( void* userData,
{
return get_time();
}
/* Initializer that assigns post_flush to the .otf2_post_flush member.
 * NOTE(review): the declaration this initializer belongs to is not visible
 * in this view. */
{
.otf2_post_flush = post_flush
};
/* Numeric identifiers for the MPI regions referenced from main().
 * Values are consecutive, starting at 0. */
enum
{
    REGION_MPI_INIT             = 0,
    REGION_MPI_FINALIZE         = 1,
    REGION_MPI_COMM_SPLIT       = 2,
    REGION_MPI_INTERCOMM_CREATE = 3,
    REGION_MPI_COMM_FREE        = 4,
    REGION_MPI_BCAST            = 5,
    REGION_MPI_IBARRIER         = 6,
    REGION_MPI_TEST             = 7,
    REGION_MPI_WAIT             = 8
};
/* Numeric identifiers for the communicators referenced from main():
 * the world, the split half used when rank % 2 == 0, the split half used
 * otherwise, and the intercommunicator. Values are consecutive from 0. */
enum
{
    COMM_WORLD     = 0,
    COMM_SPLIT_0   = 1,
    COMM_SPLIT_1   = 2,
    COMM_INTERCOMM = 3
};
/*
 * Program entry point.
 *
 * Visible MPI activity, in order: initialize MPI and query size/rank,
 * barrier, start a non-blocking barrier, split the world by rank parity,
 * build an intercommunicator between the two halves, free the split
 * communicator, broadcast over the intercommunicator, free it, wait for
 * the non-blocking barrier, barrier again, reduce the per-rank epoch
 * bounds, let rank 0 run a definitions section, then barrier and finalize.
 *
 * NOTE(review): many statements in this function appear only as trailing
 * argument lists ("NULL, get_time(), ... );"); the call heads they belong
 * to are not visible in this view. Those lines are kept verbatim.
 *
 * Returns EXIT_SUCCESS.
 */
int
main( int argc,
char** argv )
{
/* Bring up MPI and look up the world size and this process's rank. */
MPI_Init( &argc, &argv );
int size;
MPI_Comm_size( MPI_COMM_WORLD, &size );
int rank;
MPI_Comm_rank( MPI_COMM_WORLD, &rank );
"ArchiveName",
1024 * 1024 ,
4 * 1024 * 1024 ,
MPI_COMM_WORLD,
MPI_COMM_NULL );
rank );
/* Sample the realtime clock and the get_time() clock back to back; both
 * readings are used after the measurement to describe the epoch. */
struct timespec epoch_timestamp_spec;
clock_gettime( CLOCK_REALTIME, &epoch_timestamp_spec );
uint64_t epoch_start = get_time();
NULL,
get_time(),
REGION_MPI_INIT );
NULL,
get_time() );
/* Synchronize all ranks. */
MPI_Barrier( MPI_COMM_WORLD );
NULL,
get_time(),
COMM_WORLD );
NULL,
get_time(),
COMM_WORLD,
0 ,
0 );
NULL,
get_time(),
REGION_MPI_INIT );
NULL,
get_time(),
REGION_MPI_IBARRIER );
/* Identifier passed along with the non-blocking barrier in the fragments
 * below. */
uint64_t barrier_request_id = 1;
NULL,
get_time(),
barrier_request_id );
/* Start a non-blocking barrier; it is completed by MPI_Wait further down. */
MPI_Request barrier_request;
MPI_Ibarrier( MPI_COMM_WORLD, &barrier_request );
NULL,
get_time(),
REGION_MPI_IBARRIER );
MPI_Comm split_comm;
NULL,
get_time(),
REGION_MPI_COMM_SPLIT );
NULL,
get_time() );
/* Split the world by rank parity (color = rank % 2), keyed by world rank. */
MPI_Comm_split( MPI_COMM_WORLD, rank % 2, rank, &split_comm );
if ( 0 == rank % 2 )
{
NULL,
get_time(),
COMM_SPLIT_0 );
}
else
{
NULL,
get_time(),
COMM_SPLIT_1 );
}
NULL,
get_time(),
COMM_WORLD,
0 ,
0 );
NULL,
get_time(),
REGION_MPI_COMM_SPLIT );
MPI_Comm inter_comm;
NULL,
get_time(),
REGION_MPI_INTERCOMM_CREATE );
NULL,
get_time() );
/* Connect the two halves. The local leader is rank 0 of split_comm; the
 * remote leader is world rank 1 for even ranks and world rank 0 for odd
 * ranks; the tag is 1.
 * NOTE(review): world rank 1 is named as a remote leader, so this
 * presumably needs at least two processes -- confirm. */
if ( 0 == rank % 2 )
{
MPI_Intercomm_create( split_comm, 0, MPI_COMM_WORLD, 1, 1, &inter_comm );
}
else
{
MPI_Intercomm_create( split_comm, 0, MPI_COMM_WORLD, 0, 1, &inter_comm );
}
NULL,
get_time(),
COMM_INTERCOMM );
NULL,
get_time(),
COMM_WORLD,
0 ,
0 );
NULL,
get_time(),
REGION_MPI_INTERCOMM_CREATE );
NULL,
get_time(),
REGION_MPI_COMM_FREE );
NULL,
get_time() );
/* The split communicator is no longer needed once the intercommunicator
 * exists. */
MPI_Comm_free( &split_comm );
if ( 0 == rank % 2 )
{
NULL,
get_time(),
COMM_SPLIT_0 );
NULL,
get_time(),
COMM_SPLIT_0,
0 ,
0 );
}
else
{
NULL,
get_time(),
COMM_SPLIT_1 );
NULL,
get_time(),
COMM_SPLIT_1,
0 ,
0 );
}
NULL,
get_time(),
REGION_MPI_COMM_FREE );
NULL,
get_time(),
REGION_MPI_TEST );
NULL,
get_time(),
barrier_request_id );
NULL,
get_time(),
REGION_MPI_TEST );
NULL,
get_time(),
REGION_MPI_BCAST );
NULL,
get_time() );
/* Broadcast one int over the intercommunicator: world rank 0 acts as the
 * root (MPI_ROOT), the other even ranks pass MPI_PROC_NULL, and the odd
 * ranks name rank 0 of the remote group as the root. */
int res = -1;
if ( rank % 2 == 0 )
{
if ( rank == 0 )
{
res = 1;
MPI_Bcast( &res, 1, MPI_INT, MPI_ROOT, inter_comm );
NULL,
get_time(),
COMM_INTERCOMM,
0 ,
0 );
}
else
{
MPI_Bcast( &res, 1, MPI_INT, MPI_PROC_NULL, inter_comm );
NULL,
get_time(),
COMM_INTERCOMM,
0 ,
0 );
}
}
else if ( rank % 2 == 1 )
{
MPI_Bcast( &res, 1, MPI_INT, 0, inter_comm );
NULL,
get_time(),
COMM_INTERCOMM,
0 ,
0 ,
0 );
}
NULL,
get_time(),
REGION_MPI_BCAST );
NULL,
get_time(),
REGION_MPI_COMM_FREE );
NULL,
get_time() );
MPI_Comm_free( &inter_comm );
NULL,
get_time(),
COMM_INTERCOMM );
NULL,
get_time(),
COMM_INTERCOMM,
0 ,
0 );
NULL,
get_time(),
REGION_MPI_COMM_FREE );
NULL,
get_time(),
REGION_MPI_WAIT );
/* Complete the non-blocking barrier started earlier. */
MPI_Status barrier_status;
MPI_Wait( &barrier_request, &barrier_status );
NULL,
get_time(),
COMM_WORLD,
0 ,
0 ,
barrier_request_id );
NULL,
get_time(),
REGION_MPI_WAIT );
NULL,
get_time(),
REGION_MPI_FINALIZE );
NULL,
get_time() );
MPI_Barrier( MPI_COMM_WORLD );
NULL,
get_time(),
COMM_WORLD );
NULL,
get_time(),
COMM_WORLD,
0 ,
0 );
NULL,
get_time(),
REGION_MPI_FINALIZE );
uint64_t epoch_end = get_time();
rank );
/* Realtime reading in nanoseconds. Widen to 64 bits before multiplying so
 * the product cannot overflow where time_t is only 32 bits wide. */
uint64_t epoch_timestamp = ( uint64_t )epoch_timestamp_spec.tv_sec * UINT64_C( 1000000000 ) + ( uint64_t )epoch_timestamp_spec.tv_nsec;
/* Value/rank pair for MPI_MINLOC: after the reduction the global pair
 * holds the smallest epoch_start and the rank it came from.
 * NOTE(review): MPI_LONG_INT describes a { long, int } pair while
 * timestamp is uint64_t -- confirm long is 64 bits on target platforms. */
struct
{
uint64_t timestamp;
int index;
} epoch_start_pair, global_epoch_start_pair;
epoch_start_pair.timestamp = epoch_start;
epoch_start_pair.index = rank;
MPI_Allreduce( &epoch_start_pair,
&global_epoch_start_pair,
1, MPI_LONG_INT, MPI_MINLOC,
MPI_COMM_WORLD );
/* A transfer to rank 0 is only needed when the earliest start belongs to
 * another rank. The decision must use the reduced (global) index: the
 * local index equals this process's own rank, which would make the rank-0
 * branch unreachable and would send every non-zero rank down the other
 * branch. Only the owning rank takes the sending side.
 * NOTE(review): the call heads of the two argument tails below are not
 * visible in this view; they look like a receive (source, tag, comm,
 * status) and a send (dest, tag, comm) -- confirm. */
if ( global_epoch_start_pair.index != 0 )
{
if ( rank == 0 )
{
global_epoch_start_pair.index, 0, MPI_COMM_WORLD, MPI_STATUS_IGNORE );
}
else if ( rank == global_epoch_start_pair.index )
{
0, 0, MPI_COMM_WORLD );
}
}
/* Reduce the per-rank epoch_end values to rank 0.
 * NOTE(review): the count/datatype/operation arguments are not visible in
 * this view. */
uint64_t global_epoch_end;
MPI_Reduce( &epoch_end,
&global_epoch_end,
0, MPI_COMM_WORLD );
/* Only rank 0 executes the section below. */
if ( 0 == rank )
{
1000000000,
global_epoch_start_pair.timestamp,
global_epoch_end - global_epoch_start_pair.timestamp + 1,
epoch_timestamp );
REGION_MPI_INIT,
2 ,
3 ,
0 ,
22 ,
0 ,
0 );
REGION_MPI_FINALIZE,
4 ,
5 ,
0 ,
22 ,
0 ,
0 );
REGION_MPI_COMM_SPLIT,
6 ,
7 ,
0 ,
22 ,
0 ,
0 );
REGION_MPI_INTERCOMM_CREATE,
8 ,
9 ,
0 ,
22 ,
0 ,
0 );
REGION_MPI_COMM_FREE,
10 ,
11 ,
0 ,
22 ,
0 ,
0 );
REGION_MPI_BCAST,
12 ,
13 ,
0 ,
22 ,
0 ,
0 );
REGION_MPI_IBARRIER,
14 ,
15 ,
0 ,
22 ,
0 ,
0 );
REGION_MPI_TEST,
16 ,
17 ,
0 ,
22 ,
0 ,
0 );
REGION_MPI_WAIT,
18 ,
19 ,
0 ,
22 ,
0 ,
0 );
0 ,
20 ,
21 ,
/* One iteration per rank; each builds the label "MPI Rank <r>". */
for ( int r = 0; r < size; r++ )
{
char process_name[ 32 ];
snprintf( process_name, sizeof( process_name ), "MPI Rank %d", r );
27 + r,
process_name );
r ,
27 + r ,
0 ,
r ,
1 ,
43 ,
r );
}
/* Scratch list of member ranks, reused for each group below. It starts as
 * the identity mapping 0..size-1. */
uint64_t comm_locations[ size ];
for ( int r = 0; r < size; r++ )
{
comm_locations[ r ] = r;
}
0 ,
24 ,
size,
comm_locations );
1 ,
0 ,
size,
comm_locations );
COMM_WORLD,
23 ,
1 ,
/* Even ranks, packed at the front: ( size + 1 ) / 2 entries. */
for ( int r = 0; r < size; r += 2 )
{
comm_locations[ r / 2 ] = r;
}
2 ,
0 ,
( size + 1 ) / 2,
comm_locations );
COMM_SPLIT_0,
24 ,
2 ,
COMM_WORLD,
/* Odd ranks, packed at the front: size / 2 entries. */
for ( int r = 1; r < size; r += 2 )
{
comm_locations[ r / 2 ] = r;
}
3 ,
0 ,
size / 2,
comm_locations );
COMM_SPLIT_1,
25 ,
3 ,
COMM_WORLD,
COMM_INTERCOMM,
26 ,
2 ,
3 ,
COMM_WORLD,
global_def_writer );
}
/* Let every rank reach this point before shutting MPI down. */
MPI_Barrier( MPI_COMM_WORLD );
MPI_Finalize();
return EXIT_SUCCESS;
}