|
| 1 | +#include <mpi.h> |
| 2 | +#include <stdio.h> |
| 3 | +#include <stddef.h> |
| 4 | +#include <stdlib.h> |
| 5 | +#include <string.h> |
| 6 | + |
| 7 | +#include "ompi_config.h" |
| 8 | +#include "ompi/datatype/ompi_datatype.h" |
| 9 | +#include "opal/runtime/opal.h" |
| 10 | +#include "opal/datatype/opal_convertor.h" |
| 11 | +#include "opal/datatype/opal_datatype_internal.h" |
| 12 | + |
| 13 | +#define MAX_IOVEC 10 |
| 14 | +#define MAX_CHUNK (1024*1024*1024) /* 1GB */ |
| 15 | + |
| 16 | +static size_t |
| 17 | +count_length_via_convertor_raw(MPI_Datatype dtype, int count) |
| 18 | +{ |
| 19 | + opal_convertor_t* pconv; |
| 20 | + struct iovec iov[MAX_IOVEC]; |
| 21 | + uint32_t iov_count = MAX_IOVEC, i; |
| 22 | + size_t length = MAX_CHUNK, packed_iovec = 0, packed = 0; |
| 23 | + |
| 24 | + pconv = opal_convertor_create( opal_local_arch, 0 ); |
| 25 | + opal_convertor_prepare_for_send(pconv, (const struct opal_datatype_t *)dtype, 1, NULL); |
| 26 | + while( 0 == opal_convertor_raw(pconv, iov, &iov_count, &length) ) { |
| 27 | + printf("iov_count = %d packed_iovec = %"PRIsize_t"\n", iov_count, packed_iovec); |
| 28 | + packed += length; |
| 29 | + for( i = 0; i < iov_count; i++ ) { |
| 30 | + packed_iovec += iov[i].iov_len; |
| 31 | + } |
| 32 | + if( packed != packed_iovec ) { |
| 33 | + printf( "Packed send amount diverges %"PRIsize_t" != %"PRIsize_t"\n", packed, packed_iovec); |
| 34 | + exit(-1); |
| 35 | + } |
| 36 | + iov_count = MAX_IOVEC; /* number of available iov */ |
| 37 | + length = MAX_CHUNK; |
| 38 | + } |
| 39 | + packed += length; |
| 40 | + for( i = 0; i < iov_count; i++ ) { |
| 41 | + packed_iovec += iov[i].iov_len; |
| 42 | + } |
| 43 | + if( packed != packed_iovec ) { |
| 44 | + printf( "Packed send amount diverges %"PRIsize_t" != %"PRIsize_t"\n", packed, packed_iovec); |
| 45 | + exit(-1); |
| 46 | + } |
| 47 | + return packed_iovec; |
| 48 | +} |
| 49 | + |
| 50 | +int main(int argc, char * argv[]) |
| 51 | +{ |
| 52 | + |
| 53 | + int const per_process = 192; |
| 54 | + int const per_type = 20000000; |
| 55 | + |
| 56 | + int scounts[2] = {per_process, per_process}; |
| 57 | + int sdispls[2] = {3*per_process, 0*per_process}; |
| 58 | + int rcounts[2] = {per_process, per_process}; |
| 59 | + int rdispls[2] = {1*per_process, 2*per_process}; |
| 60 | + |
| 61 | + MPI_Datatype ddt, stype, rtype; |
| 62 | + |
| 63 | + opal_init_util(&argc, &argv); |
| 64 | + ompi_datatype_init(); |
| 65 | + |
| 66 | + ompi_datatype_create_contiguous( per_type, MPI_FLOAT, &ddt); |
| 67 | + ompi_datatype_create_indexed(2, scounts, sdispls, ddt, &stype); |
| 68 | + ompi_datatype_commit(&stype); |
| 69 | + ompi_datatype_create_indexed(2, rcounts, rdispls, ddt, &rtype); |
| 70 | + ompi_datatype_commit(&rtype); |
| 71 | + |
| 72 | + size_t packed = count_length_via_convertor_raw(stype, 1); |
| 73 | + size_t length; |
| 74 | + opal_datatype_type_size(&stype->super, &length); |
| 75 | + if( length != packed ) { |
| 76 | + printf("Mismatched length of packed data to datatype size (%"PRIsize_t" != %"PRIsize_t")\n", |
| 77 | + packed, length); |
| 78 | + exit(-2); |
| 79 | + } |
| 80 | + |
| 81 | + packed = count_length_via_convertor_raw(rtype, 1); |
| 82 | + opal_datatype_type_size(&rtype->super, &length); |
| 83 | + if( length != packed ) { |
| 84 | + printf("Mismatched length of packed data to datatype size (%"PRIsize_t" != %"PRIsize_t")\n", |
| 85 | + packed, length); |
| 86 | + exit(-2); |
| 87 | + } |
| 88 | + |
| 89 | + ompi_datatype_destroy(&stype); |
| 90 | + ompi_datatype_destroy(&rtype); |
| 91 | + |
| 92 | + return 0; |
| 93 | +} |
0 commit comments