Transfers strided data to a specified processing element (PE).
#include <shmem.h>
void shmem_int_iput(int *target, const int *source, ptrdiff_t tst, ptrdiff_t sst, size_t len, int pe);
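This routine provides a high-performance method for copying a strided array from the local PE to a data object on a different PE. Elements are read from source with a stride of sst and written to target with a stride of tst; both strides are counted in elements.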
This routine returns when the data has been copied out of the source array on the local PE, but not necessarily before the data has been delivered to the remote data object. To enforce the ordering/completion of the iput routines, the use of shmem_fence, shmem_quiet, shmem_barrier or shmem_barrier_all is needed.
The function shmem_int_iput() writes a strided array of type int to the remote PE.
Please refer to the Atomicity and Coherency section of the OpenSHMEM documentation for the atomicity and coherence model.
#include <stdlib.h> #include <stdio.h> #include <shmem.h> #define GLOBAL_ARRAY_SIZE 20 #define SOURCE_STRIDE 3 #define TARGET_STRIDE 4 #define NUM_OF_TRANS_ELEM 5 static int gIntArray[GLOBAL_ARRAY_SIZE] = {0}; int main (int argc, char* argv[]) { int total_tasks = -1; int my_task = -1; start_pes(0); total_tasks = _num_pes(); if (total_tasks <= 0) { printf("FAILED\n"); exit(1); } else { printf("number of pes is %d\n", total_tasks); } if (total_tasks < 2 || total_tasks % 2) { printf("FAILED: The number of pes should be an even number. (at least 2)\n"); exit(1); } my_task = _my_pe(); if (my_task < 0){ printf("FAILED\n"); exit(1); } else { printf("my pe id is %d\n", my_task); } printf("The address of gIntArray is %p\n", gIntArray); // even tasks put value to odd tasks if (my_task%2 == 0) { int tgt_task = my_task + 1; //for int for (int i=0; i<GLOBAL_ARRAY_SIZE; i++) { gIntArray[i] = i; } printf("The Source Stride is: %d, the following data will be put.\n", SOURCE_STRIDE); for (int i=0; i<SOURCE_STRIDE*NUM_OF_TRANS_ELEM; i=i+SOURCE_STRIDE) { printf("array[%d] is: %d\n", i, gIntArray[i]); } shmem_int_iput(gIntArray, gIntArray, TARGET_STRIDE, SOURCE_STRIDE, NUM_OF_TRANS_ELEM, tgt_task); } shmem_barrier_all(); // odd tasks check value if (my_task%2 == 1) { //for int printf("The Targe Stride is: %d, the following data have been received.\n", TARGET_STRIDE); for (int i=0; i<TARGET_STRIDE*NUM_OF_TRANS_ELEM; i=i+TARGET_STRIDE) { printf("array[%d] is: %d\n", i, gIntArray[i]); } for (int i=0; i<TARGET_STRIDE*NUM_OF_TRANS_ELEM; i=i+TARGET_STRIDE) { if (gIntArray[i] != i*SOURCE_STRIDE/TARGET_STRIDE) { printf("FAILED, array[%d] should be %d instead of %d\n", i, i*SOURCE_STRIDE/TARGET_STRIDE, gIntArray[i]); exit(1); } } } shmem_barrier_all(); printf("PASSED\n"); return 0; }
Subroutines: shmem_barrier, shmem_put, shmem_fence, shmem_iput, shmem_quiet