⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 fetchandadd_tree.c

📁 fortran并行计算包
💻 C
字号:
/* -*- Mode: C; c-basic-offset:4 ; -*- */
/*
 *  (C) 2001 by Argonne National Laboratory.
 *      See COPYRIGHT in top-level directory.
 */
#include "mpi.h"
#include "stdio.h"
#include "stdlib.h"
#include "mpitest.h"

/* This is the tree-based scalable version of the fetch-and-add
   example from Using MPI-2, pg 206-207. The code in the book (Fig
   6.16) has bugs that are fixed below. */

#define NTIMES 20  /* no of times each process calls the counter
                      routine */

int localvalue = 0;  /* contribution of this process to the counter. We
                        define it as a global variable because attribute
                        caching on the window is not enabled yet. */

void Get_nextval_tree(MPI_Win win, int *get_array, MPI_Datatype get_type,
                      MPI_Datatype acc_type, int nlevels, int *value);
int compar(const void *a, const void *b);

/*
 * Allocate a zero-initialized array of `count` ints.
 *
 * On allocation failure a message is written to stderr and the whole job
 * is aborted with MPI_Abort, so callers never see a NULL result for a
 * positive count.  The caller owns the returned memory and must free() it.
 */
static int *alloc_ints(int count)
{
    int *p = calloc((size_t) count, sizeof *p);

    if (p == NULL && count > 0) {
        fprintf(stderr, "fetchandadd_tree: cannot allocate %d ints\n", count);
        MPI_Abort(MPI_COMM_WORLD, 1);
        exit(EXIT_FAILURE);     /* in case MPI_Abort returns */
    }
    return p;
}

/*
 * Test driver.
 *
 * Rank 0 exposes the counter tree (2 * pof2 ints, all zero) in an RMA
 * window and takes no part in the counting itself.  Every other rank calls
 * Get_nextval_tree NTIMES times and records the values it obtained.  The
 * values are then gathered on rank 0, sorted, and checked to be
 * consecutive integers; every gap or duplicate counts as one error.
 */
int main(int argc, char *argv[])
{
    int rank, nprocs, i, *counter_mem, *get_array, *get_idx, *acc_idx,
        mask, nlevels, level, idx, tmp_rank, pof2;
    MPI_Datatype get_type, acc_type;
    MPI_Win win;
    int errs = 0, *results, *counter_vals;

    MPI_Init(&argc, &argv);
    MPI_Comm_size(MPI_COMM_WORLD, &nprocs);
    MPI_Comm_rank(MPI_COMM_WORLD, &rank);

    if (rank == 0) {
        /* allocate counter memory and initialize to 0 */

        /* find the next power-of-two >= nprocs */
        pof2 = 1;
        while (pof2 < nprocs) {
            pof2 *= 2;
        }

        counter_mem = alloc_ints(pof2 * 2);
        MPI_Win_create(counter_mem, pof2 * 2 * sizeof(int), sizeof(int),
                       MPI_INFO_NULL, MPI_COMM_WORLD, &win);

        /* Rank 0 issues no RMA calls of its own.  MPI_Win_free is
           collective, so this call matches the MPI_Win_free the other
           ranks make once they have finished updating the counter. */
        MPI_Win_free(&win);
        free(counter_mem);

        /* gather the results from other processes, sort them, and check
           whether they represent a counter being incremented by 1 */
        results = alloc_ints(NTIMES * nprocs);
        for (i = 0; i < NTIMES * nprocs; i++) {
            results[i] = -1;
        }

        MPI_Gather(MPI_IN_PLACE, 0, MPI_DATATYPE_NULL, results, NTIMES,
                   MPI_INT, 0, MPI_COMM_WORLD);

        /* The first NTIMES slots belong to rank 0, which contributed
           nothing (they stay -1), so only the remainder is sorted and
           checked. */
        qsort(results + NTIMES, NTIMES * (nprocs - 1), sizeof(int), compar);

        for (i = NTIMES + 1; i < (NTIMES * nprocs); i++) {
            if (results[i] != results[i - 1] + 1) {
                errs++;
            }
        }

        free(results);
    }
    else {
        /* Get the largest power of two smaller than nprocs; nlevels is
           the number of tree levels walked below the root. */
        mask = 1;
        nlevels = 0;
        while (mask < nprocs) {
            mask <<= 1;
            nlevels++;
        }
        mask >>= 1;

        get_array = alloc_ints(nlevels);
        get_idx = alloc_ints(nlevels);
        acc_idx = alloc_ints(nlevels);

        /* Walk from the root towards this rank's leaf.  At each level the
           node on our own path goes into acc_idx (it will be incremented)
           and its sibling goes into get_idx (it will be read). */
        level = 0;
        idx = 0;
        tmp_rank = rank;
        while (mask >= 1) {
            if (tmp_rank < mask) {
                /* go to left for acc_idx, go to right for
                   get_idx. set idx=acc_idx for next iteration */
                acc_idx[level] = idx + 1;
                get_idx[level] = idx + mask * 2;
                idx = idx + 1;
            }
            else {
                /* go to right for acc_idx, go to left for
                   get_idx. set idx=acc_idx for next iteration */
                acc_idx[level] = idx + mask * 2;
                get_idx[level] = idx + 1;
                idx = idx + mask * 2;
            }
            level++;
            tmp_rank = tmp_rank % mask;
            mask >>= 1;
        }

        MPI_Type_create_indexed_block(nlevels, 1, get_idx, MPI_INT, &get_type);
        MPI_Type_create_indexed_block(nlevels, 1, acc_idx, MPI_INT, &acc_type);
        MPI_Type_commit(&get_type);
        MPI_Type_commit(&acc_type);

        /* allocate array to store the values obtained from the
           fetch-and-add counter */
        counter_vals = alloc_ints(NTIMES);

        /* Non-root ranks expose no memory of their own. */
        MPI_Win_create(NULL, 0, 1, MPI_INFO_NULL, MPI_COMM_WORLD, &win);

        for (i = 0; i < NTIMES; i++) {
            Get_nextval_tree(win, get_array, get_type, acc_type,
                             nlevels, counter_vals + i);
        }

        MPI_Win_free(&win);
        free(get_array);
        free(get_idx);
        free(acc_idx);
        MPI_Type_free(&get_type);
        MPI_Type_free(&acc_type);

        /* gather the results to the root */
        MPI_Gather(counter_vals, NTIMES, MPI_INT, NULL, 0, MPI_DATATYPE_NULL,
                   0, MPI_COMM_WORLD);
        free(counter_vals);
    }

    MTest_Finalize(errs);
    MPI_Finalize();
    return 0;
}

/*
 * Fetch the next counter value and increment the counter by one.
 *
 * Under an exclusive lock on rank 0's window, adds 1 to each of the
 * `nlevels` tree nodes selected by `acc_type` and reads the `nlevels`
 * nodes selected by `get_type` into `get_array`.
 *
 *   win        window whose target memory on rank 0 holds the counter tree
 *   get_array  caller-provided scratch buffer of at least nlevels ints
 *   get_type   committed datatype selecting the nodes to read
 *   acc_type   committed datatype selecting the nodes to increment
 *   nlevels    number of nodes selected by each datatype
 *   value      out: localvalue plus the sum of the fetched nodes
 *
 * Side effect: increments the global `localvalue`, this process's own
 * running contribution to the counter.
 */
void Get_nextval_tree(MPI_Win win, int *get_array, MPI_Datatype get_type,
                      MPI_Datatype acc_type, int nlevels, int *value)
{
    int *one, i;

    one = alloc_ints(nlevels);
    for (i = 0; i < nlevels; i++) {
        one[i] = 1;
    }

    MPI_Win_lock(MPI_LOCK_EXCLUSIVE, 0, 0, win);
    MPI_Accumulate(one, nlevels, MPI_INT, 0, 0, 1, acc_type,
                   MPI_SUM, win);
    MPI_Get(get_array, nlevels, MPI_INT, 0, 0, 1, get_type, win);
    MPI_Win_unlock(0, win);

    /* get_array is only read after the unlock call above has returned. */
    *value = localvalue;
    for (i = 0; i < nlevels; i++) {
        *value = *value + get_array[i];
    }

    localvalue++;

    free(one);
}

/*
 * qsort comparator for ints, ascending.
 *
 * Returns a negative, zero or positive value when *a is less than, equal
 * to or greater than *b.  Two comparisons are used instead of a
 * subtraction because `*a - *b` overflows (undefined behavior) when the
 * operands are far apart.
 */
int compar(const void *a, const void *b)
{
    const int lhs = *(const int *) a;
    const int rhs = *(const int *) b;

    return (lhs > rhs) - (lhs < rhs);
}

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -