zoukankan html css js c++ java

使用MPI进行分布式内存编程（2）

MPI的英文全称为message passing interface,中文名为消息传递接口，他不是一种新的语言，而是一个可以被C，C++，Fortran程序调用的库。

预备知识

1.编译与执行

使用类似此形式进行编译 mpicc -g -Wall -o mpi_hello mpi_hello.c 进行编译，mpicc为C语言的包装脚本(wrapper script)而非编译器(compilier)。

执行的话，可以使用 mpiexec -n <number of processers> ./mpi_hello 来执行，在一些超算平台，如天河二号上，也可以使用yhrun等命令运行

2.MPI Init and MPI Finalize

MPI_Init是告知MPI系统进行所有必要的初始化设置，如为消息缓冲区分配消息，为进程分配进程号等。

MPI_Finallize告知MPI系统已使用完毕，将MPI占用的资源释放。

一般的MPI程序框架如下：

. . .
#include <mpi.h>
. . .
int main(int argc, char argv[]) f
. . .
/* No MPI calls before this */
MPI Init(&argc, &argv);
. . .
MPI Finalize();
/* No MPI calls after this */
. . .
return 0;

｝

3.通信子，MPI_Comm_size和MPI_Comm_rank

通信子:一组可以相互发送消息的进程集合。

MPI_Comm_size：可以得到通信子的进程数

MPI_Comm_rank：可以得到通信子的进程号

4.MPI_Send和MPI_Recv

MPI_Send语法结构如下：

int MPI_Send(
void msg_buf_p /* in */,
int msg_size /* in */,
MPI Datatype_msg_type /* in */,
int dest /* in */,
int tag /* in */,
MPI_Comm_communicator /* in */);

msg_buf_p ---->指向包含消息内容的内存块的指针

msg_size ---->发生的数据量

Datatype_msg_type --->由于C语言之中的类型，如int，char等不能作为参数传递给函数。所以要使用这个参数作为媒介。

dest--->指定了需要接收信息的进程号

tag --->一个非负int类型数，用于区分看上去完全一样的信息。

MPI_Comm_communicator ---->通信子。


MPI_Recv语法结构如下：

int MPI_Recv(
void msg_buf_p /* out */,
int buf_size /* in */,
MPI_Datatype buf_type /* in */,
int source /* in */,
int tag /* in */,
MPI_Comm communicator /* in */,
MPI_Status status_p /* out */);

msg_buf_p--->指向内存块

buf_size --->指定了内存块之中要储存对象的数量

buf_type --->说明对象的类型

source ---> 指定接受的信息应该由哪个进程发送而来

tag --->一个非负int类型数，用于区分看上去完全一样的信息,需要与发送消息的参数tag相匹配

communicator --->通信子，需要与发送消息的参数communicator 相匹配

status_p ----> 大部分情况下不进行调用。

实例见https://www.cnblogs.com/caishunzhe/p/12935439.html

为了编写能够使用scanf的MPI程序，我们根据进程号来选取分钟。0号进程复制读取数据，并将数据发送给其他进程。程序如下
pro3.5.c

#include<stdio.h>
#include<string.h>
#include<mpi.h>

double f(double x)
{
    return x*x+x*x*x+5;
}
double Trap(double left_endpt,double right_endpt,int trap_count,double base_len)
{
    
    
    double estimate,x;
    int i;
    estimate=(f(left_endpt)+f(right_endpt))/2.0; //梯形面积
    for(i =1;i<=trap_count-1;++i)
    {
        x=left_endpt+i*base_len;
        estimate+=f(x);
    }
    estimate=estimate*base_len;
    return estimate;
}

void Get_input(
    int my_rank,
    int comm_sz,
    double* a_p,
    double* b_p,
    int* n_p
)
{    
    int dest;
    if(my_rank==0)
    {
        printf("Enter a,b,and n
");
        scanf("%lf %lf %d",a_p,b_p,n_p);
        for(dest=1;dest<comm_sz;++dest)
        {
            MPI_Send(a_p,1,MPI_DOUBLE,dest,0,MPI_COMM_WORLD);
            MPI_Send(b_p,1,MPI_DOUBLE,dest,0,MPI_COMM_WORLD);
            MPI_Send(n_p,1,MPI_INT,dest,0,MPI_COMM_WORLD);
        }
    }
    else //rank!=0;
    {
        MPI_Recv(a_p,1,MPI_DOUBLE,0,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE);
        MPI_Recv(b_p,1,MPI_DOUBLE,0,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE);
        MPI_Recv(n_p,1,MPI_INT,0,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE);
    }
}




int main()
{
    /*
    int my_rank,comm_sz,n=1024,local_n;
    double a=0.0,b=3.0,h,local_a,local_b;
    */
    int my_rank,comm_sz,n,local_n;
    double a,b,h,local_a,local_b;
    double local_int,total_int;
    int source;
    
    MPI_Init(NULL,NULL); //初始化
    MPI_Comm_size(MPI_COMM_WORLD,&comm_sz); //返回进程数
    MPI_Comm_rank(MPI_COMM_WORLD,&my_rank); //返回进程号
    
    //新加入的函数，处理输入问题
    Get_input(my_rank,comm_sz,&a,&b,&n);
    
    h=(b-a)/n;
    local_n=n/comm_sz;
    
    local_a=a+my_rank*local_n*h;
    local_b=local_a+local_n*h;
    local_int=Trap(local_a,local_b,local_n,h);
    
    if(my_rank!=0)
    {
        MPI_Send(&local_int,1,MPI_DOUBLE,0,0,MPI_COMM_WORLD);
    }
    else
    {
        total_int=local_int;
        for(source=1;source<comm_sz;source++)
        {
            MPI_Recv(&local_int,1,MPI_DOUBLE,source,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE); //接受其他节点信息
            total_int+=local_int;
        }
    }
    
    if(my_rank==0)
    {
        printf("With n=%d trapezoids,our estimated
",n);
        printf("of the intergral from %f to %f=%.15e
",a,b,total_int);
    }
    
    MPI_Finalize();
    return 0;
    
    
    
    
    
    
    
    
}

从0积分到50，划分的小间隔为100，1000,10000，理论上原函数为F(x)=1/3*x^3+1/4*x^4+5x ,积分值为F(50)-F(0)=1604416.6667

天河超算平台结果

可以看见，随着n的增大，划分的越来越细，结果越接近真实值。

实例上面是比较基本的实现，仔细分析之后发现其通信开销太大，0号进程需要负责所有进程的累加，如果又8个进程，那么就得加7次，随着进程的增长耗时线性增长
我们可以对其进行相应的改进，使用树型结构。
如下图的两种方法均可以，随进程数增长，时间为log（N）

我们选取第一种策略

#include<stdio.h>
#include<string.h>
#include<mpi.h>
/*只考虑最简单的2的幂次方情况*/

double f(double x)
{
    return x*x+x*x*x+5;
}
double Trap(double left_endpt,double right_endpt,int trap_count,double base_len)
{
    
    
    double estimate,x;
    int i;
    estimate=(f(left_endpt)+f(right_endpt))/2.0; //梯形面积
    for(i =1;i<=trap_count-1;++i)
    {
        x=left_endpt+i*base_len;
        estimate+=f(x);
    }
    estimate=estimate*base_len;
    return estimate;
}

void Get_input(
    int my_rank,
    int comm_sz,
    double* a_p,
    double* b_p,
    int* n_p
)
{    
    int dest;
    if(my_rank==0)
    {
        printf("Enter a,b,and n
");
        scanf("%lf %lf %d",a_p,b_p,n_p);
        for(dest=1;dest<comm_sz;++dest)
        {
            MPI_Send(a_p,1,MPI_DOUBLE,dest,0,MPI_COMM_WORLD);
            MPI_Send(b_p,1,MPI_DOUBLE,dest,0,MPI_COMM_WORLD);
            MPI_Send(n_p,1,MPI_INT,dest,0,MPI_COMM_WORLD);
        }
    }
    else //rank!=0;
    {
        MPI_Recv(a_p,1,MPI_DOUBLE,0,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE);
        MPI_Recv(b_p,1,MPI_DOUBLE,0,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE);
        MPI_Recv(n_p,1,MPI_INT,0,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE);
    }
}




int main()
{
    /*
    int my_rank,comm_sz,n=1024,local_n;
    double a=0.0,b=3.0,h,local_a,local_b;
    */
    //comm_sz-->进程数  my_rank--->进程号
    int my_rank,comm_sz,n,local_n;
    double a,b,h,local_a,local_b;
    double local_int,total_int;
    int source;
    int t;
    MPI_Init(NULL,NULL); //初始化
    MPI_Comm_size(MPI_COMM_WORLD,&comm_sz); //返回进程数
    MPI_Comm_rank(MPI_COMM_WORLD,&my_rank); //返回进程号
    
    //新加入的函数，处理输入问题
    Get_input(my_rank,comm_sz,&a,&b,&n);
    
    h=(b-a)/n;
    local_n=n/comm_sz;
    
    local_a=a+my_rank*local_n*h;
    local_b=local_a+local_n*h;
    local_int=Trap(local_a,local_b,local_n,h);
    /*
    if(my_rank!=0)
    {
        MPI_Send(&local_int,1,MPI_DOUBLE,0,0,MPI_COMM_WORLD);
    }
    else //my_rank=0
    {
        total_int=local_int;
        for(source=1;source<comm_sz;source++)
        {
            MPI_Recv(&local_int,1,MPI_DOUBLE,source,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE); //接受其他节点信息
            total_int+=local_int;
        }
    }
    */
    
    
    /*
    if(my_rank%2!=0)//奇数向小一位的偶数发送,然后退休
    {
        MPI_Send(&local_int,1,MPI_DOUBLE,my_rank-1,0,MPI_COMM_WORLD);
    }
    else //偶数先接受奇数还可能有进一步的行动
    {
        //接受奇数节点信息
        total_int=local_int;
        MPI_Recv(&local_int,1,MPI_DOUBLE,my_rank+1,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE); //接受其他节点信息
        total_int+=local_int;
        local_int=total_int;
        
        for(t=2;t<comm_sz;t<<1)
        {
            for(source=t;source<comm_sz;source+=2*t)
            {
                if(my_rank==source)
                    MPI_Send(&local_int,1,MPI_DOUBLE,my_rank-t,0,MPI_COMM_WORLD);
            }
            for(source=0;source<comm_sz;source+=2*t)
            {
                if(my_rank==source)
                {
                    total_int=local_int;
                    MPI_Recv(&local_int,1,MPI_DOUBLE,my_rank+t,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE); //接受其他节点信息
                    total_int+=local_int;
                    local_int=total_int;
                }
            }
        }
        
    }
    */
        for(t=1;t<comm_sz;t*=2)
        {
            for(source=t;source<comm_sz;source+=2*t)
            {
                if(my_rank==source)
                {
                    MPI_Send(&local_int,1,MPI_DOUBLE,my_rank-t,0,MPI_COMM_WORLD);
                    break;
                }
            }
            for(source=0;source<comm_sz;source+=2*t)
            {
                if(my_rank==source)
                {
                    total_int=local_int;
                    MPI_Recv(&local_int,1,MPI_DOUBLE,my_rank+t,0,MPI_COMM_WORLD,MPI_STATUS_IGNORE); //接受其他节点信息
                    total_int+=local_int;
                    local_int=total_int;
                    break;
                }
            }
        }
    
    
    
        
    
    
    if(my_rank==0)
    {
        printf("With n=%d trapezoids,our estimated
",n);
        printf("of the intergral from %f to %f=%.15e
",a,b,total_int);
        //printf("comm_sz=%d",comm_sz);
    }
    
    MPI_Finalize();
    return 0;
    
    
    
    
    
    
    
    
}

天河超算平台结果

查看全文

相关阅读:
Atitit.eclise的ide特性abt 编译
 Atitit python3.0 3.3 3.5 3.6 新特性 Python2.7新特性1Python 3_x 新特性1python3.4新特性1python3.5新特性1值得关注的新特性1Pyth
Atitit. Atiposter 发帖机新特性 poster new feature v7 q39
Atitit.eclipse 4.3 4.4 4.5 4.6新特性
 atitit.错误：找不到或无法加载主类的解决 v4 qa15.doc
Atitit RSA非对称加密原理与解决方案
 Atitti.数字证书体系cer pfx attilax总结
 Atitit ftp原理与解决方案
 Atitit qzone qq空间博客自动点赞与评论工具的设计与实现
 Atitit 软件国际化原理与概论

原文地址：https://www.cnblogs.com/caishunzhe/p/12958222.html