python - 用 mpi4py 替换 multiprocessing pool.map-6ren

python - 用 mpi4py 替换 multiprocessing pool.map

转载作者：行者123 更新时间：2023-12-04 13:24:45

我是 MPI 的初学者，目前还在阅读文档。然而，关于 mpi4py 的可参考资料少之又少。我编写的代码目前使用 multiprocessing 模块在多个内核上运行，但我需要用 mpi4py 替换它，以便可以在多个节点上运行代码。我的代码如下，分别给出了使用 multiprocessing 模块的版本和不使用它的版本。

使用 multiprocessing 的版本：

import multiprocessing
import random
import time

import numpy as np


# Wall-clock reference for the elapsed-time report printed at the end of the script.
start_time = time.time()

# Parameters forwarded to CDF_inv as (e, m).
E, M = 0.1, 5
# Number of points drawn for the distribution.
n = 1000
# Only used through the factor 4 * G / c**2 applied to the summed alpha values.
G, c = 1, 1
# Scale factors applied to the x and y coordinates of every generated point.
stretch = [10, 1]


#Point-Distribution Generator Function 
def CDF_inv(x, e, m):
    """Map a sample ``x`` in [0, 1] to a value in [0, m] (piecewise inverse CDF).

    With ``A = 1 / (1 + ln(m / e))`` the mapping is linear,
    ``e * x / A``, for ``0 <= x <= A`` and exponential,
    ``e * exp(x / A - 1)``, for ``A < x < 1``; ``x == 1`` returns ``m``.

    Args:
        x: Scalar sample in the closed interval [0, 1].
        e: Value reached at the end of the linear piece (``x == A``).
        m: Value returned for ``x == 1``.

    Returns:
        The mapped value.

    Raises:
        ValueError: If ``x`` lies outside [0, 1]. The previous version fell
            through every branch and silently returned ``None``.
    """
    if not 0 <= x <= 1:
        raise ValueError("x must lie in [0, 1], got %r" % (x,))
    # float() keeps m / e a true division under Python 2 when both are ints.
    A = 1 / (1 + np.log(float(m) / e))
    if x == 1:
        return m
    if x <= A:
        return e * x / A
    return e * np.exp((x / A) - 1)

#Elliptical point distribution Generator Function

def get_coor_ellip(dist=CDF_inv, params=[E, M], stretch=stretch):
    """Draw one random point and scale its x and y components independently.

    A radius is obtained by passing a uniform random number to ``dist``
    (called as ``dist(u, *params)``), and an angle is drawn uniformly from
    [0, 2*pi). The polar point is converted to Cartesian coordinates whose
    x part is multiplied by ``stretch[0]`` and y part by ``stretch[1]``.

    Args:
        dist: Callable mapping a uniform sample (plus ``params``) to a radius.
        params: Extra positional arguments forwarded to ``dist``.
        stretch: Two-element sequence of scale factors for x and y.

    Returns:
        Tuple ``(x, y)`` of the scaled coordinates.
    """
    # Radius first, angle second: this keeps the order of the random draws.
    radius = dist(random.random(), *params)
    angle = random.random() * 2 * np.pi
    x_coord = radius * np.cos(angle) * stretch[0]
    y_coord = radius * np.sin(angle) * stretch[1]
    return (x_coord, y_coord)


def get_dist_sq(x_array, y_array):
    """Return the squared Euclidean norm ``x**2 + y**2``, element-wise for arrays."""
    x_squared = x_array ** 2
    y_squared = y_array ** 2
    return x_squared + y_squared


#Function to obtain alpha

def get_alpha(args):
    """Accumulate the alpha contributions of one chunk of points.

    Args:
        args: Tuple ``(zeta_list_part, M_list_part, X, Y)``, packed into a
            single argument so the function can be handed to ``pool.map``.
            ``zeta_list_part[k]`` is the (x, y) position that belongs to the
            weight ``M_list_part[k]``; ``X`` and ``Y`` are the coordinates at
            which alpha is evaluated (presumably meshgrid arrays; confirm
            against the caller).

    Returns:
        Tuple ``(alpha_x, alpha_y)``. Each component is the sum over the
        chunk of ``M_k * d / |d|**2``, where ``d`` is the x (or y) offset of
        the evaluation coordinates from point ``k``.
    """
    zeta_list_part, M_list_part, X, Y = args
    alpha_x = alpha_y = 0
    for key, weight in enumerate(M_list_part):
        source = zeta_list_part[key]
        offset_x = X - source[0]
        offset_y = Y - source[1]
        r_squared = get_dist_sq(offset_x, offset_y)
        alpha_x += weight * offset_x / r_squared
        alpha_y += weight * offset_y / r_squared
    return (alpha_x, alpha_y)

#The part of the process containing the loop that needs to be parallelised, where I use pool.map()

if __name__ == '__main__':
    # Number of worker processes; the input is split into this many chunks.
    num_processes = 10
    pool = multiprocessing.Pool(processes=num_processes)
    try:
        # NOTE(review): random_sample is never read afterwards; kept as in
        # the original script.
        random_sample = [CDF_inv(x, E, M)
                         for x in [random.random() for e in range(n)]]
        # Draw n points and store them as an (n, 2) array of x/y columns.
        zeta_list = [get_coor_ellip() for e in range(n)]
        x1, y1 = zip(*zeta_list)
        zeta_list = np.column_stack((np.array(x1), np.array(y1)))
        # Evaluation grid: 100 x 100 samples over [-3, 3] on both axes.
        x = np.linspace(-3, 3, 100)
        y = np.linspace(-3, 3, 100)
        X, Y = np.meshgrid(x, y)
        # Single %-formatted argument: same output on Python 2 and 3.
        print("%d calculations to be carried out." % (len(x) * len(y) * n))
        M_list = np.array([.001 for i in range(n)])
        # Split the points and their weights into one chunk per worker; every
        # worker gets the full X and Y grids.
        zeta_list_split = np.array_split(zeta_list, num_processes, axis=0)
        M_list_split = np.array_split(M_list, num_processes)
        X_list = [X for e in range(num_processes)]
        Y_list = [Y for e in range(num_processes)]

        alpha_list = pool.map(
                get_alpha, zip(zeta_list_split, M_list_split, X_list, Y_list))
    finally:
        # Release the worker processes even if setup or the map call fails.
        pool.close()
        pool.join()

    # Combine the per-chunk partial sums, applying the factor 4 * G / c**2.
    alpha_x = 0
    alpha_y = 0
    for e in alpha_list:
        alpha_x += e[0] * 4 * G / (c**2)
        alpha_y += e[1] * 4 * G / (c**2)

print("%f seconds" % (time.time() - start_time))

不使用 multiprocessing 的版本：

import numpy as np


# Parameters forwarded to CDF_inv as (e, m).
E = 0.1
M = 5
# Only used through the factor 4 * G / c**2 applied to alpha at the end.
G = 1
c = 1
# n has to exist before M_list is built; the script defined it only further
# down, so the next line raised NameError.
n = 1000
# One weight per generated point.
M_list = [.1 for i in range(n)]

#Point-Distribution Generator Function 

def CDF_inv(x, e, m):
    """Map a sample ``x`` in [0, 1] to a value in [0, m] (piecewise inverse CDF).

    With ``A = 1 / (1 + ln(m / e))`` the mapping is linear,
    ``e * x / A``, for ``0 <= x <= A`` and exponential,
    ``e * exp(x / A - 1)``, for ``A < x < 1``; ``x == 1`` returns ``m``.

    Args:
        x: Scalar sample in the closed interval [0, 1].
        e: Value reached at the end of the linear piece (``x == A``).
        m: Value returned for ``x == 1``.

    Returns:
        The mapped value.

    Raises:
        ValueError: If ``x`` lies outside [0, 1]. The previous version fell
            through every branch and silently returned ``None``.
    """
    if not 0 <= x <= 1:
        raise ValueError("x must lie in [0, 1], got %r" % (x,))
    # float() keeps m / e a true division under Python 2 when both are ints.
    A = 1 / (1 + np.log(float(m) / e))
    if x == 1:
        return m
    if x <= A:
        return e * x / A
    return e * np.exp((x / A) - 1)



# random is used right below and inside get_coor_ellip, but this script never
# imported it.
import random

# Number of points drawn for the distribution.
n = 1000
# NOTE(review): random_sample is not read anywhere else in this script.
random_sample = [CDF_inv(x, E, M)
                 for x in [random.random() for e in range(n)]]
# Scale factors applied to the x and y coordinates of every generated point.
stretch = [5, 2]

#Elliptical point distribution Generator Function

def get_coor_ellip(dist=CDF_inv, params=[E, M], stretch=stretch):
    """Draw one random point and scale its x and y components independently.

    A radius is obtained by passing a uniform random number to ``dist``
    (called as ``dist(u, *params)``), and an angle is drawn uniformly from
    [0, 2*pi). The polar point is converted to Cartesian coordinates whose
    x part is multiplied by ``stretch[0]`` and y part by ``stretch[1]``.

    Args:
        dist: Callable mapping a uniform sample (plus ``params``) to a radius.
        params: Extra positional arguments forwarded to ``dist``.
        stretch: Two-element sequence of scale factors for x and y.

    Returns:
        Tuple ``(x, y)`` of the scaled coordinates.
    """
    # Radius first, angle second: this keeps the order of the random draws.
    radius = dist(random.random(), *params)
    angle = random.random() * 2 * np.pi
    x_coord = radius * np.cos(angle) * stretch[0]
    y_coord = radius * np.sin(angle) * stretch[1]
    return (x_coord, y_coord)

#zeta_list is the list of coordinates of a distribution of points
# Draw n points and transpose the list of (x, y) pairs into two tuples.
x1, y1 = zip(*[get_coor_ellip() for e in range(n)])
# Re-assemble them as an (n, 2) array: column 0 holds x, column 1 holds y.
zeta_list = np.column_stack((np.array(x1), np.array(y1)))

# Evaluation grid: 100 x 100 samples covering [-3, 3] along both axes.
x, y = np.linspace(-3, 3, 100), np.linspace(-3, 3, 100)
X, Y = np.meshgrid(x, y)

def get_dist_sq(x_array, y_array):
    """Return the squared Euclidean norm ``x**2 + y**2``, element-wise for arrays."""
    x_squared = x_array ** 2
    y_squared = y_array ** 2
    return x_squared + y_squared


#Calculation of alpha, containing the loop that needs to be parallelised.

# Sum the contribution of every point to alpha over the whole grid.
alpha_x = 0
alpha_y = 0
for key, weight in enumerate(M_list):
    z_m_z_x = X - zeta_list[key][0]
    z_m_z_y = Y - zeta_list[key][1]
    dist_z_m_z = get_dist_sq(z_m_z_x, z_m_z_y)
    alpha_x += weight * z_m_z_x / dist_z_m_z
    alpha_y += weight * z_m_z_y / dist_z_m_z
# The 4.0 literal forces true division: with integer G and c, Python 2 would
# otherwise truncate 4 * G / c**2 before it is applied.
scale = 4.0 * G / (c ** 2)
alpha_x *= scale
alpha_y *= scale

基本上，我的代码首先生成一个遵循特定分布的点列表，然后应用一个基于各点之间距离关系的方程来得到物理量“alpha”。需要并行化的部分是计算 alpha 的那个 for 循环。我想用 mpi4py 而不是 multiprocessing 来实现这一点，但不确定该如何着手。

最佳答案

可以使用 scatter/gather 将 multiprocessing 的 pool.map 版本转换为 MPI 版本。在您的代码中，输入列表已经按每个 rank 一个数据块的方式准备好了，这很有帮助。主要区别在于，所有代码默认会被所有 rank 执行，因此必须把只应由主进程 rank 0 完成的工作放进条件判断中。

if __name__ == '__main__':
    # NOTE: MPI must be in scope (``from mpi4py import MPI``); the import is
    # not shown in this snippet.
    comm = MPI.COMM_WORLD
    if comm.rank == 0:
        # Only rank 0 generates the input and prepares one chunk per rank.
        # NOTE(review): random_sample is never read afterwards; kept as in
        # the original script.
        random_sample = [CDF_inv(x, E, M)
                         for x in [random.random() for e in range(n)]]
        zeta_list = [get_coor_ellip() for e in range(n)]
        x1, y1 = zip(*zeta_list)
        zeta_list = np.column_stack((np.array(x1), np.array(y1)))
        x = np.linspace(-3, 3, 100)
        y = np.linspace(-3, 3, 100)
        X, Y = np.meshgrid(x, y)
        # Single %-formatted argument: same output on Python 2 and 3.
        print("%d calculations to be carried out." % (len(x) * len(y) * n))
        M_list = np.array([.001 for i in range(n)])
        # Split the points and weights into comm.size chunks; every rank gets
        # the full X and Y grids.
        zeta_list_split = np.array_split(zeta_list, comm.size, axis=0)
        M_list_split = np.array_split(M_list, comm.size)
        X_list = [X for e in range(comm.size)]
        Y_list = [Y for e in range(comm.size)]
        work_list = list(zip(zeta_list_split, M_list_split, X_list, Y_list))
    else:
        # Non-root ranks contribute nothing to the scatter.
        work_list = None

    # Every rank (root included) receives one work item and processes it.
    my_work = comm.scatter(work_list, root=0)
    my_alpha = get_alpha(my_work)

    # Collect the partial results on rank 0; other ranks receive None.
    alpha_list = comm.gather(my_alpha, root=0)
    if comm.rank == 0:
        alpha_x = 0
        alpha_y = 0
        for e in alpha_list:
            alpha_x += e[0] * 4 * G / (c**2)
            alpha_y += e[1] * 4 * G / (c**2)

只要每个处理器获得相似的工作量，这种方法就可以正常工作。如果通信成为问题，您可能希望在处理器之间拆分数据生成，而不是全部在 master rank 0 上完成。

注意：代码中有些地方存在问题，例如 alpha_[xy] 最终会变成 np.ndarray；串行版本运行时会出错。

关于python - 用 mpi4py 替换 multiprocessing pool.map，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/43046037/

文章推荐： ethereum - 为什么两个 Uni V3 池有不同的字节码？

文章推荐： wcf - 不支持协议(protocol) 'net.tcp'

文章推荐： tfs - 我们可以迁移到新的TFS流程模板并保留历史记录吗？

python - manage.py 在同一文件夹中继续使用 django 的空白 settings.py 而不是 settings.py manage.py 位于
我使用的是 Windows 8.1 和 Python 2.7，我在特定文件路径中设置了所有文件(希望正确)，但每当我运行 python manage.py runserver 时，我都会收到此错误。
python - 如何为基本包设置配置 __main__.py、__init__.py 和 __setup__.py？
背景: 我有一个像这样的目录结构: Package/ setup.py src/ __init__.py __main__.py cod
pytest - py.test 给出 Coverage.py 警告 : Module sample. py 从未导入
我从这个线程运行了一个示例代码。 How to properly use coverage.py in Python? 但是，当我执行此命令时 py.test test.py --cov=sample
ipython - 为什么 `ipython foo.py bar.py` 只打印 `foo.py` 的输出？
IPython 0.13.1 文档说: $ ipython -h ... Usage ipython [subcommand] [options] [files] If invoked
python - 当我们需要使用 sudo python xxx.py 或只是 python xxx.py 或 xxx.py
我写了一个网站，让我困惑的是当我运行这个网站时，首先我需要启动应用程序，所以有 3 种方法: sudo python xxx.py python xxx.py xxx.py 每一个我都不清楚怎么用，目
Python:从 day_one.py 导入一个文件到 main.py，然后在 day_one 中我从 main.py 导入一个函数。错误无法导入
我不确定为什么它不起作用，这可能是一个您无法解决的问题，但我只是想知道为什么它不起作用。如果我浪费了您的时间，或者没有正确地提出问题，我很抱歉，我 16 岁，对 Python 还算陌生。在main.
Django 模型管理器.py 和模型.py
鉴于以下情况:models.py from .managers import PersonManager from django.db import models class Person(model
web.py - web.py 处理程序类的参数
有没有办法将参数传递给 web.py 处理程序类构造函数？例如。这些参数可能来自命令行(当主 web.py 脚本运行时)，在第一个参数(作为端口号)之后最佳答案当然，这取决于你的意思。毕竟都是p
manage.py - manage.py 文件究竟做了什么
我对 python/django 编程很陌生，因为我没有编程背景。我正在在线上课，我只想确切地知道 manage.py 文件的作用。我试过用谷歌搜索它，但除了在 django-admin.py 周围放
python - 如何使用 models.py 、 serializers.py 和 views.py 将解析的 json 数组值保存到 django python Rest api 中的数据库
我想将类别及其子类别保存到数据库中，这里每个类别都有多个子类别。您能帮我保存与类别相对应的用户、类别和多个子类别吗？Models.py、Serializers.py、Views .py 并附加传入请求
discord.py - 如何在 discord.py 中使用高级命令处理
所以我的机器人开始有很多命令，并且在 main.py 上变得有点困惑。我知道有一种方法可以将命令存储在其他文件中，然后在 discord.js 上触发它们时将它们应用于 main.py。在 disco
discord.py - 如何让我的 discord.py 机器人计算某个人发送的消息数量？
我正在尝试制作一个类似于 mee6 的 Discord 机器人，因为它会按特定时间间隔计算用户在我的 Discord 服务器中发送的消息。我已经在网上搜索过，但即使有类似的问题也找不到我要找的东西。例
discord.py - 有没有办法在 discord.py 中创建线程？
我正在尝试制作一个机器人，它根据特定 channel 中的消息创建线程。如果有在 discord.py 中的文本 channel 中创建线程的方法，请告诉我。最佳答案是的，但有一个问题。当前版本
discord.py - 分页 - Discord.py 重写
我一直在尝试制作一个命令来显示一些信息，然后当我对表情使用react时，它应该会显示另一组信息。我尝试使用 this 的部分内容，特别是第 335 到 393 行的部分让它工作。但是，它什么也不做。
discord.py - 当有人提到它时，我如何让机器人做出回应？不和谐.py
这是我试过的代码: @client.event async def on_message(message): if client.user.mention in message.content
discord.py - 用 discord.py 重写的数字猜谜游戏
我试过这段代码，机器人说猜但没有回应我的猜测。 @commands.command() async def game(self, ctx): number = random.randint(0
discord.py - 如何检查机器人是否连接到 channel ？ |不和谐.py
我决定尝试让我的不和谐机器人播放音乐，但我已经卡住了。主要是因为我找不到任何资源来帮助当前版本，我一直在从文档中获取所有内容。但是，我不知道如何检查机器人是否已连接到语音 channel 。我试过
python - 执行 .py 文件也会运行另一个 .py 文件
我在一个目录中有三个文件: # Untitled-1.py print("UTITLEDPY") if __name__== "__main__": from telegram.ext imp
python - 在 .py 文件内使用 .py 文件
我对 python 相当陌生，并且一直只使用 Jupyter Notebooks。当我需要运行我已保存在计算机中某处的 .py 文件时，我通常所做的就是使用魔术命令 %run %run '/home/
python - manage.py 和 other.py 文件不在同级文件中
我有 Django 1.4 和 Python 2.6.6当我使用“django-amdin.py startproject djproject”时，请按照网页中的步骤操作 https://www.ib

行者123

个人简介

我是一名优秀的程序员,十分优秀！

作者热门文章

滴滴打车优惠券免费领取

全站热门文章

首页

博学

6Ren·AI

商城

python - 用 mpi4py 替换 multiprocessing pool.map