【发布时间】:2022-01-22 04:02:21
【问题描述】:
我有一个 C++ 类,我打算从 python 的 mpi4py 接口调用它,这样每个节点都会生成该类。在 C++ 方面,我使用Open MPI 库(通过homebrew 安装)和pybind11。
C++类如下:
#include <pybind11/pybind11.h>
#include <iostream>
#include <chrono>
#include <thread>
#include <vector>
#include <mpi.h>
// #define PyMPI_HAVE_MPI_Message 1
// #include <mpi4py/mpi4py.h>
namespace py = pybind11;
class SomeComputation
{
float multiplier;
std::vector<int> test;
MPI_Comm comm_;
public:
void Init()
{
int rank;
MPI_Comm_rank(comm_, &rank);
test.clear();
test.resize(10, rank);
}
void set_comm(MPI_Comm comm){
this->comm_ = comm;
}
SomeComputation(float multiplier_) : multiplier(multiplier_){}
~SomeComputation() { std::cout << "Destructor Called!\n"; }
float compute(float input)
{
std::this_thread::sleep_for(std::chrono::milliseconds((int)input * 10));
for (int i = 0; i != 10; ++i)
{
std::cout << test[i] << " ";
}
std::cout << std::endl;
return multiplier * input;
}
};
PYBIND11_MODULE(module_name, handle)
{
py::class_<SomeComputation>(handle, "Cpp_computation")
.def(py::init<float>()) // args of constructers are template args
.def("set_comm", &SomeComputation::set_comm)
.def("compute", &SomeComputation::compute)
.def("cpp_init", &SomeComputation::Init);
}
这是生成相同 C++ 的 python 接口:
from build.module_name import *
import time
from mpi4py import MPI
comm = MPI.COMM_WORLD
rank = comm.Get_rank()
m = Cpp_computation(44.0) # send communicator to cpp
m.cpp_init()
i = 0
while i < 5:
print(m.compute(i))
time.sleep(1)
i+=1
我已经尝试过“Sharing an MPI communicator using pybind11”,但我遇到了一个长期无益的错误 (full message):
[...]
/Users/purusharth/Documents/hiwi/pympicontroller/pybind11/include/pybind11/pybind11.h:1398:22: required from 'pybind11::class_<type_, options>& pybind11::class_<type_, options>::def(const char*, Func&&, const Extra& ...) [with Func = void (SomeComputation::*)(ompi_communicator_t*); Extra = {}; type_ = SomeComputation; options = {}]'
/Users/purusharth/Documents/hiwi/pympicontroller/main.cpp:79:7: required from here
/opt/homebrew/Cellar/gcc/11.2.0_3/include/c++/11/type_traits:1372:38: error: invalid use of incomplete type 'struct ompi_communicator_t'
1372 | : public integral_constant<bool, __is_base_of(_Base, _Derived)>
| ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~
In file included from /Users/purusharth/Documents/hiwi/pympicontroller/main.cpp:6:
/opt/homebrew/Cellar/open-mpi/4.1.2/include/mpi.h:419:16: note: forward declaration of 'struct ompi_communicator_t'
419 | typedef struct ompi_communicator_t *MPI_Comm;
| ^~~~~~~~~~~~~~~~~~~
[...]
/Users/purusharth/Documents/hiwi/pympicontroller/pybind11/include/pybind11/pybind11.h:1398:22: required from 'pybind11::class_<type_, options>& pybind11::class_<type_, options>::def(const char*, Func&&, const Extra& ...) [with Func = void (SomeComputation::*)(ompi_communicator_t*); Extra = {}; type_ = SomeComputation; options = {}]'
/Users/purusharth/Documents/hiwi/pympicontroller/main.cpp:79:7: required from here
/Users/purusharth/Documents/hiwi/pympicontroller/pybind11/include/pybind11/detail/descr.h:40:19: error: invalid use of incomplete type 'struct ompi_communicator_t'
40 | return {{&typeid(Ts)..., nullptr}};
| ^~~~~~~~~~
In file included from /Users/purusharth/Documents/hiwi/pympicontroller/main.cpp:6:
/opt/homebrew/Cellar/open-mpi/4.1.2/include/mpi.h:419:16: note: forward declaration of 'struct ompi_communicator_t'
419 | typedef struct ompi_communicator_t *MPI_Comm;
| ^~~~~~~~~~~~~~~~~~~
[...]
from /Users/purusharth/Documents/hiwi/pympicontroller/main.cpp:1:
/Users/purusharth/Documents/hiwi/pympicontroller/pybind11/include/pybind11/detail/descr.h:40:42: error: could not convert '{{<expression error>, nullptr}}' from '<brace-enclosed initializer list>' to 'std::array<const std::type_info*, 3>'
40 | return {{&typeid(Ts)..., nullptr}};
| ^
| |
| <brace-enclosed initializer list>
[...]
In file included from /Users/purusharth/Documents/hiwi/pympicontroller/main.cpp:1:
/Users/purusharth/Documents/hiwi/pympicontroller/pybind11/include/pybind11/pybind11.h: In instantiation of 'void pybind11::cpp_function::initialize(Func&&, Return (*)(Args ...), const Extra& ...) [with Func = pybind11::cpp_function::cpp_function<void, SomeComputation, ompi_communicator_t*, pybind11::name, pybind11::is_method, pybind11::sibling>(void (SomeComputation::*)(ompi_communicator_t*), const pybind11::name&, const pybind11::is_method&, const pybind11::sibling&)::<lambda(SomeComputation*, ompi_communicator_t*)>; Return = void; Args = {SomeComputation*, ompi_communicator_t*}; Extra = {pybind11::name, pybind11::is_method, pybind11::sibling}]':
[..]
/Users/purusharth/Documents/hiwi/pympicontroller/pybind11/include/pybind11/pybind11.h:1398:22: required from 'pybind11::class_<type_, options>& pybind11::class_<type_, options>::def(const char*, Func&&, const Extra& ...) [with Func = void (SomeComputation::*)(ompi_communicator_t*); Extra = {}; type_ = SomeComputation; options = {}]'
/Users/purusharth/Documents/hiwi/pympicontroller/main.cpp:79:7: required from here
/Users/purusharth/Documents/hiwi/pympicontroller/pybind11/include/pybind11/pybind11.h:266:73: in 'constexpr' expansion of 'pybind11::detail::descr<18, SomeComputation, ompi_communicator_t>::types()'
/Users/purusharth/Documents/hiwi/pympicontroller/pybind11/include/pybind11/pybind11.h:266:39: error: 'constexpr' call flows off the end of the function
266 | PYBIND11_DESCR_CONSTEXPR auto types = decltype(signature)::types();
| ^~~~~
错误指向.def("set_comm", &SomeComputation::set_comm)
这些错误的原因是什么,应该如何解决?
更新:如this answer 中所述,使用自定义类型施法器在下面添加了答案。但这是唯一的方法吗?
【问题讨论】:
-
据我所知,MPI_comm 只是被声明而没有被定义,所以你应该把它保存在 (
MPI_comm* comm_;) 而不是直接用值。见stackoverflow.com/questions/8972588/… -
当然,这可能不是真正的问题。在这种情况下,您可以尝试发布完整的 main.cpp 吗?错误引用第 79 行,但您的代码比这短。
-
您是否可能没有从 MPI 导入所有必需的标头?有几个错误引用了一个不完整的类型,因此您可能缺少一个“完成”类型定义所需的包含。
-
所有信息都应添加到问题中(如site guidelines 和sample code guidelines 中所述),而不仅仅是linked to。一方面,外部页面消失了(关于 SO 有很多问题,OP 没想到会发生这种情况,但确实发生了)。在长错误的情况下(例如 C++ 编译输出),可以发布核心错误消息,并带有用于完整输出的链接。
-
(如果不确定如何编辑长错误消息,可以在聊天中请求帮助,只需要 20 个代表,或者可以对同一点发表评论。)