You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

io_remote.cpp 1.9 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051
  1. #include "./helper.h"
  2. #include "megbrain/comp_node_env.h"
  3. #include "megbrain/imperative/ops/autogen.h"
  4. #include "megbrain/opr/mm_handler.h"
  5. using namespace mgb;
  6. using namespace imperative;
  7. TEST(TestImperative, IORemote) {
  8. REQUIRE_GPU(2);
  9. const char* server_addr = "127.0.0.1";
  10. uint32_t port = 4567;
  11. mgb_assert(opr::create_zmqrpc_server(server_addr, port) > 0);
  12. HostTensorGenerator<> gen;
  13. CompNode cn0 = CompNode::load("gpu0"), cn1 = CompNode::load("gpu1");
  14. size_t vector_size = 233;
  15. auto host_x = gen({vector_size}, cn0), host_y = gen({vector_size}, cn1);
  16. auto expect = gen({vector_size});
  17. for (size_t i = 0; i < vector_size; ++i) {
  18. expect->ptr<float>()[i] = host_x->ptr<float>()[i];
  19. }
  20. auto run_send = [&](std::shared_ptr<HostTensorND> hnd) {
  21. auto def = imperative::RemoteSend::make(
  22. "io_remote_test", server_addr, port, 1, "nccl");
  23. auto inp = Tensor::make(*hnd);
  24. SmallVector<LogicalTensorDesc> output_descs;
  25. auto oup = OpDef::apply_on_physical_tensor(*def, {inp}, output_descs, false);
  26. };
  27. auto run_recv = [&](std::shared_ptr<HostTensorND> hnd) {
  28. auto def = imperative::RemoteRecv::make(
  29. "io_remote_test", server_addr, port, 0, CompNode::load("gpu1"),
  30. std::vector<int32_t>{(int32_t)vector_size}, dtype::Float32(), "nccl");
  31. auto inp = Tensor::make(*hnd);
  32. SmallVector<LogicalTensorDesc> output_descs;
  33. auto oup = OpDef::apply_on_physical_tensor(*def, {inp}, output_descs, false);
  34. HostTensorND host_v;
  35. host_v.copy_from(oup[0]->dev_tensor()).sync();
  36. MGB_ASSERT_TENSOR_NEAR(*expect, host_v, 1e-6);
  37. };
  38. std::thread t0(std::bind(run_send, host_x));
  39. std::thread t1(std::bind(run_recv, host_y));
  40. t0.join();
  41. t1.join();
  42. }
  43. // vim: syntax=cpp.doxygen foldmethod=marker foldmarker=f{{{,f}}}