Files
dgl/tests/cpp/test_zerocopy_serialize.cc
Hongzhi (Steve), Chen 33a2d9e1b6 [Misc] clang-format auto fix. (#4812)
* [Misc] clang-format auto fix.

* manual

Co-authored-by: Steve <ubuntu@ip-172-31-34-29.ap-northeast-1.compute.internal>
2022-11-04 14:24:20 +08:00

167 lines
5.1 KiB
C++

#include <dgl/array.h>
#include <dgl/immutable_graph.h>
#include <dgl/zerocopy_serializer.h>
#include <dmlc/memory_io.h>
#include <gtest/gtest.h>
#include <algorithm>
#include <iostream>
#include <vector>
#include "../../src/graph/heterograph.h"
#include "../../src/graph/unit_graph.h"
#include "./common.h"
#ifndef _WIN32
using namespace dgl;
using namespace dgl::aten;
using namespace dmlc;
// Function to convert an idarray to string
std::string IdArrayToStr(IdArray arr) {
arr = arr.CopyTo(DGLContext{kDGLCPU, 0});
int64_t len = arr->shape[0];
std::ostringstream oss;
oss << "(" << len << ")[";
if (arr->dtype.bits == 32) {
int32_t *data = static_cast<int32_t *>(arr->data);
for (int64_t i = 0; i < len; ++i) {
oss << data[i] << " ";
}
} else {
int64_t *data = static_cast<int64_t *>(arr->data);
for (int64_t i = 0; i < len; ++i) {
oss << data[i] << " ";
}
}
oss << "]";
return oss.str();
}
TEST(ZeroCopySerialize, NDArray) {
auto tensor1 = VecToIdArray<int64_t>({1, 2, 5, 3});
auto tensor2 = VecToIdArray<int64_t>({6, 6, 5, 7});
std::string nonzerocopy_blob;
dmlc::MemoryStringStream ifs(&nonzerocopy_blob);
static_cast<dmlc::Stream *>(&ifs)->Write(tensor1);
static_cast<dmlc::Stream *>(&ifs)->Write(tensor2);
std::string zerocopy_blob;
StreamWithBuffer zc_write_strm(&zerocopy_blob, true);
zc_write_strm.Write(tensor1);
zc_write_strm.Write(tensor2);
EXPECT_EQ(nonzerocopy_blob.size() - zerocopy_blob.size(), 126)
<< "Invalid save";
std::vector<void *> new_ptr_list;
// Use memcpy to mimic remote machine reconstruction
for (auto ptr : zc_write_strm.buffer_list()) {
auto new_ptr = malloc(ptr.size);
memcpy(new_ptr, ptr.data, ptr.size);
new_ptr_list.emplace_back(new_ptr);
}
NDArray loadtensor1, loadtensor2;
StreamWithBuffer zc_read_strm(&zerocopy_blob, new_ptr_list);
zc_read_strm.Read(&loadtensor1);
zc_read_strm.Read(&loadtensor2);
}
TEST(ZeroCopySerialize, ZeroShapeNDArray) {
auto tensor1 = VecToIdArray<int64_t>({6, 6, 5, 7});
auto tensor2 = VecToIdArray<int64_t>({});
auto tensor3 = VecToIdArray<int64_t>({6, 6, 2, 7});
std::vector<NDArray> ndvec;
ndvec.push_back(tensor1);
ndvec.push_back(tensor2);
ndvec.push_back(tensor3);
std::string zerocopy_blob;
StreamWithBuffer zc_write_strm(&zerocopy_blob, true);
zc_write_strm.Write(ndvec);
std::vector<void *> new_ptr_list;
// Use memcpy to mimic remote machine reconstruction
for (auto ptr : zc_write_strm.buffer_list()) {
auto new_ptr = malloc(ptr.size);
memcpy(new_ptr, ptr.data, ptr.size);
new_ptr_list.emplace_back(new_ptr);
}
std::vector<NDArray> ndvec_read;
StreamWithBuffer zc_read_strm(&zerocopy_blob, new_ptr_list);
zc_read_strm.Read(&ndvec_read);
EXPECT_EQ(ndvec_read[1]->ndim, 1);
EXPECT_EQ(ndvec_read[1]->shape[0], 0);
}
TEST(ZeroCopySerialize, SharedMem) {
auto tensor1 = VecToIdArray<int64_t>({1, 2, 5, 3});
DGLDataType dtype = {kDGLInt, 64, 1};
std::vector<int64_t> shape{4};
DGLContext cpu_ctx = {kDGLCPU, 0};
auto shared_tensor =
NDArray::EmptyShared("test", shape, dtype, cpu_ctx, true);
shared_tensor.CopyFrom(tensor1);
std::string nonzerocopy_blob;
dmlc::MemoryStringStream ifs(&nonzerocopy_blob);
static_cast<dmlc::Stream *>(&ifs)->Write(shared_tensor);
std::string zerocopy_blob;
StreamWithBuffer zc_write_strm(&zerocopy_blob, false);
zc_write_strm.Write(shared_tensor);
EXPECT_EQ(nonzerocopy_blob.size() - zerocopy_blob.size(), 51)
<< "Invalid save";
NDArray loadtensor1;
StreamWithBuffer zc_read_strm = StreamWithBuffer(&zerocopy_blob, false);
zc_read_strm.Read(&loadtensor1);
}
TEST(ZeroCopySerialize, HeteroGraph) {
auto src = VecToIdArray<int64_t>({1, 2, 5, 3});
auto dst = VecToIdArray<int64_t>({1, 6, 2, 6});
auto mg1 = dgl::UnitGraph::CreateFromCOO(2, 9, 8, src, dst);
src = VecToIdArray<int64_t>({6, 2, 5, 1, 8});
dst = VecToIdArray<int64_t>({5, 2, 4, 8, 0});
auto mg2 = dgl::UnitGraph::CreateFromCOO(1, 9, 9, src, dst);
std::vector<HeteroGraphPtr> relgraphs;
relgraphs.push_back(mg1);
relgraphs.push_back(mg2);
src = VecToIdArray<int64_t>({0, 0});
dst = VecToIdArray<int64_t>({1, 0});
auto meta_gptr = ImmutableGraph::CreateFromCOO(3, src, dst);
auto hrptr = std::make_shared<HeteroGraph>(meta_gptr, relgraphs);
std::string nonzerocopy_blob;
dmlc::MemoryStringStream ifs(&nonzerocopy_blob);
static_cast<dmlc::Stream *>(&ifs)->Write(hrptr);
std::string zerocopy_blob;
StreamWithBuffer zc_write_strm(&zerocopy_blob, true);
zc_write_strm.Write(hrptr);
EXPECT_EQ(nonzerocopy_blob.size() - zerocopy_blob.size(), 745)
<< "Invalid save";
std::vector<void *> new_ptr_list;
// Use memcpy to mimic remote machine reconstruction
for (auto ptr : zc_write_strm.buffer_list()) {
auto new_ptr = malloc(ptr.size);
memcpy(new_ptr, ptr.data, ptr.size);
new_ptr_list.emplace_back(new_ptr);
}
auto gptr = dgl::Serializer::make_shared<HeteroGraph>();
StreamWithBuffer zc_read_strm(&zerocopy_blob, new_ptr_list);
zc_read_strm.Read(&gptr);
EXPECT_EQ(gptr->NumVertices(0), 9);
EXPECT_EQ(gptr->NumVertices(1), 8);
}
#endif // _WIN32