Skip to content

Commit

Permalink
add show_mem (PaddlePaddle#249)
Browse files Browse the repository at this point in the history
Co-authored-by: root <[email protected]>
  • Loading branch information
huwei02 and root authored Apr 1, 2023
1 parent e126e56 commit 67d7ee9
Show file tree
Hide file tree
Showing 6 changed files with 48 additions and 37 deletions.
34 changes: 0 additions & 34 deletions paddle/fluid/framework/data_feed.cu
Original file line number Diff line number Diff line change
Expand Up @@ -1545,40 +1545,6 @@ int GraphDataGenerator::FillSlotFeature(uint64_t *d_walk, size_t key_num) {
return 0;
}

int GraphDataGenerator::FillFeatureBuf(uint64_t *d_walk,
uint64_t *d_feature,
size_t key_num) {
platform::CUDADeviceGuard guard(gpuid_);

auto gpu_graph_ptr = GraphGpuWrapper::GetInstance();
int ret = gpu_graph_ptr->get_feature_of_nodes(
gpuid_,
d_walk,
d_feature,
key_num,
slot_num_,
reinterpret_cast<int *>(d_slot_feature_num_map_->ptr()),
fea_num_per_node_);
return ret;
}

int GraphDataGenerator::FillFeatureBuf(
std::shared_ptr<phi::Allocation> d_walk,
std::shared_ptr<phi::Allocation> d_feature) {
platform::CUDADeviceGuard guard(gpuid_);

auto gpu_graph_ptr = GraphGpuWrapper::GetInstance();
int ret = gpu_graph_ptr->get_feature_of_nodes(
gpuid_,
reinterpret_cast<uint64_t *>(d_walk->ptr()),
reinterpret_cast<uint64_t *>(d_feature->ptr()),
buf_size_,
slot_num_,
reinterpret_cast<int *>(d_slot_feature_num_map_->ptr()),
fea_num_per_node_);
return ret;
}

// 对于deepwalk模式,尝试插入table,0表示插入成功,1表示插入失败;
// 对于sage模式,尝试插入table,table数量不够则清空table重新插入,返回值无影响。
int GraphDataGenerator::InsertTable(
Expand Down
3 changes: 0 additions & 3 deletions paddle/fluid/framework/data_feed.h
Original file line number Diff line number Diff line change
Expand Up @@ -907,9 +907,6 @@ class GraphDataGenerator {
int FillInferBuf();
void DoWalkandSage();
int FillSlotFeature(uint64_t* d_walk);
int FillFeatureBuf(uint64_t* d_walk, uint64_t* d_feature, size_t key_num);
int FillFeatureBuf(std::shared_ptr<phi::Allocation> d_walk,
std::shared_ptr<phi::Allocation> d_feature);
void FillOneStep(uint64_t* start_ids,
int etype_id,
uint64_t* walk,
Expand Down
40 changes: 40 additions & 0 deletions paddle/fluid/framework/fleet/heter_ps/gpu_graph_utils.h
Original file line number Diff line number Diff line change
Expand Up @@ -133,6 +133,46 @@ inline void debug_gpu_memory_info(const char* desc) {
<< "desc=" << desc;
}
}

inline void show_gpu_mem(const char* desc) {
CudaDeviceRestorer r;

int device_num = 0;
auto err = cudaGetDeviceCount(&device_num);
PADDLE_ENFORCE_EQ(
err,
cudaSuccess,
platform::errors::InvalidArgument("cudaGetDeviceCount failed!"));

size_t avail{0};
size_t total{0};
for (int i = 0; i < device_num; ++i) {
cudaSetDevice(i);
auto err = cudaMemGetInfo(&avail, &total);
PADDLE_ENFORCE_EQ(
err,
cudaSuccess,
platform::errors::InvalidArgument("cudaMemGetInfo failed!"));
VLOG(0) << "[" << desc << "] hbm on device " << i << ", "
<< "avail=" << avail / 1024.0 / 1024.0 / 1024.0 << "g, "
<< "total=" << total / 1024.0 / 1024.0 / 1024.0 << "g";
}
}

inline void show_cpu_mem(const char* desc) {
//MB
long virtual_mem = 0, resident_mem = 0;

FILE * fp = fopen("/proc/self/statm", "r");
if (NULL != fp) {
fscanf(fp, "%ld %ld", &virtual_mem, &resident_mem);
resident_mem = resident_mem * 4096 / 1000000;
virtual_mem = virtual_mem * 4096 / 1000000;
fclose(fp);
}

VLOG(0) << "[" << desc << "] mem used " << resident_mem << "MB";
}

}; // namespace framework
}; // namespace paddle
6 changes: 6 additions & 0 deletions paddle/fluid/framework/fleet/heter_ps/graph_gpu_wrapper.cu
Original file line number Diff line number Diff line change
Expand Up @@ -752,6 +752,12 @@ void GraphGpuWrapper::finalize() {
reinterpret_cast<GpuPsGraphTable *>(graph_table)->show_table_collisions();
}

void GraphGpuWrapper::show_mem(const char* msg)
{
show_cpu_mem(msg);
show_gpu_mem(msg);
}

// edge table
void GraphGpuWrapper::upload_batch(int table_type,
int slice_num,
Expand Down
1 change: 1 addition & 0 deletions paddle/fluid/framework/fleet/heter_ps/graph_gpu_wrapper.h
Original file line number Diff line number Diff line change
Expand Up @@ -198,6 +198,7 @@ class GraphGpuWrapper {
std::unordered_map<int, int>& get_graph_type_to_index();
std::string& get_node_type_size(std::string first_node_type);
std::string& get_edge_type_size();
void show_mem(const char* msg);

std::unordered_map<std::string, int> edge_to_id, node_to_id;
std::vector<std::string> id_to_feature, id_to_edge;
Expand Down
1 change: 1 addition & 0 deletions paddle/fluid/pybind/fleet_py.cc
Original file line number Diff line number Diff line change
Expand Up @@ -389,6 +389,7 @@ void BindGraphGpuWrapper(py::module* m) {
bool>(
&GraphGpuWrapper::load_edge_file))
.def("load_node_and_edge", &GraphGpuWrapper::load_node_and_edge)
.def("show_mem", &GraphGpuWrapper::show_mem)
.def("upload_batch",
py::overload_cast<int, int, const std::string&>(
&GraphGpuWrapper::upload_batch))
Expand Down

0 comments on commit 67d7ee9

Please sign in to comment.