Skip to content

Commit

Permalink
add pglbox big data benchmark (PaddlePaddle#988)
Browse files Browse the repository at this point in the history
* fix wide_deep gpups error when run in py>3.7

* set FLAGS_dynamic_static_unified_comm=False when psgpu

* [windows] fix trainer divide-by-zero bug

* add lightgcn and transformer_conv pglbox

* add centos PDC images for pglbox

* fix pscpu benchmark

* fix pscpu benchmark install paddle

* add pglbox big data benchmark
  • Loading branch information
fightfat authored Mar 12, 2024
1 parent b51e032 commit 052f058
Show file tree
Hide file tree
Showing 2 changed files with 44 additions and 3 deletions.
6 changes: 3 additions & 3 deletions test_tipc/prepare.sh
Original file line number Diff line number Diff line change
Expand Up @@ -542,21 +542,21 @@ elif [ ${model_name} == "dpin" ]; then
cp -r ./models/rank/dpin/data/* ./test_tipc/data/train
cp -r ./datasets/KDD2012_track2/test/* ./test_tipc/data/infer
fi
elif [ ${model_name} == "deep_walk" ]; then
elif [[ ${model_name} =~ "deep_walk" ]]; then
if [ ${MODE} = "benchmark_train" ];then
python -m pip install paddlenlp==2.0.0rc16
python -m pip install protobuf==3.20.0 -U
python -m pip install pgl -U
python -m pip install gpustat==1.0.0 -U
fi
elif [ ${model_name} == "lightgcn" ]; then
elif [[ ${model_name} =~ "lightgcn" ]]; then
if [ ${MODE} = "benchmark_train" ];then
python -m pip install paddlenlp==2.0.0rc16
python -m pip install protobuf==3.20.0 -U
python -m pip install pgl -U
python -m pip install gpustat==1.0.0 -U
fi
elif [ ${model_name} == "transformer_conv" ]; then
elif [[ ${model_name} =~ "transformer_conv" ]]; then
if [ ${MODE} = "benchmark_train" ];then
python -m pip install paddlenlp==2.0.0rc16
python -m pip install protobuf==3.20.0 -U
Expand Down
41 changes: 41 additions & 0 deletions test_tipc/test_train_inference_python.sh
Original file line number Diff line number Diff line change
Expand Up @@ -318,8 +318,49 @@ if [ ${MODE} = "benchmark_train" ]; then
sed -i '/tar -zxvf dependency_py310.tar.gz/d' tools/run_pglbox.sh
sed -i '/rm dependency_py310.tar.gz/d' tools/run_pglbox.sh
fi
#######################################
# Replace the last "<key>:" line of a config file with "<key>: <value>".
# Only the last matching line is rewritten; earlier matches are left alone.
# The replacement line is written without leading indentation.
# Arguments:
#   $1 - path of the config file to edit in place
#   $2 - key name without the trailing colon (used verbatim in a sed regex)
#   $3 - value text, written verbatim after "<key>: " (include quotes if needed)
# Outputs:
#   a warning on stderr when no line matches
# Returns:
#   0 when the line was replaced, 1 when the key was not found
#######################################
pglbox_set_config_value() {
    local file=$1
    local key=$2
    local value=$3
    local line
    # `=` prints the number of every matching line; keep only the last one.
    line=$(sed -n -e "/${key}:/=" "${file}" | tail -n 1)
    # An empty address would make the sed commands below apply to EVERY line
    # (append after each line, then delete them all), so bail out instead.
    if [[ -z "${line}" ]]; then
        echo "warning: '${key}:' not found in ${file}; file left unchanged" >&2
        return 1
    fi
    # Insert the new line right after the old one, then drop the old one.
    sed -i "${line}a${key}: ${value}" "${file}"
    sed -i "${line}d" "${file}"
}
if [[ ${SYS_JOB_NAME} && ${SYS_JOB_NAME} =~ 'CE' ]]; then
    # When SYS_JOB_NAME contains "CE", point the config at the graph data
    # described by the graph_data_* variables and force num_part to 1000.
    pglbox_set_config_value "${gpu_config_value}" graph_data_fs_name "\"${graph_data_fs_name}\""
    pglbox_set_config_value "${gpu_config_value}" graph_data_fs_ugi "\"${graph_data_fs_ugi}\""
    pglbox_set_config_value "${gpu_config_value}" graph_data_hdfs_path "\"${graph_data_hdfs_path}\""
    pglbox_set_config_value "${gpu_config_value}" graph_data_local_path "\"${graph_data_local_path}\""
    pglbox_set_config_value "${gpu_config_value}" num_part 1000

    # Download the file at graph_eval_url into tools/.
    wget "${graph_eval_url}" --no-check-certificate -P tools/
fi
# Run the training script (traced with -x).
sh -x tools/run_pglbox.sh
if [[ ${SYS_JOB_NAME} && ${SYS_JOB_NAME} =~ 'CE' ]]; then
    # When SYS_JOB_NAME contains "CE", run the graph evaluation script on the
    # same config and capture stdout and stderr in graph_eval.log.
    # Quoted so that paths containing spaces neither split nor trigger an
    # "ambiguous redirect".
    sh tools/run_graph_eval.sh "${gpu_config_value}" > "${BENCHMARK_LOG_DIR}/graph_eval.log" 2>&1
    # Remove the local graph data directory. Skip when the variable is empty,
    # and quote it so a path with spaces or glob characters cannot expand into
    # unrelated operands for rm -rf.
    if [[ -n "${graph_data_local_path}" ]]; then
        rm -rf -- "${graph_data_local_path}"
    fi
fi
fi
elif [ ${MODE} = "whole_infer" ] || [ ${MODE} = "klquant_whole_infer" ]; then
GPUID=$3
Expand Down

0 comments on commit 052f058

Please sign in to comment.