Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Support 0-size tensor in parameter creating, forward and backward #70504

Merged
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
Show all changes
23 commits
Select commit Hold shift + click to select a range
02aa39d
support 0-size tensor forward and backward under simple operations pr…
HydrogenSulfate Dec 27, 2024
a18f2cc
Merge branch 'develop' into support_0-size_fwd_bwd
HydrogenSulfate Dec 27, 2024
288b863
fix error message format
HydrogenSulfate Dec 31, 2024
665698a
support initializing for 0-size tensor
HydrogenSulfate Dec 31, 2024
a157537
add TestZeroSizeParameter
HydrogenSulfate Dec 31, 2024
130251d
update forward, backward with 0-size tensor in eager/static mode
HydrogenSulfate Dec 31, 2024
7b396b4
Merge branch 'develop' into support_0-size_fwd_bwd
HydrogenSulfate Dec 31, 2024
2442cde
TestZeroSizeBackward skip XPU for place issue
HydrogenSulfate Jan 2, 2025
fc4aff3
Merge branch 'develop' into support_0-size_fwd_bwd
HydrogenSulfate Jan 2, 2025
c9267a9
[PIR] Insert backward ops into insertion point
SigureMo Jan 2, 2025
b0a87da
fix 2 ut
SigureMo Jan 2, 2025
68f0af9
Merge branch 'PaddlePaddle:develop' into support_0-size_fwd_bwd
HydrogenSulfate Jan 3, 2025
49f235d
Merge branch '70595' into support_0-size_fwd_bwd
HydrogenSulfate Jan 3, 2025
7614038
fix add_n infermeta when meeting 0-size and update UT
HydrogenSulfate Jan 3, 2025
16744ee
Merge branch 'develop' into support_0-size_fwd_bwd
HydrogenSulfate Jan 3, 2025
2d7cbf1
remove warnings
HydrogenSulfate Jan 3, 2025
5f71752
remove print
HydrogenSulfate Jan 3, 2025
89f3195
Merge branch 'PaddlePaddle:develop' into support_0-size_fwd_bwd
HydrogenSulfate Jan 3, 2025
e026da1
remove unnecessary code
HydrogenSulfate Jan 5, 2025
d416e30
Merge branch 'support_0-size_fwd_bwd' of https://github.com/HydrogenS…
HydrogenSulfate Jan 5, 2025
942f58b
remove condition of define() for paddle::Tensor
HydrogenSulfate Jan 6, 2025
da2ede8
Merge branch 'develop' into support_0-size_fwd_bwd
HydrogenSulfate Jan 6, 2025
aca7ba3
fix
HydrogenSulfate Jan 6, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Prev Previous commit
fix
  • Loading branch information
HydrogenSulfate committed Jan 6, 2025
commit aca7ba3d0bc8b2ec3c29230a836940584b109ad5
8 changes: 4 additions & 4 deletions paddle/fluid/eager/grad_node_info.cc
Original file line number Diff line number Diff line change
Expand Up @@ -106,7 +106,7 @@ void GradNodeBase::SetGradInMeta(const paddle::Tensor& fwd_out,
}

if (!fwd_out.has_allocation()) {
if (fwd_out.is_dist_tensor() &&
if (fwd_out.defined() && fwd_out.is_dist_tensor() &&
phi::distributed::NeedComputationClipForPP(fwd_out.impl())) {
VLOG(3) << "Tensor " << fwd_out.name() << " is DistTensor,"
<< " and needs computation clip for pipeline parallel."
Expand Down Expand Up @@ -196,7 +196,7 @@ void GradNodeBase::SetGradInMeta(const std::vector<paddle::Tensor>& fwd_out,
}

if (!fwd_out_tensor.has_allocation()) {
if (fwd_out_tensor.is_dist_tensor() &&
if (fwd_out_tensor.defined() && fwd_out_tensor.is_dist_tensor() &&
phi::distributed::NeedComputationClipForPP(fwd_out_tensor.impl())) {
VLOG(3) << "Tensor " << fwd_out_tensor.name() << " is DistTensor,"
<< " and needs computation clip for pipeline parallel."
Expand Down Expand Up @@ -295,8 +295,8 @@ void GradNodeBase::SetGradInMeta(const std::vector<paddle::Tensor*>& fwd_out,
meta.SetStopGradient(fwd_out_meta->StopGradient());
}

if (!(fwd_out_tensor.has_allocation())) {
if (fwd_out_tensor.is_dist_tensor() &&
if (!fwd_out_tensor.has_allocation()) {
if (fwd_out_tensor.defined() && fwd_out_tensor.is_dist_tensor() &&
phi::distributed::NeedComputationClipForPP(fwd_out_tensor.impl())) {
VLOG(3) << "Tensor " << fwd_out_tensor.name() << " is DistTensor,"
<< " and needs computation clip for pipeline parallel."
Expand Down
4 changes: 2 additions & 2 deletions paddle/fluid/eager/tensor_wrapper.h
Original file line number Diff line number Diff line change
Expand Up @@ -92,7 +92,7 @@ class TensorWrapper {
} else {
#ifndef PADDLE_NO_PYTHON
if (egr::SavedTensorsHooks::GetInstance().IsEnable() &&
tensor.is_dense_tensor() && tensor.has_allocation()) {
tensor.has_allocation() && tensor.is_dense_tensor()) {
phi::DenseTensor* dense_tensor =
static_cast<phi::DenseTensor*>(tensor.impl().get());
intermediate_tensor_.set_impl(std::make_shared<phi::DenseTensor>(
Expand All @@ -102,7 +102,7 @@ class TensorWrapper {
unpack_hook_ = egr::SavedTensorsHooks::GetInstance().GetUnPackHook();
packed_value_ = (*pack_hook)(tensor);
} else if (egr::SavedTensorsHooks::GetInstance().IsEnable() &&
tensor.is_dist_tensor() && tensor.initialized()) {
tensor.initialized() && tensor.is_dist_tensor()) {
intermediate_tensor_.set_impl(
std::make_shared<phi::distributed::DistTensor>(
tensor.dims(),
Expand Down
6 changes: 3 additions & 3 deletions paddle/fluid/eager/utils.cc
Original file line number Diff line number Diff line change
Expand Up @@ -556,7 +556,7 @@ void EagerUtils::FillZeroForEmptyOptionalGradInput(
const std::vector<GradSlotMeta>& grad_in_metas) {
for (size_t i = 0; i < in_grads->size(); i++) {
paddle::Tensor& grad = (*in_grads)[i];
if (!grad.has_allocation() && grad_in_metas[i].HasTensorMeta()) {
if (!grad.initialized() && grad_in_metas[i].HasTensorMeta()) {
if (grad_in_metas[i].IsDistMeta()) {
grad.set_impl(std::make_shared<phi::distributed::DistTensor>(
grad_in_metas[i].DistTensorGlobalDims(),
Expand Down Expand Up @@ -591,8 +591,8 @@ void EagerUtils::FillZeroForEmptyOptionalGradOutput(
continue;
}
paddle::Tensor& grad = (*output_grads)[i];
if (!grad.has_allocation() && grad_output_metas[i].HasTensorMeta()) {
if (grad.is_selected_rows()) {
if (!grad.initialized() && grad_output_metas[i].HasTensorMeta()) {
if (grad.defined() && grad.is_selected_rows()) {
continue;
}
if (grad_output_metas[i].IsDistMeta()) {
Expand Down
Loading