Fix `normal_` memory issue on GPU (#2107)

lvyufeng · web-flow · commit 4391752a85bb · 2025-08-01T11:23:57.000+08:00
diff --git a/mindnlp/core/_tensor.py b/mindnlp/core/_tensor.py
@@ -797,6 +797,9 @@ def tobytes(self):
     Tensor.index_add_ = ops.inplace_index_add
     StubTensor.index_add_ = ops.inplace_index_add
 
+    Tensor.erfinv_ = ops.inplace_erfinv
+    StubTensor.erfinv_ = ops.inplace_erfinv
+
 def _rebuild_from_type_v2(func, new_type, args, state):
     ret = func(*args)
     return ret
diff --git a/mindnlp/core/ops/creation.py b/mindnlp/core/ops/creation.py
@@ -12,6 +12,7 @@
 from mindspore.ops._primitive_cache import _get_cache_prim
 from ..configs import use_pyboost, ON_ORANGE_PI
 from .._bind import get_default_dtype, get_default_device
+from .._dtype import dtype2np
 from .utils import py2dtype
 from .other import finfo
 
@@ -195,11 +196,15 @@ def empty(*size, dtype=None, device=None, requires_grad=False, pin_memory=False,
             device = 'meta'
 
     # To avoid the problem in irecv and recv of using empty.
-    if device != 'meta':
+    if device not in ['meta', 'GPU']:
         out = mindspore.mint.empty(size, dtype=dtype, device=device)
     else:
         out = CTensor(dtype=dtype, shape=size)
         out = mindspore.Tensor(out)
+    # else:
+    #     out = np.empty(size, dtype=dtype2np[dtype])
+    #     out = mindspore.Tensor(out)
+
     if requires_grad:
         out.requires_grad = True
     return out
diff --git a/mindnlp/core/ops/inplace.py b/mindnlp/core/ops/inplace.py
@@ -1,4 +1,5 @@
 import numbers
+import numpy as np
 import mindspore
 from mindspore import ops
 from mindspore._c_expression import typing
@@ -7,7 +8,7 @@
 from mindspore.ops.auto_generate.gen_ops_prim import inplace_normal_op, inplace_scatter_value_op, inplace_scatter_src_reduce_op, \
     inplace_scatter_src_op, inplace_fill_tensor_op, inplace_fill_scalar_op, inplace_zero_op, inplace_uniform_op, \
     inplace_masked_fill_scalar_op, inplace_masked_fill_tensor_op, inplace_random_op, inplace_clamp_scalar_op, \
-    inplace_clamp_tensor_op, inplace_copy_op, inplace_index_add_op
+    inplace_clamp_tensor_op, inplace_copy_op, inplace_index_add_op, inplace_erfinv_op
 
 from mindnlp import core
 from ..configs import use_pyboost
@@ -50,7 +51,7 @@ def inplace_normal(input, mean=0, std=1, *, generator=None):
     if input.device.type == 'npu':
         inplace_normal_op(input, mean, std, seed, offset)
     else:
-        input.data = ops.normal(input.shape, mean, std)
+        input.data = core.tensor(np.random.normal(mean, std, input.shape), dtype=input.dtype)
     return input
 
 # uniform_
@@ -77,7 +78,8 @@ def inplace_uniform(input, *args, **kwargs):
     if input.device.type == 'npu':
         inplace_uniform_op(input, from_, to_, seed, offset)
     else:
-        input.data = core.rand(input.shape, generator=generator_, dtype=input.dtype) * (to_ - from_) + from_
+        input.data = core.tensor(np.random.uniform(from_, to_, input.shape), dtype=input.dtype)
+        # core.rand(input.shape, generator=generator_, dtype=input.dtype) * (to_ - from_) + from_
     return input
 
 def inplace_add(input, other, alpha):
@@ -227,6 +229,13 @@ def inplace_clamp(self, min=None, max=None):
         self.data = ops.clamp(self, min, max)
     return self
 
+def inplace_erfinv(self):  # erfinv_: overwrite self with erfinv(self), return self
+    if self.device.type != 'npu':
+        self.data = core.erfinv(self)  # out-of-place result is rebound to .data
+    else:
+        inplace_erfinv_op(self)  # generated in-place op, used only on 'npu'
+    return self
+
 __all__ = [
     'inplace_copy',
     'inplace_zero',
@@ -253,5 +262,6 @@ def inplace_clamp(self, min=None, max=None):
     'inplace_tril',
     'inplace_masked_fill',
     'inplace_random',
-    'inplace_clamp'
+    'inplace_clamp',
+    'inplace_erfinv'
 ]
diff --git a/mindnlp/core/ops/random.py b/mindnlp/core/ops/random.py
@@ -127,7 +127,8 @@ def randn(*size, generator=None, dtype=None, **kwargs):
         dtype = get_default_dtype()
     if use_pyboost() and has_randn:
         return mindspore.mint.randn(*new_size, generator=generator, dtype=dtype)
-    return ops.randn(*new_size, dtype=dtype)
+    # return ops.randn(*new_size, dtype=dtype)
+    return mindspore.Tensor(np.random.randn(*new_size), dtype=dtype)
 
 # randn_like
 has_randn_like = hasattr(mindspore.mint, 'randn_like')