Oneflow-Inc · mergify · Apr 9, 2022 · Apr 2, 2022 · Apr 2, 2022 · Apr 6, 2022
@@ -7,6 +7,8 @@ ONEFLOW.CUDA
     :members: is_available,
         device_count,
         current_device,
+        manual_seed_all,
+        manual_seed,
         HalfTensor,
         FloatTensor,
         DoubleTensor,

@@ -178,6 +178,11 @@ oneflow
             CharTensor,
             IntTensor,
             LongTensor,
+            seed,
+            manual_seed,
+            initial_seed,
+            get_rng_state,
+            set_rng_state,
 
 .. autofunction:: oneflow.relu
 .. autofunction:: oneflow.set_num_threads
diff --git a/oneflow/api/python/framework/random_generator.cpp b/oneflow/api/python/framework/random_generator.cpp
@@ -22,6 +22,18 @@ namespace py = pybind11;
 
 namespace oneflow {
 
+namespace {
+
+int64_t UnpackLong(PyObject* py_obj) {
+  int overflow = -1;
+  long long val = PyLong_AsLongLongAndOverflow(py_obj, &overflow);
+  if (val == -1 && PyErr_Occurred()) { throw std::runtime_error("Python exception occurs"); }
+  if (overflow != 0) { throw std::runtime_error("Overflow when unpacking long"); }
+  return (int64_t)val;
+}
+
+}  // namespace
+
 Maybe<one::Generator> CreateGenerator(const std::string& device_tag) {
   std::string device_name = "";
   int device_index = -1;
@@ -34,21 +46,36 @@ ONEFLOW_API_PYBIND11_MODULE("", m) {
       .def(py::init([](const std::string& device_tag) {
         return CreateGenerator(device_tag).GetPtrOrThrow();
       }))
-      .def("manual_seed", &one::Generator::set_current_seed)
+      .def("manual_seed",
+           [](std::shared_ptr<one::Generator> generator, const py::object& seed) {
+             int64_t seed_val = UnpackLong(seed.ptr());
+             generator->set_current_seed(seed_val);
+           })
       .def("initial_seed", &one::Generator::current_seed)
       .def("seed", &one::Generator::seed)
       .def_property_readonly("device", &one::Generator::device)
       .def("get_state", &one::Generator::GetState)
       .def("set_state", &one::Generator::SetState);
 
-  m.def("manual_seed", [](uint64_t seed) { return one::ManualSeed(seed); });
+  m.def("manual_seed", [](const py::object& seed) -> Maybe<one::Generator> {
+    int64_t seed_val = UnpackLong(seed.ptr());
+    return one::ManualSeed(seed_val);
+  });
+  m.def("manual_seed", [](const py::object& seed, const std::string& device, int device_index) {
+    int64_t seed_val = UnpackLong(seed.ptr());
+    return one::ManualSeed(seed_val, device, device_index);
+  });
   m.def("create_generator", &CreateGenerator);
   m.def("default_generator", [](const std::string& device_tag) -> Maybe<one::Generator> {
     std::string device_name = "";
     int device_index = -1;
     JUST(ParsingDeviceTag(device_tag, &device_name, &device_index));
     return one::DefaultGenerator(device_name, device_index);
   });
+  m.def("ManualSeedAllCudaGenerator", [](const py::object& seed) {
+    int64_t seed_val = UnpackLong(seed.ptr());
+    return one::ManualSeedAllCudaGenerator(seed_val);
+  });
 }
 
 }  // namespace oneflow
@@ -24,11 +24,35 @@ limitations under the License.
 namespace oneflow {
 namespace one {
 
-Maybe<void> ManualSeed(uint64_t seed) {
-  JUST(DefaultAutoGenerator())->set_current_seed(seed);
+Maybe<Generator> ManualSeed(uint64_t seed) {
+  const auto& default_auto_generator = JUST(DefaultAutoGenerator());
+  default_auto_generator->set_current_seed(seed);
+  return default_auto_generator;
+}
+
+Maybe<void> ManualSeed(uint64_t seed, const std::string& device, int device_index) {
+  if (device == "cpu") {
+    JUST(DefaultCPUGenerator())->set_current_seed(seed);
+  }
+#ifdef WITH_CUDA
+  else if (device == "cuda") {
+    JUST(DefaultCUDAGenerator(device_index))->set_current_seed(seed);
+  }
+#endif  // WITH_CUDA
+  else if (device == "auto") {
+    JUST(DefaultAutoGenerator())->set_current_seed(seed);
+  } else {
+    return Error::RuntimeError() << "Invalid device " << device
+                                 << " for making generator, please make sure the device is one of "
+                                 << PrintAvailableDevices();
+  }
   return Maybe<void>::Ok();
 }
 
+Maybe<void> ManualSeed(uint64_t seed, DeviceType device, int device_index) {
+  return ManualSeed(seed, DeviceTypeName(device), device_index);
+}
+
 namespace detail {
 
 uint64_t GetNonDeterministicRandom() {
@@ -99,6 +123,17 @@ Maybe<Generator> MakeCUDAGenerator(int device_index) {
 }
 #endif  // WITH_CUDA
 
+Maybe<void> ManualSeedAllCudaGenerator(uint64_t seed) {
+#ifdef WITH_CUDA
+  static int device_count = GetCudaDeviceCount();
+  FOR_RANGE(int, device_id, 0, device_count) {
+    const auto& cuda_gen = JUST(DefaultCUDAGenerator(device_id));
+    cuda_gen->set_current_seed(seed);
+  }
+#endif  // WITH_CUDA
+  return Maybe<void>::Ok();
+}
+
 Maybe<Generator> MakeGenerator(const std::string& device, int device_index) {
   if (device == "cpu") {
     return MakeCPUGenerator();

@@ -66,7 +66,10 @@ class Generator final {
   std::shared_ptr<GeneratorImpl> impl_;
 };
 
-Maybe<void> ManualSeed(uint64_t seed);
+Maybe<Generator> ManualSeed(uint64_t seed);
+
+Maybe<void> ManualSeed(uint64_t seed, const std::string& device, int device_index = -1);
+Maybe<void> ManualSeed(uint64_t seed, DeviceType device, int device_index = -1);
 
 Maybe<Generator> DefaultGenerator(const std::string& device, int device_index = -1);
 Maybe<Generator> DefaultGenerator(DeviceType device, int device_index = -1);
@@ -84,6 +87,7 @@ Maybe<Generator> MakeCPUGenerator();
 Maybe<Generator> DefaultCUDAGenerator(int device_index = -1);
 Maybe<Generator> MakeCUDAGenerator();
 #endif  // WITH_CUDA
+Maybe<void> ManualSeedAllCudaGenerator(uint64_t seed);
 
 }  // namespace one
 }  // namespace oneflow

@@ -16,13 +16,15 @@ limitations under the License.
 #include "oneflow/core/framework/random_generator_impl.h"
 
 #include "oneflow/core/common/util.h"
+#include "oneflow/core/common/cpp_attribute.h"
 #include "oneflow/core/framework/device.h"
 #include "oneflow/core/framework/instructions_builder.h"
 #include "oneflow/core/framework/tensor_util.h"
 #include "oneflow/core/functional/functional.h"
 #include "oneflow/core/job/env_global_objects_scope.h"
 #include "oneflow/core/register/ofblob.h"
 #include "oneflow/core/vm/vm_util.h"
+#include "oneflow/core/platform/include/pthread_fork.h"
 #ifdef WITH_CUDA
 #include "oneflow/core/device/cuda_util.h"
 #include <cuda.h>
@@ -224,7 +226,10 @@ void AutoGeneratorImpl::set_current_seed(uint64_t seed) {
   CHECK_JUST(CPUSynchronize());
   std::lock_guard<std::mutex> lock(mutex_);
   seed_ = seed;
-  for (const auto& it : generators_) { it.second->set_current_seed(seed); }
+  for (const auto& it : generators_) {
+    if (unlikely(pthread_fork::IsForkedSubProcess() && it.first.device_type == kCUDA)) { continue; }
+    it.second->set_current_seed(seed);
+  }
 }
 
 struct AutoGeneratorState {

diff --git a/python/oneflow/__init__.py b/python/oneflow/__init__.py
@@ -292,7 +292,9 @@ def atexit_hook(hook):
 from oneflow.framework.generator import create_generator as Generator
 from oneflow.framework.generator import (
     default_generator,
+    seed,
     manual_seed,
+    initial_seed,
     get_rng_state,
     set_rng_state,
 )

diff --git a/python/oneflow/cuda/__init__.py b/python/oneflow/cuda/__init__.py
@@ -33,3 +33,38 @@ def device_count() -> int:
 def current_device() -> int:
     r"""Returns local rank as device index."""
     return flow._oneflow_internal.GetCudaDeviceIndex()
+
+
+def manual_seed_all(seed) -> None:
+    r"""The documentation is referenced from:
+    https://pytorch.org/docs/stable/generated/torch.cuda.manual_seed_all.html?highlight=manual_seed_all
+
+    Sets the seed for generating random numbers on all GPUs.
+    It's safe to call this function if CUDA is not available; in that
+    case, it is silently ignored.
+
+    Args:
+        seed (int): The desired seed.
+    """
+    seed = int(seed)
+    flow._oneflow_internal.ManualSeedAllCudaGenerator(seed)
+
+
+def manual_seed(seed: int) -> None:
+    r"""The documentation is referenced from:
+    https://pytorch.org/docs/stable/generated/torch.cuda.manual_seed.html?highlight=manual_seed
+
+    Sets the seed for generating random numbers for the current GPU.
+    Unlike :func:`manual_seed_all`, this call is not ignored when OneFlow is
+    built without CUDA; the "cuda" device is then rejected as an invalid device.
+
+    Args:
+        seed (int): The desired seed.
+
+    .. warning::
+        If you are working with a multi-GPU model, this function is insufficient
+        to get determinism.  To seed all GPUs, use :func:`manual_seed_all`.
+    """
+    seed = int(seed)
+    idx = current_device()
+    flow._oneflow_internal.manual_seed(seed, "cuda", idx)
diff --git a/python/oneflow/framework/docstr/constant.py b/python/oneflow/framework/docstr/constant.py
@@ -67,7 +67,7 @@
     """
     new_ones(x, size=None, dtype=None, device=None, placement=None, sbp=None, requires_grad=False) -> Tensor
 
-    Returns a Tensor of size size filled with 1. By default, the returned Tensor has the same torch.dtype and torch.device as this tensor.
+    Returns a Tensor of size size filled with 1. By default, the returned Tensor has the same oneflow.dtype and oneflow.device as this tensor.
 
     Args:
         size (int...): a list, tuple, or flow.Size of integers defining the shape of the output tensor.

diff --git a/python/oneflow/framework/docstr/math_ops.py b/python/oneflow/framework/docstr/math_ops.py
@@ -1460,9 +1460,9 @@
     r"""
     Splits input, a tensor with one or more dimensions, into multiple tensors horizontally according to indices_or_sections.
     Each split is a view of input.
-    If input is one dimensional this is equivalent to calling torch.tensor_split(input, indices_or_sections, dim=0) 
+    If input is one dimensional this is equivalent to calling oneflow.tensor_split(input, indices_or_sections, dim=0) 
     (the split dimension is zero), and if input has two or more dimensions it’s equivalent to calling 
-    torch.tensor_split(input, indices_or_sections, dim=1) (the split dimension is 1), except that if indices_or_sections
+    oneflow.tensor_split(input, indices_or_sections, dim=1) (the split dimension is 1), except that if indices_or_sections
     is an integer it must evenly divide the split dimension or a runtime error will be thrown.
     The documentation is referenced from:
     https://pytorch.org/docs/stable/generated/torch.hsplit.html#torch.hsplit
@@ -1503,7 +1503,7 @@
     r"""
     Splits input, a tensor with two or more dimensions, into multiple tensors vertically according to indices_or_sections.
     Each split is a view of input.
-    This is equivalent to calling torch.tensor_split(input, indices_or_sections, dim=0) (the split dimension is 0),
+    This is equivalent to calling oneflow.tensor_split(input, indices_or_sections, dim=0) (the split dimension is 0),
     except that if indices_or_sections is an integer it must evenly divide the split dimension or a runtime error will be thrown.
     The documentation is referenced from:
     https://pytorch.org/docs/stable/generated/torch.vsplit.html#torch.vsplit

diff --git a/python/oneflow/framework/generator.py b/python/oneflow/framework/generator.py
@@ -23,8 +23,43 @@ def create_generator(device=None):
     return oneflow._oneflow_internal.create_generator(device)
 
 
-def manual_seed(seed):
+def seed() -> int:
+    r"""The documentation is referenced from:
+    https://pytorch.org/docs/stable/generated/torch.seed.html
+
+    Sets the seed for generating random numbers to a non-deterministic
+    random number. Returns a 64 bit number used to seed the RNG.
+    """
+    seed = default_generator.seed()
     oneflow._oneflow_internal.manual_seed(seed)
+    return seed
+
+
+def manual_seed(seed):
+    r"""The documentation is referenced from:
+    https://pytorch.org/docs/stable/generated/torch.manual_seed.html
+
+    Sets the seed for generating random numbers. Returns a
+    `oneflow.Generator` object.
+
+    Args:
+        seed (int): The desired seed. Value must be within the inclusive range
+            `[-0x8000_0000_0000_0000, 0x7fff_ffff_ffff_ffff]`. Otherwise, a RuntimeError
+            is raised. Negative inputs are remapped to positive values with the formula
+            `0x1_0000_0000_0000_0000 + seed`.
+    """
+    seed = int(seed)
+    return oneflow._oneflow_internal.manual_seed(seed)
+
+
+def initial_seed() -> int:
+    r"""The documentation is referenced from:
+    https://pytorch.org/docs/stable/_modules/torch/random.html
+
+    Returns the initial seed for generating random numbers as a
+    Python `int`.
+    """
+    return default_generator.initial_seed()
 
 
 def _getstate(self):
@@ -37,15 +72,26 @@ def _setstate(self, state_dict):
 
 
 def get_rng_state():
-    """
-    returns the state of the default random number generator
+    r"""The documentation is referenced from:
+    https://pytorch.org/docs/stable/generated/torch.get_rng_state.html
+
+    Returns the state of the default random number generator.
+
+    .. note:: This function only works for CPU. For CUDA, please use
+              oneflow.manual_seed(seed), which works for both CPU and CUDA.
+
+    Returns:
+        oneflow.ByteTensor: The current random number generator state.
     """
     return oneflow.default_generator.get_state()
 
 
 def set_rng_state(state):
-    """
-    sets the state of the default random number generator to the given state
+    """The documentation is referenced from:
+    https://pytorch.org/docs/stable/generated/torch.set_rng_state.html
+
+    Sets the state of the default random number generator to the given
+    ``state`` (a `oneflow.ByteTensor`).
     """
 
     return oneflow.default_generator.set_state(state)

diff --git a/python/oneflow/nn/modules/empty.py b/python/oneflow/nn/modules/empty.py
@@ -39,7 +39,7 @@ def empty_op(
         size (int... or oneflow.Size): Defining the shape of the output tensor.
           Can be a variable number of arguments or a collection like a list or tuple or oneflow.Size.
         dtype (flow.dtype, optional): The desired data type of returned tensor. Default: ``flow.float32``.
-        device (torch.device, optional): The desired device of returned local tensor. If None, uses the
+        device (oneflow.device, optional): The desired device of returned local tensor. If None, uses the
           current device.
         placement (flow.placement, optional): The desired device of returned global tensor. If None, will
           construct local tensor.