mxnet
random.h
Go to the documentation of this file.
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one
3  * or more contributor license agreements. See the NOTICE file
4  * distributed with this work for additional information
5  * regarding copyright ownership. The ASF licenses this file
6  * to you under the Apache License, Version 2.0 (the
7  * "License"); you may not use this file except in compliance
8  * with the License. You may obtain a copy of the License at
9  *
10  * http://www.apache.org/licenses/LICENSE-2.0
11  *
12  * Unless required by applicable law or agreed to in writing,
13  * software distributed under the License is distributed on an
14  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15  * KIND, either express or implied. See the License for the
16  * specific language governing permissions and limitations
17  * under the License.
18  */
19 
26 #ifndef MSHADOW_RANDOM_H_
27 #define MSHADOW_RANDOM_H_
28 
29 #include <cstdlib>
30 #include <algorithm>
31 #include <random>
32 #include "./base.h"
33 #include "./tensor.h"
34 #include "./tensor_container.h"
35 
36 #if MSHADOW_IN_CXX11
37 #include <random> // use cxx11 random by default
38 #endif
39 
40 #if _MSC_VER
41 #define rand_r(x) rand()
42 #endif
43 
44 
45 namespace mshadow {
/*!
 * \brief random number generator, primary template.
 *  Only the cpu and gpu specializations below provide functionality.
 * \tparam Device the device the generator runs on
 * \tparam DType the data type of the generated samples
 */
template<typename Device, typename DType MSHADOW_DEFAULT_DTYPE>
class Random {};
53 
55 template<typename DType>
56 class Random<cpu, DType> {
57  public:
  /*!
   * \brief constructor of random engine
   * \param seed random number seed
   */
  explicit Random(int seed) {
    this->Seed(seed);
    // pre-allocate the buffer used by the gaussian()/uniform() expressions
    buffer_.Resize(Shape1(kRandBufferSize));
  }
  /*! \brief destructor; members clean up after themselves */
  ~Random(void) {
  }
  /*!
   * \brief seed random number generator using this seed
   * \param seed seed of prng
   */
  inline void Seed(int seed) {
#if MSHADOW_IN_CXX11
    rnd_engine_.seed(seed);
#endif
    // rseed_ is kept in both builds; the pre-C++11 path feeds it to rand_r
    this->rseed_ = static_cast<unsigned>(seed);
  }
  /*!
   * \brief get random seed used in random generator
   * \return seed in unsigned
   */
  inline unsigned GetSeed() const {
    return rseed_;
  }
  /*!
   * \brief set the stream of computation; a no-op on cpu
   * \param stream computation stream (unused)
   */
  inline void set_stream(Stream<cpu> *stream) {
  }
91 
92 // These samplers are only avail in C++11.
93 #if MSHADOW_IN_CXX11
94 
  /*!
   * \brief get a random unsigned integer
   * \return the next raw draw of the mt19937 engine
   */
  inline unsigned GetRandInt() {
    return rnd_engine_();
  }
102 
106  inline void GetRandInt(const Tensor<cpu, 1, unsigned>& dst) {
107  std::generate_n(dst.dptr_, dst.size(0), [&](){ return rnd_engine_(); });
108  }
109 
116  template<int dim, class Sampler>
117  inline void SampleDistribution(Tensor<cpu, dim, DType> *dst, Sampler sampler) {
118  if (dst->CheckContiguous()) {
119  std::generate_n(dst->dptr_, dst->shape_.Size(), sampler);
120  } else {
121  Tensor<cpu, 2, DType> mat = dst->FlatTo2D();
122  for (index_t i = 0; i < mat.size(0); ++i) {
123  std::generate_n(mat[i].dptr_, mat.size(1), sampler);
124  }
125  }
126  }
127 
  /*!
   * \brief generate uniformly distributed data
   * \param dst destination tensor
   * \param a lower bound
   * \param b upper bound
   * \tparam dim dimension of tensor
   * \tparam PType type of the bound parameters
   */
  template<int dim, typename PType>
  inline void SampleUniform(Tensor<cpu, dim, DType> *dst,
                            PType a = 0.0f , PType b = 1.0f ) {
    // Ensure that half_t is handled correctly.
    // Non-native-float DType samples in double; the assignment inside
    // SampleDistribution converts down to DType.
    typedef typename std::conditional<std::is_floating_point<DType>::value,
                                      DType, double>::type FType;
    // NOTE(review): integral DType uses uniform_int_distribution (closed
    // range [a, b]) while floating point uses uniform_real_distribution
    // (half-open [a, b)) -- callers should be aware of the difference.
    typedef typename std::conditional<std::is_integral<DType>::value,
                                      std::uniform_int_distribution<DType>,
                                      std::uniform_real_distribution<FType>>::type GType;
    GType dist_uniform(a, b);
    SampleDistribution(dst, [&](){ return dist_uniform(rnd_engine_);});
  }
147 
  /*!
   * \brief generate gaussian distributed data
   * \param dst destination tensor
   * \param mu mean
   * \param sigma standard deviation; if sigma <= 0 the tensor is filled with mu
   * \tparam dim dimension of tensor
   * \tparam PType type of the distribution parameters
   */
  template<int dim, typename PType>
  inline void SampleGaussian(Tensor<cpu, dim, DType> *dst,
                             PType mu = 0.0f, PType sigma = 1.0f ) {
    if (sigma <= 0) {
      // degenerate distribution: all mass at the mean
      *dst = mu; return;
    }
    // sample in DType when it is a native float type, otherwise in double
    typedef typename std::conditional<std::is_floating_point<DType>::value,
                                      DType, double>::type GType;
    std::normal_distribution<GType> dist_normal(mu, sigma);
    SampleDistribution(dst, [&](){ return dist_normal(rnd_engine_);});
  }
166 
  /*!
   * \brief generate gamma distributed data
   * \param dst destination tensor
   * \param alpha shape parameter of std::gamma_distribution
   * \param beta second parameter of std::gamma_distribution, i.e. its SCALE.
   *  NOTE(review): if callers interpret beta as a rate this is inverted --
   *  confirm the intended parameterization against call sites.
   * \tparam dim dimension of tensor
   * \tparam PType type of the distribution parameters
   */
  template<int dim, typename PType>
  inline void SampleGamma(Tensor<cpu, dim, DType> *dst,
                          PType alpha, PType beta) {
    typedef typename std::conditional<std::is_floating_point<DType>::value,
                                      DType, double>::type GType;
    std::gamma_distribution<GType> dist_gamma(alpha, beta);
    SampleDistribution(dst, [&](){ return dist_gamma(rnd_engine_);});
  }
182 
  /*!
   * \brief generate exponentially distributed data
   * \param dst destination tensor
   * \param lambda rate parameter of std::exponential_distribution
   * \tparam dim dimension of tensor
   * \tparam PType type of the rate parameter
   */
  template<int dim, typename PType>
  inline void SampleExponential(Tensor<cpu, dim, DType> *dst, PType lambda ) {
    typedef typename std::conditional<std::is_floating_point<DType>::value,
                                      DType, double>::type GType;
    std::exponential_distribution<GType> dist_exp(lambda);
    SampleDistribution(dst, [&](){ return dist_exp(rnd_engine_);});
  }
196 
  /*!
   * \brief generate Poisson distributed data
   * \param dst destination tensor
   * \param lambda rate parameter of std::poisson_distribution
   * \tparam dim dimension of tensor
   * \tparam PType type of the rate parameter
   */
  template<int dim, typename PType>
  inline void SamplePoisson(Tensor<cpu, dim, DType> *dst, PType lambda) {
    // the distribution must produce an integer type; fall back to int for
    // non-integral DType, then cast each sample to DType
    typedef typename std::conditional<std::is_integral<DType>::value, DType, int>::type GType;
    std::poisson_distribution<GType> dist_poisson(lambda);
    SampleDistribution(dst, [&](){ return static_cast<DType>(dist_poisson(rnd_engine_));});
  }
209 
  /*!
   * \brief generate negative-binomial distributed data
   * \param dst destination tensor
   * \param k first parameter of std::negative_binomial_distribution
   * \param p second parameter (success probability)
   * \tparam dim dimension of tensor
   * \tparam PType1 type of k
   * \tparam PType2 type of p
   */
  template<int dim, typename PType1, typename PType2>
  inline void SampleNegativeBinomial(Tensor<cpu, dim, DType> *dst, PType1 k, PType2 p) {
    // distribution requires an integer result type; cast to DType per sample
    typedef typename std::conditional<std::is_integral<DType>::value, DType, int>::type GType;
    std::negative_binomial_distribution<GType> dist_negbinomial(k, p);
    SampleDistribution(dst, [&](){ return static_cast<DType>(dist_negbinomial(rnd_engine_));});
  }
223 
  /*!
   * \brief generate data from a generalized negative binomial
   *  (gamma-Poisson mixture), parameterized by mean mu and dispersion alpha
   * \param dst destination tensor
   * \param mu mean of the distribution
   * \param alpha dispersion; alpha == 0 degenerates to Poisson(mu)
   * \tparam dim dimension of tensor
   * \tparam PType type of the distribution parameters
   */
  template<int dim, typename PType>
  inline void SampleGeneralizedNegativeBinomial(Tensor<cpu, dim, DType> *dst,
                                                PType mu, PType alpha) {
    if (alpha == PType(0)) {
      SamplePoisson(dst, mu); // limit of Poisson
    } else {
      // gamma shape r = 1/alpha and scale beta = mu*alpha give a gamma mean of mu
      PType r(PType(1) / alpha);
      PType beta = mu * alpha;
      // NOTE(review): gamma_distribution<> defaults to double here, unlike the
      // other samplers which derive the type from DType -- confirm intentional.
      std::gamma_distribution<> dist_gamma(r, beta);
      typedef typename std::conditional<std::is_integral<DType>::value, DType, int>::type GType;
      // each output sample draws a fresh gamma rate, then a Poisson with that rate
      SampleDistribution(dst,
        [&](){ std::poisson_distribution<GType> dist_poisson(dist_gamma(rnd_engine_));
               return static_cast<DType>(dist_poisson(rnd_engine_));});
    }
  }
247 #endif
248 
260  template<int dim>
261  inline expr::ReshapeExp<Tensor<cpu, 1, DType>, DType, dim, 1>
263  buffer_.Resize(Shape1(shape.Size()));
264  this->SampleGaussian(&buffer_, 0.0f, 1.0f);
265  return expr::reshape(buffer_, shape);
266  }
278  template<int dim>
279  inline expr::ReshapeExp<Tensor<cpu, 1, DType>, DType, dim, 1>
281  buffer_.Resize(Shape1(shape.Size()));
282  this->SampleUniform(&buffer_, 0.0f, 1.0f);
283  return expr::reshape(buffer_, shape);
284  }
285 
  /*! \brief expose the underlying C++11 engine for callers that need raw access */
  std::mt19937 &GetRndEngine() {
    return rnd_engine_;
  }
289 
 private:
#if MSHADOW_IN_CXX11
  /*! \brief use C++11 random engine */
  std::mt19937 rnd_engine_;
  /*! \brief random number seed, as passed to Seed() */
  unsigned rseed_;

#else

  /*! \brief random number seed consumed by rand_r in the fallback path */
  unsigned rseed_;
  // functions
  /*!
   * \brief pre-C++11 fallback: generate uniform data in [a, b)
   * \param dst destination tensor
   * \param a lower bound
   * \param b upper bound
   * \tparam dim dimension of tensor
   */
  template<int dim>
  inline void SampleUniform(Tensor<cpu, dim, DType> *dst,
                            DType a = 0.0f, DType b = 1.0f) {
    if (dst->CheckContiguous()) {
      this->GenUniform(dst->dptr_, dst->shape_.Size(), a, b);
    } else {
      // non-contiguous: fill row by row through a 2-D view
      Tensor<cpu, 2, DType> mat = dst->FlatTo2D();
      for (index_t i = 0; i < mat.size(0); ++i) {
        this->GenUniform(mat[i].dptr_, mat.size(1), a, b);
      }
    }
  }
  /*!
   * \brief pre-C++11 fallback: generate gaussian data
   * \param dst destination tensor
   * \param mu mean
   * \param sigma standard deviation; if sigma <= 0 the tensor is filled with mu
   * \tparam dim dimension of tensor
   */
  template<int dim>
  inline void SampleGaussian(Tensor<cpu, dim, DType> *dst,
                             DType mu = 0.0f, DType sigma = 1.0f) {
    if (sigma <= 0.0f) {
      // degenerate distribution: all mass at the mean
      *dst = mu; return;
    }
    if (dst->CheckContiguous()) {
      this->GenGaussian(dst->dptr_, dst->shape_.Size(), mu, sigma);
    } else {
      // non-contiguous: fill row by row through a 2-D view
      Tensor<cpu, 2, DType> mat = dst->FlatTo2D();
      for (index_t i = 0; i < mat.size(0); ++i) {
        this->GenGaussian(mat[i].dptr_, mat.size(1), mu, sigma);
      }
    }
  }
  /*! \brief fill dptr[0..size) with uniform floats in [a, b); RandNext() is in [0, 1) */
  inline void GenUniform(float *dptr, index_t size, float a, float b) {
    for (index_t j = 0; j < size; ++j) {
      dptr[j] = static_cast<float>(RandNext()) * (b - a) + a;
    }
  }
  /*! \brief fill dptr[0..size) with uniform doubles in [a, b); RandNext() is in [0, 1) */
  inline void GenUniform(double *dptr, index_t size, double a, double b) {
    for (index_t j = 0; j < size; ++j) {
      dptr[j] = static_cast<double>(RandNext()) * (b - a) + a;
    }
  }
  /*! \brief float overload: forwards to the shared GenGaussianX implementation */
  inline void GenGaussian(float *dptr, index_t size, float mu, float sigma) {
    this->GenGaussianX(dptr, size, mu, sigma);
  }
  /*! \brief double overload: forwards to the shared GenGaussianX implementation */
  inline void GenGaussian(double *dptr, index_t size, double mu, double sigma) {
    this->GenGaussianX(dptr, size, mu, sigma);
  }
  /*!
   * \brief fill dptr[0..size) with N(mu, sigma^2) samples.
   *  SampleNormal2D yields two independent standard normals per call; a pair
   *  is drawn on every even index and the spare is consumed on the odd index.
   */
  inline void GenGaussianX(DType *dptr, index_t size, DType mu, DType sigma) {
    DType g1 = 0.0f, g2 = 0.0f;
    for (index_t j = 0; j < size; ++j) {
      if ((j & 1) == 0) {
        this->SampleNormal2D(&g1, &g2);
        dptr[j] = mu + g1 * sigma;
      } else {
        dptr[j] = mu + g2 * sigma;
      }
    }
  }
  /*! \brief get next uniform sample in [0, 1); rand_r output divided by RAND_MAX + 1 */
  inline DType RandNext(void) {
    return static_cast<DType>(rand_r(&rseed_)) /
        (static_cast<DType>(RAND_MAX) + 1.0f);
  }
  /*!
   * \brief get next uniform sample in the OPEN interval (0, 1); the +1/+2
   *  shifts guarantee the result is never 0, keeping log(s) finite in
   *  SampleNormal2D
   */
  inline DType RandNext2(void) {
    return (static_cast<DType>(rand_r(&rseed_)) + 1.0f) /
        (static_cast<DType>(RAND_MAX) + 2.0f);
  }
  /*!
   * \brief sample two independent standard normals via the Marsaglia polar
   *  method: rejection-sample a point in the unit disk, then scale by
   *  sqrt(-2 log(s) / s); avoids trigonometric calls
   * \param xx_ output of the first standard normal
   * \param yy_ output of the second standard normal
   */
  inline void SampleNormal2D(DType *xx_, DType *yy_) {
    DType &xx = *xx_, &yy = *yy_;
    DType x, y, s;
    do {
      x = 2.0f * RandNext2() - 1.0f;
      y = 2.0f * RandNext2() - 1.0f;
      s = x * x + y * y;
      // reject points outside the unit disk and the degenerate origin
    } while (s >= 1.0f || s == 0.0f);
    DType t = std::sqrt(-2.0f * std::log(s) / s);
    xx = x * t; yy = y * t;
  }
382 #endif
383 
385 }; // class Random<cpu, DType>
386 
387 // only allow GPU PRNG when cuda is enabled
388 #if MSHADOW_USE_CUDA
389 
390 template<typename DType>
391 class Random<gpu, DType> {
392  public:
  /*!
   * \brief constructor of random engine
   * \param seed random number seed
   */
  explicit Random(int seed) : gen_(NULL) {
    // Seed() creates the cuRAND generator on first use (gen_ starts NULL)
    this->Seed(seed);
    buffer_.Resize(Shape1(kRandBufferSize));
  }
402  DeleteGenerator();
403  }
  /*!
   * \brief bind the cuRAND generator to a computation stream
   * \param stream computation stream; subsequent generation runs on it
   */
  inline void set_stream(Stream<gpu> *stream) {
    curandStatus_t status;
    status = curandSetStream(gen_, Stream<gpu>::GetStream(stream));

    CHECK_EQ(status, CURAND_STATUS_SUCCESS) << "set_stream CURAND failed";
  }
  /*!
   * \brief seed the cuRAND generator, (re)creating it when necessary
   * \param seed seed of prng
   */
  inline void Seed(int seed) {
    // Create a new rng, either initially or if the RNG type can't reset its offset.
    // (a failing curandSetGeneratorOffset doubles as the "can't reset" probe)
    if (gen_ == NULL || (curandSetGeneratorOffset(gen_, 0ULL) != CURAND_STATUS_SUCCESS))
      CreateGenerator();
    // Now set the seed.
    curandStatus_t status;
    status = curandSetPseudoRandomGeneratorSeed(gen_, static_cast<uint64_t>(seed));
    CHECK_EQ(status, CURAND_STATUS_SUCCESS) << "Set CURAND seed failed.";
  }
  /*!
   * \brief fill a 1-D device tensor with random unsigned integers
   * \param dst destination tensor on the gpu
   */
  inline void GetRandInt(const Tensor<gpu, 1, unsigned>& dst) {
    curandStatus_t status = curandGenerate(gen_, dst.dptr_, dst.size(0));
    CHECK_EQ(status, CURAND_STATUS_SUCCESS) << "CURAND Gen rand ints failed.";
  }
  /*!
   * \brief generate uniform data in [a, b); defined under __CUDACC__ below
   * \param dst destination tensor
   * \param a lower bound
   * \param b upper bound
   * \tparam dim dimension of tensor
   */
  template<int dim>
  inline void SampleUniform(Tensor<gpu, dim, DType> *dst,
                            DType a = 0.0f, DType b = 1.0f);

  /*!
   * \brief generate gaussian data; defined under __CUDACC__ below
   * \param dst destination tensor
   * \param mu mean
   * \param sigma standard deviation
   * \tparam dim dimension of tensor
   */
  template<int dim>
  inline void SampleGaussian(Tensor<gpu, dim, DType> *dst,
                             DType mu = 0.0f, DType sigma = 1.0f);
  /*!
   * \brief return a temporal expression of standard gaussian samples backed by
   *  buffer_; only valid until the next call that reuses the buffer
   */
  template<int dim>
  inline expr::ReshapeExp<Tensor<gpu, 1, DType>, DType, dim, 1>
  gaussian(Shape<dim> shape, DType mu = 0.0f, DType sigma = 1.0f);
  /*!
   * \brief return a temporal expression of standard uniform samples backed by
   *  buffer_; only valid until the next call that reuses the buffer
   */
  template<int dim>
  inline expr::ReshapeExp<Tensor<gpu, 1, DType>, DType, dim, 1>
  uniform(Shape<dim> shape);
485 
486  private:
  /*!
   * \brief generate size gaussian floats on the device.
   *  NOTE(review): per the caller's comment, curandGenerateNormal only
   *  supports an even number of elements -- callers must guarantee that.
   */
  inline void GenGaussian(float *dptr, size_t size, float mu, float sigma) {
    curandStatus_t status;
    status = curandGenerateNormal(gen_, dptr, size, mu, sigma);
    CHECK_EQ(status, CURAND_STATUS_SUCCESS) << "CURAND Gen Normal float failed."
                                            << " size = " << size
                                            << ",mu = " << mu
                                            << ",sigma = " << sigma;
  }
  /*!
   * \brief generate size gaussian doubles on the device.
   *  NOTE(review): per the caller's comment, curandGenerateNormalDouble only
   *  supports an even number of elements -- callers must guarantee that.
   */
  inline void GenGaussian(double *dptr, size_t size, double mu, double sigma) {
    curandStatus_t status;
    status = curandGenerateNormalDouble(gen_, dptr, size, mu, sigma);
    CHECK_EQ(status, CURAND_STATUS_SUCCESS) << "CURAND Gen Normal double failed."
                                            << " size = " << size
                                            << ",mu = " << mu
                                            << ",sigma = " << sigma;
  }
  /*! \brief generate size uniform floats on the device via curandGenerateUniform */
  inline void GenUniform(float *dptr, size_t size) {
    curandStatus_t status;
    status = curandGenerateUniform(gen_, dptr, size);
    CHECK_EQ(status, CURAND_STATUS_SUCCESS) << "CURAND Gen Uniform float failed."
                                            << " size = " << size;
  }
  /*! \brief generate size uniform doubles on the device via curandGenerateUniformDouble */
  inline void GenUniform(double *dptr, size_t size) {
    curandStatus_t status;
    status = curandGenerateUniformDouble(gen_, dptr, size);
    CHECK_EQ(status, CURAND_STATUS_SUCCESS) << "CURAND Gen Uniform double failed."
                                            << " size = " << size;
  }
  /*! \brief (re)create the cuRAND generator, destroying any existing one first */
  inline void CreateGenerator() {
    if (gen_ != NULL)
      DeleteGenerator();
    curandStatus_t status;
    status = curandCreateGenerator(&gen_, CURAND_RNG_PSEUDO_DEFAULT);
    CHECK_EQ(status, CURAND_STATUS_SUCCESS) << "Cannot create CURAND Generator";
  }
522  inline void DeleteGenerator() {
523  if (gen_ != NULL) {
524  curandStatus_t status;
525  status = curandDestroyGenerator(gen_);
526  CHECK_EQ(status, CURAND_STATUS_SUCCESS) << "Destory CURAND Gen failed";
527  gen_ = NULL;
528  }
529  }
531  curandGenerator_t gen_;
534 }; // class Random<gpu, DType>
535 #endif // MSHADOW_USE_CUDA
536 
537 #ifdef __CUDACC__
538 // implementations that depends on cuda kernels
539 template<typename DType>
540 template<int dim>
542  Tensor<gpu, dim, DType> *dst, DType a, DType b) {
543  if (a == 0.0f && b == 1.0f) {
544  if (dst->CheckContiguous()) {
545  this->GenUniform(dst->dptr_, dst->shape_.Size());
546  } else {
547  *dst = this->uniform(dst->shape_);
548  }
549  } else {
550  *dst = this->uniform(dst->shape_) * (b - a) + a;
551  }
552 }
553 template<typename DType>
554 template<int dim>
556  Tensor<gpu, dim, DType> *dst, DType mu, DType sigma) {
557  // We need to check whether the shape size is even since CuRand supports only normal distribution
558  // generation of even number of elements.
559  if (dst->CheckContiguous() && (dst->shape_.Size() % 2 == 0)) {
560  this->GenGaussian(dst->dptr_, dst->shape_.Size(), mu, sigma);
561  } else {
562  *dst = this->gaussian(dst->shape_, mu, sigma);
563  }
564 }
565 
/*!
 * \brief return a temporal expression of standard-gaussian samples reshaped to
 *  shape; the result aliases buffer_ and is only valid until the buffer is
 *  reused
 * \param shape requested output shape
 * \param mu mean
 * \param sigma standard deviation
 */
template<typename DType>
template<int dim>
inline expr::ReshapeExp<Tensor<gpu, 1, DType>, DType, dim, 1>
Random<gpu, DType>::gaussian(Shape<dim> shape, DType mu, DType sigma) {
  // curandGenerateNormal* only supports an even element count (see the
  // comment in SampleGaussian), so round the request up to even
  size_t aligned_sz = ((shape.Size() + 1UL) >> 1) << 1;
  // allocate aligned size, then shrink the logical size back to shape.Size().
  // NOTE(review): this relies on TensorContainer::Resize keeping the larger
  // allocation when shrinking, because GenGaussian below writes aligned_sz
  // elements -- verify against tensor_container.h.
  buffer_.Resize(Shape1(aligned_sz));
  buffer_.Resize(Shape1(shape.Size()));
  this->GenGaussian(buffer_.dptr_, aligned_sz, mu, sigma);
  return expr::reshape(buffer_, shape);
}
577 
578 template<typename DType>
579 template<int dim>
580 inline expr::ReshapeExp<Tensor<gpu, 1, DType>, DType, dim, 1>
582  buffer_.Resize(Shape1(shape.Size()));
583  this->GenUniform(buffer_.dptr_, buffer_.size(0));
584  return expr::reshape(buffer_, shape);
585 }
586 #endif // __CUDACC__
587 } // namespace mshadow
588 #endif // MSHADOW_RANDOM_H_
expr::ReshapeExp< Tensor< cpu, 1, DType >, DType, dim, 1 > gaussian(Shape< dim > shape)
return a temporal expression storing standard gaussian random variables the temporal tensor is only v...
Definition: random.h:262
random number generator
Definition: random.h:52
void Seed(int seed)
seed random number generator using this seed
Definition: random.h:418
DType * dptr_
pointer to the data
Definition: tensor.h:434
unsigned GetSeed() const
get random seed used in random generator
Definition: random.h:82
void Seed(int seed)
seed random number generator using this seed
Definition: random.h:72
Definition: stream_gpu-inl.h:37
~Random(void) MSHADOW_THROW_EXCEPTION
Definition: random.h:401
Shape< dimension > shape_
shape of the tensor
Definition: tensor.h:436
~Random(void)
Definition: random.h:66
expr::ReshapeExp< Tensor< cpu, 1, DType >, DType, dim, 1 > uniform(Shape< dim > shape)
return a temporal expression storing standard uniform [0,1) the temporal tensor is only valid before ...
Definition: random.h:280
header file of tensor data structure and functions This lib requires explicit memory allocation and d...
device name CPU
Definition: tensor.h:39
device name GPU
Definition: tensor.h:46
const unsigned kRandBufferSize
buffer size for each random number generator
Definition: base.h:336
void SampleExponential(real_t lambda, NDArray *out)
Sample exponential distribution for each elements of out.
int32_t index_t
type that will be used for index
Definition: base.h:343
ReshapeExp< SrcExp, DType, dimdst, ExpInfo< SrcExp >::kDim > reshape(const Exp< SrcExp, DType, etype > &src, Shape< dimdst > oshape)
a expression that reshapes a tensor to another shape
Definition: reshape.h:66
void SampleGaussian(real_t mu, real_t sigma, NDArray *out)
Sample gaussian distribution for each elements of out.
MSHADOW_XINLINE Tensor< Device, 2, DType > FlatTo2D(void) const
flatten the tensor to 2 dimension, collapse the higher dimensions together
Definition: tensor.h:519
tensor container that does memory allocation and resize like STL, use it to save the lines of FreeSpa...
Definition: tensor_container.h:40
MSHADOW_XINLINE index_t size(int idx) const
return size of i-th dimension, start counting from highest dimension
Definition: tensor.h:505
MSHADOW_XINLINE bool CheckContiguous(void) const
Definition: tensor.h:491
MSHADOW_XINLINE Shape< 1 > Shape1(index_t s0)
construct a one dimension shape, stride will equal s0
Definition: tensor.h:206
void GetRandInt(const Tensor< gpu, 1, unsigned > &dst)
get a set of random integers
Definition: random.h:430
void SampleUniform(real_t begin, real_t end, NDArray *out)
Sample uniform distribution for each elements of out.
reshape the content to another shape input: Tensor<Device,dimsrc>: ishape output: Tensor<Device...
Definition: reshape.h:39
std::mt19937 & GetRndEngine()
Definition: random.h:286
Random(int seed)
constructor of random engine
Definition: random.h:397
tensor container that does memory allocation and resize like STL
void set_stream(Stream< cpu > *stream)
set the stream of computation
Definition: random.h:89
Random(int seed)
constructor of random engine
Definition: random.h:62
overloaded + operator between half_t and bf16_t
Definition: base.h:334
#define MSHADOW_THROW_EXCEPTION
Definition: base.h:260
general tensor
Definition: tensor.h:420
void SamplePoisson(real_t lambda, NDArray *out)
Sample Poisson distribution for each elements of out.
void set_stream(Stream< gpu > *stream)
set the stream of computation
Definition: random.h:408
MSHADOW_XINLINE index_t Size(void) const
Definition: tensor.h:144
void SampleGamma(real_t alpha, real_t beta, NDArray *out)
Sample gamma distribution for each elements of out.
computation stream structure, used for asynchronous computations
Definition: tensor.h:383