1.3.1/doxygen/include_2mxnet_2base_8h_source.html

 /*
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  *   http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing,
  * software distributed under the License is distributed on an
  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
  * KIND, either express or implied.  See the License for the
  * specific language governing permissions and limitations
  * under the License.
  */

 #ifndef MXNET_BASE_H_
 #define MXNET_BASE_H_

 #include <dmlc/base.h>
 #include <dmlc/io.h>
 #include <dmlc/type_traits.h>
 #include <dmlc/parameter.h>
 #include <mshadow/tensor.h>
 // nnvm headers for symbolic construction.
 #include <nnvm/op.h>
 #include <nnvm/tuple.h>
 #include <nnvm/symbolic.h>
 #include <string>

 #ifndef MXNET_USE_OPENCV
 #define MXNET_USE_OPENCV 1
 #endif

 #ifndef MXNET_USE_CUDA
 #define MXNET_USE_CUDA MSHADOW_USE_CUDA
 #endif

 #ifndef MXNET_USE_CUDNN
 #define MXNET_USE_CUDNN MSHADOW_USE_CUDNN
 #endif

 #ifndef MXNET_USE_CUSOLVER
 #define MXNET_USE_CUSOLVER MSHADOW_USE_CUSOLVER
 #endif

 #define MXNET_GPU_NOT_ENABLED_ERROR  "GPU is not enabled"

 #if DMLC_USE_CXX11 && defined(__GNUC__) && !defined(__clang_version__)
 #if __GNUC__ == 4 && __GNUC_MINOR__ < 8
 #error "Currently we need g++ 4.8 or higher to fully support c++11 features"
 #define override
 #define final
 #endif
 #endif

 #ifdef _MSC_VER
 #ifdef MXNET_EXPORTS
 #define MXNET_API __declspec(dllexport)
 #else
 #define MXNET_API __declspec(dllimport)
 #endif
 #else
 #define MXNET_API
 #endif

 #ifndef MXNET_PREDICT_ONLY
 #define MXNET_PREDICT_ONLY 0
 #endif

 #define MXNET_MAJOR 1

 #define MXNET_MINOR 3

 #define MXNET_PATCH 1

 #define MXNET_VERSION (MXNET_MAJOR*10000 + MXNET_MINOR*100 + MXNET_PATCH)

 #define MXNET_MAKE_VERSION(major, minor, patch) ((major)*10000 + (minor)*100 + patch)

 #define PROFILER_MESSAGE_FUNCNAME (__FUNCTION__)

 namespace mxnet {
 typedef mshadow::cpu cpu;
 typedef mshadow::gpu gpu;
 typedef mshadow::index_t index_t;
 typedef mshadow::default_real_t real_t;
 using TShape = nnvm::TShape;
 using Op = nnvm::Op;

 struct Context {
   enum DeviceType {
     kCPU = cpu::kDevMask,
     kGPU = gpu::kDevMask,
     kCPUPinned = 3,
     kCPUShared = 5,
   };
   DeviceType dev_type;
   int32_t dev_id;
   Context() : dev_type(kCPU), dev_id(0) {}
   inline DeviceType dev_mask() const {
     if (dev_type == kCPUPinned || dev_type == kCPUShared) return kCPU;
     return dev_type;
   }
   inline int real_dev_id() const {
     if (dev_type == kGPU) return dev_id;
     return 0;
   }
   inline bool operator<(const Context &b) const;
   inline bool operator==(const Context &b) const {
     return dev_type == b.dev_type && dev_id == b.dev_id;
   }
   inline bool operator!=(const Context &b) const {
     return !(*this == b);
   }
   inline void Save(dmlc::Stream *strm) const {
     strm->Write(&dev_type, sizeof(dev_type));
     strm->Write(&dev_id, sizeof(dev_id));
   }
   inline bool Load(dmlc::Stream *strm) {
     if (strm->Read(&dev_type, sizeof(dev_type)) != sizeof(dev_type)) return false;
     if (strm->Read(&dev_id, sizeof(int32_t)) != sizeof(int32_t)) return false;
     return true;
   }
   static const int32_t kMaxDevType = 6;
   static const int32_t kMaxDevID = 16;
   inline static Context Create(DeviceType dev_type, int32_t dev_id = -1);
   inline static Context CPU(int32_t dev_id = 0);
   inline static Context GPU(int32_t dev_id = -1);
   inline static int32_t GetGPUCount();
   inline static void GetGPUMemoryInformation(int dev, uint64_t *free, uint64_t *total);
   inline static Context CPUPinned(int32_t dev_id = -1);
   inline static Context CPUShared(int32_t dev_id = 0);
   inline static Context FromString(const std::string& str);
 };

 struct RunContext {
   Context ctx;
   void *stream;
   template<typename xpu>
   inline mshadow::Stream<xpu>* get_stream() const {
     return static_cast<mshadow::Stream<xpu>*>(stream);
   }
   inline const Context& get_ctx() const {
     return ctx;
   }
 };
 }  // namespace mxnet

 namespace mxnet {
 // implementing Context
 inline bool Context::operator<(const Context &b) const {
   if (dev_type == b.dev_type) {
     return dev_id < b.dev_id;
   } else {
     return dev_type < b.dev_type;
   }
 }
 inline Context Context::Create(DeviceType dev_type, int32_t dev_id) {
   Context ctx;
   ctx.dev_type = dev_type;
   if (dev_id < 0) {
     ctx.dev_id = 0;
     if (dev_type & kGPU) {
 #if MXNET_USE_CUDA
       CHECK_EQ(cudaGetDevice(&ctx.dev_id), cudaSuccess);
 #else
       LOG(FATAL) << "Please compile with CUDA enabled for cuda features";
 #endif
     }
   } else {
     ctx.dev_id = dev_id;
   }
   return ctx;
 }
 inline Context Context::CPU(int32_t dev_id) {
   return Create(kCPU, dev_id);
 }

 inline Context Context::CPUPinned(int32_t dev_id) {
   return Create(kCPUPinned, dev_id);
 }

 inline Context Context::CPUShared(int32_t dev_id) {
   return Create(kCPUShared, dev_id);
 }

 inline Context Context::GPU(int32_t dev_id) {
   return Create(kGPU, dev_id);
 }

 inline int32_t Context::GetGPUCount() {
 #if MXNET_USE_CUDA
   int32_t count;
   cudaError_t e = cudaGetDeviceCount(&count);
   if (e == cudaErrorNoDevice) {
     return 0;
   }
   CHECK_EQ(e, cudaSuccess) << " CUDA: " << cudaGetErrorString(e);
   return count;
 #else
   return 0;
 #endif
 }

 inline void Context::GetGPUMemoryInformation(int dev, uint64_t *free_mem,
                                              uint64_t *total_mem) {
 #if MXNET_USE_CUDA

   size_t memF, memT;
   cudaError_t e;

   int curDevice;
   e = cudaGetDevice(&curDevice);
   CHECK_EQ(e, cudaSuccess) << " CUDA: " << cudaGetErrorString(e);

   e = cudaSetDevice(dev);
   CHECK_EQ(e, cudaSuccess) << " CUDA: " << cudaGetErrorString(e);

   e = cudaMemGetInfo(&memF, &memT);
   CHECK_EQ(e, cudaSuccess) << " CUDA: " << cudaGetErrorString(e);

   e = cudaSetDevice(curDevice);
   CHECK_EQ(e, cudaSuccess) << " CUDA: " << cudaGetErrorString(e);

   *free_mem = static_cast<uint64_t>(memF);
   *total_mem = static_cast<uint64_t>(memT);

 #else
   LOG(FATAL)
       << "This call is only supported for MXNet built with CUDA support.";
 #endif
 }

 inline Context Context::FromString(const std::string& str) {
   Context ret;
   try {
     const std::string::size_type l = str.find('(');
     CHECK_NE(l, std::string::npos);
     const std::string::size_type r = str.find(')');
     CHECK_EQ(r, str.length()-1);

     const std::string type = str.substr(0, l);
     int id = std::stoi(str.substr(l+1, r-l-1));
     if (type == "cpu") {
       ret = CPU(id);
     } else if (type == "gpu") {
       ret = GPU(id);
     } else if (type == "cpu_pinned") {
       ret = CPUPinned(id);
     } else if (type == "cpu_shared") {
       ret = CPUShared(id);
     } else {
       LOG(FATAL) << "Invalid context string " << str;
     }
   } catch (...) {
     LOG(FATAL) << "Invalid context string " << str;
   }
   return ret;
 }

 inline std::ostream& operator<<(std::ostream &out, const Context &ctx) {
   if (ctx.dev_type == Context::kCPU) {
     out << "cpu(";
   } else if (ctx.dev_type == Context::kGPU) {
     out << "gpu(";
   } else if (ctx.dev_type == Context::kCPUPinned) {
     out << "cpu_pinned(";
   } else if (ctx.dev_type == Context::kCPUShared) {
     out << "cpu_shared(";
   } else {
     out << "unknown(";
   }
   out << ctx.dev_id << ")";
   return out;
 }

 // describe op registration point
 #define STRINGIZE_DETAIL(x) #x
 #define STRINGIZE(x) STRINGIZE_DETAIL(x)
 #define MXNET_DESCRIBE(...) describe(__VA_ARGS__ "\n\nFrom:" __FILE__ ":" STRINGIZE(__LINE__))
 #define ADD_FILELINE "\n\nDefined in " __FILE__ ":L" STRINGIZE(__LINE__)

 #if MXNET_USE_MKLDNN == 1
 constexpr size_t kMKLDNNAlign = 64;
 #endif

 }  // namespace mxnet

 namespace std {
 template<> struct hash<mxnet::Context> {
   size_t operator()(const mxnet::Context& ctx) const {
     size_t res = 0;
     res = dmlc::HashCombine(res, static_cast<size_t>(ctx.dev_type));
     res = dmlc::HashCombine(res, static_cast<size_t>(ctx.dev_id));
     return res;
   }
 };
 }

 #include "./tensor_blob.h"
 #endif  // MXNET_BASE_H_
mxnet::Context::dev_mask
DeviceType dev_mask() const
Get corresponding device mask.
Definition: base.h:151

mxnet::Context::kMaxDevID
static const int32_t kMaxDevID
the maximal device index
Definition: base.h:205

mxnet
namespace of mxnet
Definition: base.h:118

mxnet::Context::GetGPUMemoryInformation
static void GetGPUMemoryInformation(int dev, uint64_t *free, uint64_t *total)
get the free and total available memory on a GPU

mxnet::RunContext::get_stream
mshadow::Stream< xpu > * get_stream() const
get mshadow stream from Context
Definition: base.h:270

mxnet::Context::GetGPUCount
static int32_t GetGPUCount()

mxnet::Context::Load
bool Load(dmlc::Stream *strm)
load the content from binary stream
Definition: base.h:197

mxnet::real_t
mshadow::default_real_t real_t
data type that will be used to store ndarray
Definition: base.h:126

mxnet::Context::GPU
static Context GPU(int32_t dev_id=-1)

mxnet::TShape
nnvm::TShape TShape
Shape data structure used to record shape information.
Definition: base.h:128

mxnet::RunContext::ctx
Context ctx
base Context
Definition: base.h:259

mxnet::Context::operator<
bool operator<(const Context &b) const
Comparator, used to enable Context as std::map key.

mxnet::Context::kMaxDevType
static const int32_t kMaxDevType
the maximal device type
Definition: base.h:203

mxnet::RunContext
execution time context. The information needed in runtime for actual execution.
Definition: base.h:257

mxnet::Context::dev_type
DeviceType dev_type
the device type we run the op on
Definition: base.h:142

mxnet::Context::kCPU
Definition: base.h:136

mxnet::Context::dev_id
int32_t dev_id
device id we are going to run it on
Definition: base.h:144

mxnet::Context::kCPUPinned
Definition: base.h:138

mxnet::RunContext::stream
void * stream
the stream of the device, can be NULL or Stream<gpu>* in GPU mode
Definition: base.h:263

mxnet::Context::Save
void Save(dmlc::Stream *strm) const
save the content into binary stream
Definition: base.h:188

mxnet::gpu
mshadow::gpu gpu
mxnet gpu
Definition: base.h:122

mxnet::RunContext::get_ctx
const Context & get_ctx() const
get the base Context from RunContext
Definition: base.h:274

mxnet::Context::kGPU
Definition: base.h:137

mxnet::Context::DeviceType
DeviceType
Type of device.
Definition: base.h:135

mxnet::Context::CPUShared
static Context CPUShared(int32_t dev_id=0)

mxnet::cpu
mshadow::cpu cpu
mxnet cpu
Definition: base.h:120

mxnet::Context::real_dev_id
int real_dev_id() const
Returns dev_id for kGPU, 0 otherwise.
Definition: base.h:158

mxnet::Op
nnvm::Op Op
operator structure from NNVM
Definition: base.h:130

mxnet::Context::Context
Context()
default constructor
Definition: base.h:146

mxnet::Context::Create
static Context Create(DeviceType dev_type, int32_t dev_id=-1)
Create a new context.

mxnet::Context::operator!=
bool operator!=(const Context &b) const
check if current context not equals another one
Definition: base.h:181

mxnet::Context::CPU
static Context CPU(int32_t dev_id=0)

mxnet::cpp::operator<<
std::ostream & operator<<(std::ostream &out, const NDArray &ndarray)

mxnet::Context::CPUPinned
static Context CPUPinned(int32_t dev_id=-1)

mxnet::Context::kCPUShared
Definition: base.h:139

mxnet::Context::FromString
static Context FromString(const std::string &str)

mxnet::index_t
mshadow::index_t index_t
index type usually use unsigned
Definition: base.h:124

tensor_blob.h
TBlob class that holds common representation of arbirary dimension tensor, can be used to transformed...

mxnet::Context
Context information about the execution environment.
Definition: base.h:133

mxnet::Context::operator==
bool operator==(const Context &b) const
check if current context equals another one
Definition: base.h:173

mxnet::cpp::index_t
unsigned index_t
Definition: base.h:37