#ifndef CAFFE2_OPERATORS_BATCH_MOMENTS_OP_H_
|
#define CAFFE2_OPERATORS_BATCH_MOMENTS_OP_H_
|
|
#include "caffe2/core/context.h"
|
#include "caffe2/core/logging.h"
|
#include "caffe2/core/operator.h"
|
|
namespace caffe2 {
|
|
template <typename T, class Context>
|
class BatchMomentsOp final : public Operator<Context> {
|
public:
|
USE_OPERATOR_CONTEXT_FUNCTIONS;
|
|
template <class... Args>
|
explicit BatchMomentsOp(Args&&... args)
|
: Operator<Context>(std::forward<Args>(args)...),
|
order_(StringToStorageOrder(
|
this->template GetSingleArgument<std::string>("order", "NCHW"))) {
|
CAFFE_ENFORCE_NE(order_, StorageOrder::UNKNOWN);
|
}
|
|
bool RunOnDevice() override {
|
const auto& X = Input(0);
|
|
const int ndim = X.dim();
|
const int N = X.dim32(0);
|
const int C = order_ == StorageOrder::NCHW ? X.dim32(1) : X.dim32(ndim - 1);
|
const int HxW = X.numel() / (N * C);
|
auto* mu = Output(0, {C}, at::dtype<T>());
|
auto* var = Output(1, {C}, at::dtype<T>());
|
const T* X_data = X.template data<T>();
|
T* mu_data = mu->template mutable_data<T>();
|
T* var_data = var->template mutable_data<T>();
|
return order_ == StorageOrder::NCHW
|
? ComputeBatchMomentsNCHW(N, C, HxW, X_data, mu_data, var_data)
|
: ComputeBatchMomentsNHWC(N, C, HxW, X_data, mu_data, var_data);
|
}
|
|
private:
|
bool ComputeBatchMomentsNCHW(
|
const int N,
|
const int C,
|
const int HxW,
|
const T* X,
|
T* mu,
|
T* var);
|
|
bool ComputeBatchMomentsNHWC(
|
const int N,
|
const int C,
|
const int HxW,
|
const T* X,
|
T* mu,
|
T* var);
|
|
const StorageOrder order_;
|
};
|
|
template <typename T, class Context>
|
class BatchMomentsGradientOp final : public Operator<Context> {
|
public:
|
USE_OPERATOR_CONTEXT_FUNCTIONS;
|
|
template <class... Args>
|
explicit BatchMomentsGradientOp(Args&&... args)
|
: Operator<Context>(std::forward<Args>(args)...),
|
order_(StringToStorageOrder(
|
this->template GetSingleArgument<std::string>("order", "NCHW"))) {
|
CAFFE_ENFORCE_NE(order_, StorageOrder::UNKNOWN);
|
}
|
|
bool RunOnDevice() override {
|
const auto& dmu = Input(0);
|
const auto& dvar = Input(1);
|
const auto& X = Input(2);
|
|
const int ndim = X.dim();
|
const int N = X.dim32(0);
|
const int C = order_ == StorageOrder::NCHW ? X.dim32(1) : X.dim32(ndim - 1);
|
const int HxW = X.numel() / (N * C);
|
auto* dX = Output(0, X.sizes(), at::dtype<T>());
|
const T* dmu_data = dmu.template data<T>();
|
const T* dvar_data = dvar.template data<T>();
|
const T* X_data = X.template data<T>();
|
T* dX_data = dX->template mutable_data<T>();
|
return order_ == StorageOrder::NCHW
|
? ComputeBatchMomentsGradientNCHW(
|
N, C, HxW, dmu_data, dvar_data, X_data, dX_data)
|
: ComputeBatchMomentsGradientNHWC(
|
N, C, HxW, dmu_data, dvar_data, X_data, dX_data);
|
}
|
|
private:
|
bool ComputeBatchMomentsGradientNCHW(
|
const int N,
|
const int C,
|
const int HxW,
|
const T* dmu,
|
const T* dvar,
|
const T* X,
|
T* dX);
|
|
bool ComputeBatchMomentsGradientNHWC(
|
const int N,
|
const int C,
|
const int HxW,
|
const T* dmu,
|
const T* dvar,
|
const T* X,
|
T* dX);
|
|
const StorageOrder order_;
|
};
|
|
} // namespace caffe2
|
|
#endif // CAFFE2_OPERATORS_BATCH_MOMENTS_OP_H_
|