1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78
|
#pragma once
#include "caffe2/core/operator.h"
namespace caffe2 {
template <typename T>
struct FtrlParams {
explicit FtrlParams(OperatorBase* op)
: alphaInv(1.0 / op->GetSingleArgument<float>("alpha", 0.005f)),
beta(op->GetSingleArgument<float>("beta", 1.0f)),
lambda1(op->GetSingleArgument<float>("lambda1", 0.001f)),
lambda2(op->GetSingleArgument<float>("lambda2", 0.001f)) {}
T alphaInv;
T beta;
T lambda1;
T lambda2;
};
// TODO(dzhulgakov): implement GPU version if necessary
template <typename T, class Context>
class FtrlOp final : public Operator<Context> {
public:
USE_OPERATOR_CONTEXT_FUNCTIONS;
FtrlOp(const OperatorDef& operator_def, Workspace* ws)
: Operator<Context>(operator_def, ws), params_(this) {
CAFFE_ENFORCE(
!HasArgument("alpha") || ALPHA >= InputSize(),
"Cannot specify alpha by both input and argument");
}
bool RunOnDevice() override;
protected:
FtrlParams<T> params_;
INPUT_TAGS(VAR, N_Z, GRAD, ALPHA);
OUTPUT_TAGS(OUTPUT_VAR, OUTPUT_N_Z);
};
template <typename T>
class SparseFtrlOp final : public Operator<CPUContext> {
public:
SparseFtrlOp(const OperatorDef& operator_def, Workspace* ws)
: Operator<CPUContext>(operator_def, ws), params_(this) {
CAFFE_ENFORCE(
!HasArgument("alpha") || ALPHA >= InputSize(),
"Cannot specify alpha by both input and argument");
}
bool RunOnDevice() override {
// run time learning rate override
if (ALPHA < InputSize()) {
CAFFE_ENFORCE_EQ(Input(ALPHA).numel(), 1, "alpha should be real-valued");
params_.alphaInv = 1.0 / *(Input(ALPHA).template data<T>());
}
// Use run-time polymorphism
auto& indices = Input(INDICES);
if (indices.template IsType<int32_t>()) {
DoRun<int32_t>();
} else if (indices.template IsType<int64_t>()) {
DoRun<int64_t>();
} else {
LOG(FATAL) << "Unsupported type of INDICES in SparseFtrlOp: "
<< indices.dtype().name();
}
return true;
}
protected:
FtrlParams<T> params_;
INPUT_TAGS(VAR, N_Z, INDICES, GRAD, ALPHA);
OUTPUT_TAGS(OUTPUT_VAR, OUTPUT_N_Z);
private:
template <typename SIndex>
void DoRun();
};
}
|