#include "caffe2/quantization/server/resize_nearest_dnnlowp_op.h"

namespace caffe2 {

template <typename T>
bool ResizeNearestDNNLowPOp<T>::RunOnDevice() {
  using namespace dnnlowp;

  this->ParseDNNLowPOperatorArguments_();

  // Choose quantization params
  in_qparams_[0] =
      GetInputTensorQuantizationParamsOf(this, 0, qfactory_.get());
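  // Note (general dnnlowp convention, not specific to this operator): a
  // quantized value q with parameters (scale, zero_point) represents the
  // real value
  //   real ~= scale * (q - zero_point).
  // Nearest-neighbor resize only duplicates existing quantized values, so the
  // input parameters can be reused verbatim for the output; see
  // PropagateOutputTensorQuantizationParams below.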
const auto& X = InputTensorCPU_(0);
auto* Y = OutputTensorCPU_(0);
CAFFE_ENFORCE_EQ(X.ndim(), 4);
const int N = X.dim32(0);
const int IH = X.dim32(1);
const int IW = X.dim32(2);
const int C = X.dim32(3);
const int OW = IW * width_scale_;
const int OH = IH * height_scale_;
Y->Resize(N, OH, OW, C);
const T* X_data = X.template data<T>();
T* Y_data = Y->template mutable_data<T>();

#ifdef _OPENMP
#pragma omp parallel for
#endif
  for (int n = 0; n < N; ++n) {
    for (int y = 0; y < OH; ++y) {
      // Nearest-neighbor mapping: each output row reads the input row at
      // floor(y / height_scale_), clamped to the last valid row.
      const int in_y = std::min((int)(y / height_scale_), (IH - 1));
      for (int x = 0; x < OW; ++x) {
        const int in_x = std::min((int)(x / width_scale_), (IW - 1));
        // In NHWC layout the C channel values of one (y, x) position are
        // contiguous, so a single memcpy copies the whole pixel.
        std::memcpy(
            &Y_data[((n * OH + y) * OW + x) * C],
            &X_data[((n * IH + in_y) * IW + in_x) * C],
            C * sizeof(T));
      }
    }
  }
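
  // Worked example of the mapping above (illustrative numbers, not taken from
  // this file): with height_scale_ == 2 and IH == 3, OH is 6 and output rows
  // y = 0..5 read input rows in_y = 0, 0, 1, 1, 2, 2, i.e. every input row is
  // duplicated twice along the output height.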

  // Even if there are pre-chosen quantization parameters for the output, they
  // are ignored, because the output of a nearest-neighbor resize should use
  // the same quantization as its input.
  PropagateOutputTensorQuantizationParams(this, 0, in_qparams_[0]);

  return true;
}

REGISTER_CPU_OPERATOR_WITH_ENGINE(
    Int8ResizeNearest,
    DNNLOWP,
    ResizeNearestDNNLowPOp<uint8_t>);
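
// A minimal usage sketch (an assumption for illustration, not part of this
// file): constructing the operator with the CreateOperatorDef / MakeArgument
// helpers from caffe2/utils/proto_utils.h, with hypothetical blob names and
// 2x upscaling. The scale arguments mirror the regular ResizeNearest op.
//
//   OperatorDef def = CreateOperatorDef(
//       "Int8ResizeNearest",
//       "resize",
//       {"X_int8"},
//       {"Y_int8"},
//       {MakeArgument<float>("width_scale", 2.f),
//        MakeArgument<float>("height_scale", 2.f)});
//   def.set_engine("DNNLOWP");
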
} // namespace caffe2