// Declarations of AVX2-optimized uint8 pooling kernels (namespace caffe2).
#pragma once
#include <cstdint>
namespace caffe2 {

// NOTE(review): only declarations are visible in this header. Parameter
// descriptions below are inferred from the parameter names and should be
// confirmed against the definitions.
//
// All fixed-width integer types are spelled with the std:: qualifier because
// this header includes <cstdint>, which only guarantees the names in
// namespace std.

/**
 * Optimized using AVX2 intrinsics for max pool 2D in NHWC layout.
 *
 * @param Xdata          input buffer (read-only, uint8 elements)
 * @param n              presumably the batch size
 * @param height         presumably the input height
 * @param width          presumably the input width
 * @param channels       presumably the number of channels
 * @param pooled_height  presumably the output height
 * @param pooled_width   presumably the output width
 * @param kernel_h       presumably the pooling window height
 * @param kernel_w       presumably the pooling window width
 * @param stride_h       presumably the vertical stride
 * @param stride_w       presumably the horizontal stride
 * @param pad_t          presumably the top padding
 * @param pad_l          presumably the left padding
 * @param Ydata          output buffer (uint8 elements)
 */
void max_pool_avx2(
    const std::uint8_t* Xdata,
    int n,
    int height,
    int width,
    int channels,
    int pooled_height,
    int pooled_width,
    int kernel_h,
    int kernel_w,
    int stride_h,
    int stride_w,
    int pad_t,
    int pad_l,
    std::uint8_t* Ydata);

/**
 * 2D average pooling counterpart of max_pool_avx2.
 *
 * The geometry parameters (n through pad_l) mirror max_pool_avx2.
 *
 * @param Xdata           input buffer (read-only, uint8 elements)
 * @param Ydata           output buffer (uint8 elements)
 * @param in_scale        presumably the quantization scale of the input
 * @param out_scale       presumably the quantization scale of the output
 * @param in_zero_point   presumably the quantization zero point of the input
 * @param out_zero_point  presumably the quantization zero point of the output
 * @param minimum         presumably the lower clamp bound for results
 * @param maximum         presumably the upper clamp bound for results
 */
void average_pool_avx2(
    const std::uint8_t* Xdata,
    int n,
    int height,
    int width,
    int channels,
    int pooled_height,
    int pooled_width,
    int kernel_h,
    int kernel_w,
    int stride_h,
    int stride_w,
    int pad_t,
    int pad_l,
    std::uint8_t* Ydata,
    float in_scale,
    float out_scale,
    std::int32_t in_zero_point,
    std::int32_t out_zero_point,
    std::int32_t minimum,
    std::int32_t maximum);

/**
 * 3D variant of average_pool_avx2.
 *
 * Adds a depth dimension to the 2D signature: depth, pooled_depth,
 * kernel_d, stride_d and pad_d. The remaining parameters mirror
 * average_pool_avx2.
 *
 * @param Xdata  input buffer (read-only, uint8 elements)
 * @param Ydata  output buffer (uint8 elements)
 */
void average_pool_3d_avx2(
    const std::uint8_t* Xdata,
    int n,
    int height,
    int width,
    int depth,
    int channels,
    int pooled_height,
    int pooled_width,
    int pooled_depth,
    int kernel_h,
    int kernel_w,
    int kernel_d,
    int stride_h,
    int stride_w,
    int stride_d,
    int pad_t,
    int pad_l,
    int pad_d,
    std::uint8_t* Ydata,
    float in_scale,
    float out_scale,
    std::int32_t in_zero_point,
    std::int32_t out_zero_point,
    std::int32_t minimum,
    std::int32_t maximum);

} // namespace caffe2
|