1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74
|
/******************************************************************************
* Copyright (c) Intel Corporation - All rights reserved. *
* This file is part of the LIBXSMM library. *
* *
* For information on the license, see the LICENSE file. *
* Further information: https://github.com/hfp/libxsmm/ *
* SPDX-License-Identifier: BSD-3-Clause *
******************************************************************************/
/* Sasikanth Avancha, Dhiraj Kalamkar (Intel Corp.)
******************************************************************************/
#pragma once
#include <omp.h>
#include <assert.h>
#include <sys/time.h>
#include "common.hpp"
#include "check.hpp"
#include "Tensor.hpp"
/* Parameter record handed to a ReLUImpl (see the ReLUImpl constructor).
 * NOTE(review): the per-field notes below are inferred from the field names
 * only -- confirm against the code that fills this structure in. */
struct ReLUImplParams {
  string node_name;      /* presumably the name of the owning node */

  int bdims;             /* presumably dimension count of the bottom (input) tensor */
  int tdims;             /* presumably dimension count of the top (output) tensor */

  int nInput;            /* presumably number of input feature maps */
  int nOutput;           /* presumably number of output feature maps */

  /* presumably the input extents */
  int iDepth;
  int iHeight;
  int iWidth;

  /* presumably the output extents */
  int oDepth;
  int oHeight;
  int oWidth;

  int batch_size;
  float negative_slope;  /* presumably the slope used for negative inputs */
  int data_type;
  int algType;
  int num_threads;
};
/**
 * Abstract interface for ReLU implementations.
 *
 * Stores the parameter block pointer and the engine id passed to the
 * constructor. Concrete implementations must provide the per-thread
 * forwardPropagate()/backPropagate() overloads (the ones taking `tid`).
 * The overloads without `tid` are convenience wrappers that forward to the
 * per-thread versions with tid 0 when the engine is XSMM.
 */
class ReLUImpl
{
  protected:
    // Parameter block given at construction; the pointer is stored as-is and
    // is never freed by this class.
    ReLUImplParams *gp;
    // Engine id given at construction; selects the path in the wrappers below.
    int engine;
    // NOTE(review): the layout types are not initialized by this class --
    // presumably set by derived classes before use; confirm.
    TensorLayoutType bot_layout_type, top_layout_type, gbot_layout_type;
    // Opaque layout handles; default to null so they are never indeterminate.
    void *bot_layout = nullptr;
    void *top_layout = nullptr;
    void *gbot_layout = nullptr;
    // Compute-engine ids of the neighbouring tensors; -1 until set via the
    // setters below.
    int top_compute_engine=-1;
    int bot_compute_engine=-1;

  public:
    /**
     * @param gp_     parameter block; only the pointer is kept.
     * @param engine_ engine id used by the tid-less wrappers.
     */
    ReLUImpl(ReLUImplParams* gp_, int engine_): gp(gp_), engine(engine_) {}

    // This is a polymorphic base: a virtual destructor makes deleting a
    // derived object through a ReLUImpl pointer well-defined.
    virtual ~ReLUImpl() = default;

    void set_top_compute_engine(int e) { top_compute_engine = e;}
    void set_bot_compute_engine(int e) { bot_compute_engine = e;}

    // Assume external threading, e.g., #pragma omp
    virtual void forwardPropagate(TensorBuf *inp, TensorBuf *outp, int tid) = 0;
    virtual void backPropagate(TensorBuf* inp, TensorBuf *deloutp, TensorBuf *delinp, int tid) = 0;

    /**
     * Forward pass without an explicit thread id.
     * For engine == XSMM this calls the per-thread overload with tid 0;
     * for any other engine value it does nothing.
     */
    virtual void forwardPropagate(TensorBuf *inp, TensorBuf *outp)
    {
      switch(engine)
      {
        case XSMM:
          forwardPropagate(inp, outp, 0);
          break;
        default:
          // Other engines are intentionally a no-op here (unchanged behaviour).
          break;
      }
    }

    /**
     * Backward pass without an explicit thread id.
     * For engine == XSMM this calls the per-thread overload with tid 0;
     * for any other engine value it does nothing.
     */
    virtual void backPropagate(TensorBuf* inp, TensorBuf *deloutp, TensorBuf *delinp)
    {
      switch(engine)
      {
        case XSMM:
          backPropagate(inp, deloutp, delinp, 0);
          break;
        default:
          // Other engines are intentionally a no-op here (unchanged behaviour).
          break;
      }
    }
};
|