forked from Mengjintao/FastCNN
-
Notifications
You must be signed in to change notification settings - Fork 0
/
conv_layer.h
149 lines (117 loc) · 4.49 KB
/
conv_layer.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
//Tencent is pleased to support the open source community by making FeatherCNN available.
//Copyright (C) 2018 THL A29 Limited, a Tencent company. All rights reserved.
//Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
//in compliance with the License. You may obtain a copy of the License at
//
//https://opensource.org/licenses/BSD-3-Clause
//
//Unless required by applicable law or agreed to in writing, software distributed
//under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
//CONDITIONS OF ANY KIND, either express or implied. See the License for the
//specific language governing permissions and limitations under the License.
#pragma once
//#include "../layer.h"
#include "./utility/helper.h"
#include "./utility/common.h"
#include <assert.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <omp.h>
class ConvLayer
{
public:
ConvLayer(float *input, float *kernel, float *biasw, float *output_ref, size_t ic, size_t ih, size_t iw, size_t oc, size_t kh=3, size_t kw=3, size_t sh=1, size_t sw=1, size_t pad_left=1, size_t pad_right=1, size_t pad_top=1, size_t pad_bottom=1, size_t g=1, bool bias=0, size_t nt = 1, size_t iter = 10)
{
num_threads = nt;
iterations = iter;
omp_set_num_threads(num_threads);
//Input
input_channels = ic;
input_height = ih;
input_width = iw;
input_data = input;
//Kernel
output_channels=oc;
kernel_height = kh;
kernel_width = kw;
kernel_data = kernel;
//Bias
bias_term = bias;
if(bias_term) bias_data = biasw;
else bias_data = NULL;
group = g;
stride_height = sh;
stride_width = sw;
padding_left = pad_left;
padding_top = pad_top;
padding_right = pad_right;
padding_bottom = pad_bottom;
if(group == 0 || stride_width == 0 || stride_height == 0)
assert(!(group == 0 || stride_width == 0 || stride_height == 0));
//Output
this->output_ref = output_ref;
output_width = (input_width + padding_left + padding_right - kernel_width) / stride_width + 1;
output_height = (input_height + padding_top + padding_bottom - kernel_height) / stride_height + 1;
input_data = (float *) malloc(input_channels * input_width * input_height * sizeof(float));
kernel_data = (float *) malloc((input_channels * output_channels * kw * kh + 16) * sizeof(float));
bias_data = (float *) malloc(output_channels * output_width * output_height * sizeof(float));
memcpy(input_data, input, input_channels * input_width * input_height * sizeof(float));
memcpy(kernel_data, kernel, input_channels * output_channels * kw * kh * sizeof(float));
if(biasw)
memcpy(bias_data, biasw, output_channels * output_width * output_height * sizeof(float));
output_data = (float *) malloc(output_channels * output_width * output_height * sizeof(float));
//output_data should assert
}
~ConvLayer()
{
free(input_data);
free(kernel_data);
free(bias_data);
free(output_data);
input_data = NULL;
kernel_data = NULL;
output_data = NULL;
bias_data = NULL;
}
int get_output_height() {
return this->output_height;
}
int get_output_width() {
return this->output_width;
}
virtual int Init()
{
return -1;
}
virtual int Forward()
{
return -1;
}
virtual int Tuning()
{
return -1;
}
float *output_data;
protected:
size_t input_channels;
size_t input_width;
size_t input_height;
size_t output_channels;
size_t output_width;
size_t output_height;
size_t kernel_width;
size_t kernel_height;
size_t stride_width;
size_t stride_height;
size_t padding_left;
size_t padding_right;
size_t padding_top;
size_t padding_bottom;
size_t group;
bool bias_term;
size_t num_threads;
size_t iterations;
float *input_data;
float *kernel_data;
float *bias_data;
float *output_ref;
};