# Copyright 2018 The MACE Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import math

import numpy as np
import six

from transform.transformer import Transformer
from transform.base_converter import DataFormat
from transform.base_converter import MaceOp
from transform.base_converter import MaceKeyword
from transform.base_converter import ConverterUtil
from utils.util import mace_check


class ShapeInference(object):
    """Currently we only use this to infer Caffe op shapes; TensorFlow op
       shapes are inferred with the TensorFlow engine itself, since
       TensorFlow has too many ops."""

    def __init__(self, net, input_nodes):
        self._op_shape_inference = {
            MaceOp.Conv2D.name: self.infer_shape_conv_pool_shape,
            MaceOp.Deconv2D.name: self.infer_shape_deconv,
            MaceOp.DepthwiseConv2d.name: self.infer_shape_conv_pool_shape,
            MaceOp.DepthwiseDeconv2d.name: self.infer_shape_deconv,
            MaceOp.Eltwise.name: self.infer_shape_eltwise,
            MaceOp.BatchNorm.name: self.infer_shape_general,
            MaceOp.GroupNorm.name: self.infer_shape_general,
            MaceOp.AddN.name: self.infer_shape_general,
            MaceOp.Activation.name: self.infer_shape_general,
            MaceOp.Pooling.name: self.infer_shape_conv_pool_shape,
            MaceOp.Concat.name: self.infer_shape_concat,
            MaceOp.Split.name: self.infer_shape_slice,
            MaceOp.Softmax.name: self.infer_shape_general,
            MaceOp.FullyConnected.name: self.infer_shape_fully_connected,
            MaceOp.Crop.name: self.infer_shape_crop,
            MaceOp.BiasAdd.name: self.infer_shape_general,
            MaceOp.ChannelShuffle.name: self.infer_shape_channel_shuffle,
            MaceOp.Transpose.name: self.infer_shape_permute,
            MaceOp.PriorBox.name: self.infer_shape_prior_box,
            MaceOp.Reshape.name: self.infer_shape_reshape,
            MaceOp.ResizeBilinear.name: self.infer_shape_resize_bilinear,
            MaceOp.LpNorm.name: self.infer_shape_general,
            MaceOp.MVNorm.name: self.infer_shape_general,
            MaceOp.ResizeNearestNeighbor.name:
                self.infer_shape_nearest_neighbor,
            MaceOp.ArgMax.name: self.infer_shape_argmax,
        }

        self._net = net
        self._output_shape_cache = {}
        for input_node in input_nodes:
            input_shape = input_node.shape[:]
            # transpose input from NHWC to NCHW
            Transformer.transpose_shape(input_shape, [0, 3, 1, 2])
            self._output_shape_cache[input_node.name] = input_shape
        for tensor in net.tensors:
            self._output_shape_cache[tensor.name] = list(tensor.dims)

    def run(self):
        for op in self._net.op:
            mace_check(op.type in self._op_shape_inference,
                       "Mace does not support caffe op type %s yet"
                       % op.type)
            self._op_shape_inference[op.type](op)

    def add_output_shape(self, op, shapes):
        mace_check(len(op.output) == len(shapes),
                   "Op %s (%s) output count is different from "
                   "output shape count" % (op.name, op.type))
        for i in six.moves.range(len(shapes)):
            output_name = op.output[i]
            output_shape = op.output_shape.add()
            output_shape.dims.extend(shapes[i])
            self._output_shape_cache[output_name] = shapes[i]

    def infer_shape_general(self, op):
        if len(op.input) > 0:
            mace_check(op.input[0] in self._output_shape_cache,
                       "Op %s input %s does not exist"
                       % (op.name, op.input[0]))
            input_shape = self._output_shape_cache[op.input[0]]
            self.add_output_shape(op, [input_shape])
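
    # The conv/pool inference below uses the usual output-size formula
    #   out = round_func((in + pad_total - effective_kernel) / stride) + 1,
    # with effective_kernel = kernel + (kernel - 1) * (dilation - 1); here
    # paddings[] is assumed to hold the total (both-sides) padding per axis.
    # Illustrative numbers (not taken from any model): in = 224,
    # pad_total = 2, kernel = 3, dilation = 1, stride = 2 and
    # round_func = floor give floor((224 + 2 - 3) / 2) + 1 = 112.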

    def infer_shape_conv_pool_shape(self, op):
        input_shape = self._output_shape_cache[op.input[0]]
        output_shape = np.zeros_like(input_shape)
        if op.type == MaceOp.Pooling:
            filter_shape = list(
                ConverterUtil.get_arg(op, MaceKeyword.mace_kernel_str).ints)
            if ConverterUtil.data_format(op) == DataFormat.NCHW:
                filter_shape = [input_shape[1], input_shape[1]] + filter_shape
                if ConverterUtil.get_arg(op,
                                         MaceKeyword.mace_global_pooling_str) \
                        is not None:
                    filter_shape[2] = input_shape[2]
                    filter_shape[3] = input_shape[3]
            else:  # NHWC
                filter_shape = filter_shape + [input_shape[1], input_shape[1]]
                if ConverterUtil.get_arg(op,
                                         MaceKeyword.mace_global_pooling_str) \
                        is not None:
                    filter_shape[0] = input_shape[1]
                    filter_shape[1] = input_shape[2]
        else:
            filter_shape = self._output_shape_cache[op.input[1]]

        paddings = ConverterUtil.get_arg(op, MaceKeyword.mace_padding_values_str).ints  # noqa
        strides = ConverterUtil.get_arg(op, MaceKeyword.mace_strides_str).ints
        dilations_arg = ConverterUtil.get_arg(op,
                                              MaceKeyword.mace_dilations_str)
        if dilations_arg is not None:
            dilations = dilations_arg.ints
        else:
            dilations = [1, 1]
        if op.type == MaceOp.Pooling:
            round_func = math.ceil
        else:
            round_func = math.floor

        output_shape[0] = input_shape[0]
        if ConverterUtil.data_format(op) == DataFormat.NCHW \
                and ConverterUtil.filter_format(self._net) == DataFormat.OIHW:
            # filter format: OIHW
            if op.type == MaceOp.DepthwiseConv2d.name:
                output_shape[1] = filter_shape[0] * filter_shape[1]
            else:
                output_shape[1] = filter_shape[0]
            output_shape[2] = int(
                round_func((input_shape[2] + paddings[0] - filter_shape[2] -
                            (filter_shape[2] - 1) *
                            (dilations[0] - 1)) / float(strides[0]))) + 1
            output_shape[3] = int(
                round_func((input_shape[3] + paddings[1] - filter_shape[3] -
                            (filter_shape[3] - 1) *
                            (dilations[1] - 1)) / float(strides[1]))) + 1
        else:
            mace_check(False,
                       "Mace can only infer shape for"
                       " NCHW input and OIHW filter")

        self.add_output_shape(op, [output_shape])

    def infer_shape_deconv(self, op):
        input_shape = self._output_shape_cache[op.input[0]]
        output_shape = np.zeros_like(input_shape)
        filter_shape = self._output_shape_cache[op.input[1]]

        paddings = ConverterUtil.get_arg(op, MaceKeyword.mace_padding_values_str).ints  # noqa
        strides = ConverterUtil.get_arg(op, MaceKeyword.mace_strides_str).ints
        dilations_arg = ConverterUtil.get_arg(op,
                                              MaceKeyword.mace_dilations_str)
        if dilations_arg is not None:
            dilations = dilations_arg.ints
        else:
            dilations = [1, 1]
        round_func = math.floor

        group_arg = ConverterUtil.get_arg(op,
                                          MaceKeyword.mace_group_str)
        output_shape[0] = input_shape[0]
        if ConverterUtil.data_format(op) == DataFormat.NCHW \
                and ConverterUtil.filter_format(self._net) == DataFormat.OIHW:
            # filter format: IOHW
            output_shape[1] = filter_shape[1]
            if group_arg is not None and group_arg.i > 1:
                output_shape[1] = group_arg.i * filter_shape[1]
            output_shape[2] = int(
                round_func((input_shape[2] - 1) * strides[0] +
                           (filter_shape[2] - 1) * (dilations[0] - 1) +
                           filter_shape[2] - paddings[0]))
            output_shape[3] = int(
                round_func((input_shape[3] - 1) * strides[1] +
                           (filter_shape[3] - 1) * (dilations[1] - 1) +
                           filter_shape[3] - paddings[1]))
        else:
            mace_check(False,
                       "Mace can only infer shape for"
                       " NCHW input and OIHW filter")

        print("deconv layer %s (%s) input:%s filter:%s output:%s" %
              (op.name, op.type, input_shape, filter_shape, output_shape))

        self.add_output_shape(op, [output_shape])
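
    # Sanity check for the deconv formula above, with illustrative numbers
    # only:
    #   out = (in - 1) * stride + (kernel - 1) * (dilation - 1)
    #         + kernel - pad_total,
    # so in = 14, stride = 2, kernel = 4, dilation = 1, pad_total = 2 gives
    # (14 - 1) * 2 + 0 + 4 - 2 = 28, the familiar 2x-upsampling deconvolution.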

    def infer_shape_concat(self, op):
        output_shape = list(self._output_shape_cache[op.input[0]])
        axis = ConverterUtil.get_arg(op, MaceKeyword.mace_axis_str).i
        if axis < 0:
            axis = len(output_shape) + axis
        output_shape[axis] = 0
        for input_node in op.input:
            input_shape = list(self._output_shape_cache[input_node])
            output_shape[axis] = output_shape[axis] + input_shape[axis]
        self.add_output_shape(op, [output_shape])

    def infer_shape_slice(self, op):
        output_shape = self._output_shape_cache[op.input[0]]
        axis = ConverterUtil.get_arg(op, MaceKeyword.mace_axis_str).i
        output_shape[axis] = int(output_shape[axis] / len(op.output))
        output_shapes = []
        for _ in op.output:
            output_shapes.append(output_shape)
        self.add_output_shape(op, output_shapes)

    def infer_shape_fully_connected(self, op):
        input_shape = self._output_shape_cache[op.input[0]]
        weight_shape = self._output_shape_cache[op.input[1]]
        if ConverterUtil.data_format(op) == DataFormat.NCHW:
            output_shape = [input_shape[0], weight_shape[0], 1, 1]
        else:
            mace_check(False, "format %s is not supported"
                       % ConverterUtil.data_format(op))
        self.add_output_shape(op, [output_shape])

    def infer_shape_crop(self, op):
        mace_check(len(op.input) == 2, "crop layer needs two inputs")
        output_shape = self._output_shape_cache[op.input[0]]
        input1_shape = self._output_shape_cache[op.input[1]]
        offsets = ConverterUtil.get_arg(op, MaceKeyword.mace_offset_str).ints
        for i in range(len(offsets)):
            if offsets[i] >= 0:
                output_shape[i] = input1_shape[i]
        self.add_output_shape(op, [output_shape])

    def infer_shape_channel_shuffle(self, op):
        output_shape = self._output_shape_cache[op.input[0]]
        self.add_output_shape(op, [output_shape])

    def infer_shape_permute(self, op):
        output_shape = list(self._output_shape_cache[op.input[0]])
        dims = ConverterUtil.get_arg(op, MaceKeyword.mace_dims_str).ints
        for i in six.moves.range(len(dims)):
            output_shape[i] = self._output_shape_cache[op.input[0]][dims[i]]
        self.add_output_shape(op, [output_shape])

    def infer_shape_prior_box(self, op):
        output_shape = [1, 2, 1]
        input_shape = list(self._output_shape_cache[op.input[0]])
        input_w = input_shape[3]
        input_h = input_shape[2]
        min_size = \
            ConverterUtil.get_arg(op, MaceKeyword.mace_min_size_str).floats
        max_size = \
            ConverterUtil.get_arg(op, MaceKeyword.mace_max_size_str).floats
        aspect_ratio = \
            ConverterUtil.get_arg(op, MaceKeyword.mace_aspect_ratio_str).floats
        num_prior = len(aspect_ratio) * len(min_size) + len(max_size)

        output_shape[2] = int(num_prior * input_h * input_w * 4)
        self.add_output_shape(op, [output_shape])
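
    # Caffe Reshape semantics handled below: in the `dim` list a 0 copies the
    # corresponding input dimension and a -1 is inferred from the remaining
    # element count. Illustrative example: input [1, 8, 3, 3] (72 elements)
    # with dim = [0, -1, 9] gives [1, 8, 9]. Without `dim` the op flattens:
    # axis = 1, end_axis = -1 on the same input collapses dims 1..3 into one
    # dimension, giving [1, 72].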

    def infer_shape_reshape(self, op):
        if ConverterUtil.get_arg(op, MaceKeyword.mace_dim_str) is not None:
            dim = ConverterUtil.get_arg(op, MaceKeyword.mace_dim_str).ints
            output_shape = list(dim)
            product = input_size = 1
            idx = -1
            for i in range(len(self._output_shape_cache[op.input[0]])):
                input_size *= self._output_shape_cache[op.input[0]][i]
            for i in range(len(dim)):
                if dim[i] == 0:
                    output_shape[i] = self._output_shape_cache[op.input[0]][i]
                    product *= self._output_shape_cache[op.input[0]][i]
                elif dim[i] == -1:
                    idx = i
                    output_shape[i] = 1
                else:
                    output_shape[i] = dim[i]
                    product *= dim[i]
            if idx != -1:
                output_shape[idx] = int(input_size / product)
            self.add_output_shape(op, [output_shape])
        else:
            output_shape = []
            axis = ConverterUtil.get_arg(op, MaceKeyword.mace_axis_str).i
            end_axis = ConverterUtil.get_arg(op,
                                             MaceKeyword.mace_end_axis_str).i
            end_axis = end_axis if end_axis > 0 else end_axis + len(
                list(self._output_shape_cache[op.input[0]]))
            dim = 1
            for i in range(0, axis):
                output_shape.append(self._output_shape_cache[op.input[0]][i])
            for i in range(axis, end_axis + 1):
                dim *= self._output_shape_cache[op.input[0]][i]
            output_shape.append(-1)
            for i in range(end_axis + 1, len(
                    list(self._output_shape_cache[op.input[0]]))):
                output_shape.append(self._output_shape_cache[op.input[0]][i])
            output_shape[axis] = dim
            self.add_output_shape(op, [output_shape])

    def infer_shape_resize_bilinear(self, op):
        input_shape = self._output_shape_cache[op.input[0]]
        size = ConverterUtil.get_arg(
            op, MaceKeyword.mace_resize_size_str).ints
        if ConverterUtil.data_format(op) == DataFormat.NCHW:
            output_shape = [input_shape[0], input_shape[1], size[0], size[1]]
        elif ConverterUtil.data_format(op) == DataFormat.NHWC:
            output_shape = [input_shape[0], size[0], size[1], input_shape[3]]
        else:
            output_shape = []
            mace_check(False, "format %s is not supported"
                       % ConverterUtil.data_format(op))

        self.add_output_shape(op, [output_shape])

    def infer_shape_nearest_neighbor(self, op):
        input_shape = self._output_shape_cache[op.input[0]]
        height_scale = \
            ConverterUtil.get_arg(op, MaceKeyword.mace_height_scale_str).f
        width_scale = \
            ConverterUtil.get_arg(op, MaceKeyword.mace_width_scale_str).f
        if ConverterUtil.data_format(op) == DataFormat.NCHW:
            output_shape = [input_shape[0], input_shape[1],
                            int(input_shape[2] * height_scale),
                            int(input_shape[3] * width_scale)]
        elif ConverterUtil.data_format(op) == DataFormat.NHWC:
            # NHWC: scale the H (index 1) and W (index 2) dimensions
            output_shape = [input_shape[0],
                            int(input_shape[1] * height_scale),
                            int(input_shape[2] * width_scale),
                            input_shape[3]]
        else:
            output_shape = []
            mace_check(False, "format %s is not supported"
                       % ConverterUtil.data_format(op))

        self.add_output_shape(op, [output_shape])

    def infer_shape_argmax(self, op):
        input_shape = self._output_shape_cache[op.input[0]]
        output_dim_num = len(input_shape)
        if output_dim_num < 3:
            output_dim_num = 3

        axis_arg = ConverterUtil.get_arg(op, MaceKeyword.mace_axis_str)
        has_axis = (axis_arg is not None)
        axis_value = 0
        if has_axis:
            axis_value = axis_arg.i
            if axis_value < 0:
                axis_value = len(input_shape) + axis_value

        top_k = ConverterUtil.get_arg(op, MaceKeyword.mace_top_k_str).i
        mace_check(top_k >= 1, "Invalid top_k value")
        out_val = ConverterUtil.get_arg(op, MaceKeyword.mace_out_val_str).i

        if has_axis:  # Produces max_ind or max_val per axis
            output_shape = input_shape
            output_shape[axis_value] = top_k
        else:
            output_shape = [1] * output_dim_num
            output_shape[0] = input_shape[0]
            output_shape[2] = top_k
            if out_val:  # Produces max_ind and max_val
                output_shape[1] = 2

        self.add_output_shape(op, [output_shape])

    def infer_shape_eltwise(self, op):
        input_num = len(op.input)
        mace_check(input_num > 0, "input num should be > 0")
        max_idx = 0
        max_input_size = 0
        for i in range(0, input_num):
            mace_check(op.input[i] in self._output_shape_cache,
                       "Op %s input %s does not exist"
                       % (op.name, op.input[i]))
            input_shape = self._output_shape_cache[op.input[i]]
            input_size = 1
            for k in range(0, len(input_shape)):
                input_size *= input_shape[k]
            if input_size > max_input_size:
                max_idx = i
                max_input_size = input_size
        input_max_shape = self._output_shape_cache[op.input[max_idx]]
        self.add_output_shape(op, [input_max_shape])
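

# A minimal usage sketch. In MACE the Caffe converter constructs and drives
# this class, so the exact call site may differ; `net_def` and `input_nodes`
# below are assumed to come from that converter:
#
#     inference = ShapeInference(net_def, input_nodes)
#     inference.run()
#
# After run(), every op in `net_def` has its output_shape field filled in,
# and the internal cache maps each tensor name to its inferred shape.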