Python source code of BiSeNet (TensorFlow implementation), preceded by the file tree of the imgclsmob repository:

imgclsmob-master
- convert_models.py
- gluon
  - lr_scheduler.py
  - dataset_utils.py
  - datasets
    - coco_hpe2_dataset.py
    - cityscapes_seg_dataset.py
    - imagenet1k_rec_cls_dataset.py
    - hpatches_mch_dataset.py
    - coco_hpe1_dataset.py
    - svhn_cls_dataset.py
    - voc_seg_dataset.py
    - widerface_det_dataset.py
    - ade20k_seg_dataset.py
    - cifar10_cls_dataset.py
    - dataset_metainfo.py
    - coco_det_dataset.py
    - __init__.py
    - imagenet1k_cls_dataset.py
    - cifar100_cls_dataset.py
    - cub200_2011_cls_dataset.py
    - seg_dataset.py
    - coco_hpe3_dataset.py
    - coco_seg_dataset.py
  - weighted_random_sampler.py
  - losses.py
  - gluoncv2
    - models
      - pyramidnet_cifar.py
      - xdensenet.py
      - vgg.py
      - shakedropresnet_cifar.py
      - proxylessnas_cub.py
      - cbamresnet.py
      - spnasnet.py
      - irevnet.py
      - voca.py
      - seresnet_cub.py
      - crunet.py
      - sparsenet.py
      - alexnet.py
      - pnasnet.py
      - channelnet.py
      - shufflenet.py
      - simpleposemobile_coco.py
      - dpn.py
      - icnet.py
      - lffd.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet_cub.py
      - efficientnetedge.py
      - mobilenet.py
      - fcn8sd.py
      - mnasnet.py
      - proxylessnas.py
      - hrnet.py
      - darts.py
      - sknet.py
      - ibndensenet.py
      - mobilenetv2.py
      - squeezenet.py
      - fdmobilenet.py
      - wrn_cifar.py
      - centernet.py
      - resattnet.py
      - xception.py
      - ror_cifar.py
      - octresnet_cifar.py
      - sepreresnet_cifar.py
      - lwopenpose_cmupan.py
      - seresnext.py
      - bninception.py
      - diaresnet_cifar.py
      - inceptionv3.py
      - res2net.py
      - pspnet.py
      - airnext.py
      - densenet_cifar.py
      - igcv3.py
      - resnet_cifar.py
      - bamresnet.py
      - shakeshakeresnet_cifar.py
      - pyramidnet.py
      - darknet.py
      - msdnet.py
      - preresnet_cifar.py
      - fractalnet_cifar.py
      - resnet.py
      - others
        - oth_alpha_pose.py
        - oth_simple_pose_resnet.py
        - oth_icnet.py
        - oth_centernet.py
        - oth_mobile_pose.py
        - __init__.py
        - oth_centernet2.py
      - isqrtcovresnet.py
      - nasnet.py
      - octresnet.py
      - xdensenet_cifar.py
      - diracnetv2.py
      - airnet.py
      - sharesnet.py
      - crunetb.py
      - resnet_cub.py
      - diapreresnet_cifar.py
      - selecsls.py
      - resnext_cifar.py
      - superpointnet.py
      - shufflenetv2b.py
      - polynet.py
      - menet.py
      - peleenet.py
      - densenet.py
      - dla.py
      - fishnet.py
      - shufflenetv2.py
      - ghostnet.py
      - efficientnet.py
      - diapreresnet.py
      - common.py
      - ibnresnext.py
      - resnetd.py
      - __init__.py
      - resneta.py
      - espnetv2.py
      - preresnet.py
      - hardnet.py
      - resdropresnet_cifar.py
      - drn.py
      - ibnbresnet.py
      - zfnet.py
      - nin_cifar.py
      - model_store.py
      - fbnet.py
      - mixnet.py
      - darknet53.py
      - ibppose_coco.py
      - simplepose_coco.py
      - fastseresnet.py
      - wrn.py
      - alphapose_coco.py
      - wrn1bit_cifar.py
      - ibnresnet.py
      - seresnet_cifar.py
      - resnext.py
      - ntsnet_cub.py
      - diaresnet.py
      - seresnet.py
      - deeplabv3.py
      - condensenet.py
      - vovnet.py
      - bagnet.py
      - sepreresnet.py
      - inceptionresnetv2.py
      - inceptionv4.py
      - senet.py
      - bisenet.py
      - rir_cifar.py
      - sinet.py
    - model_provider.py
    - __init__.py
  - setup.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - metrics
    - hpe_metrics.py
    - seg_metrics_nd.py
    - det_metrics.py
    - __init__.py
    - seg_metrics.py
    - cls_metrics.py
    - seg_metrics_np.py
  - LICENSE.txt
  - model_stats.py
- eval_ch.py
- examples
  - convert_tf2_to_tfl.py
  - demo_gl.py
  - demo_tf2.py
  - demo_pt.py
- eval_ke.py
- train_tf.py
- LICENSE
- common
  - logger_utils.py
  - train_log_param_saver.py
  - __init__.py
  - env_stats.py
- deploy
  - bootstrap_eval.sh
  - bootstrap_train_gl.sh
  - Dockerfile
- tensorflow_
  - setup.py
  - tensorflowcv
    - models
      - vgg.py
      - alexnet.py
      - channelnet.py
      - shufflenet.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet.py
      - mnasnet.py
      - mobilenetv2.py
      - squeezenet.py
      - seresnext.py
      - igcv3.py
      - darknet.py
      - resnet.py
      - others
        - __init__.py
      - shufflenetv2b.py
      - menet.py
      - densenet.py
      - shufflenetv2.py
      - common.py
      - __init__.py
      - preresnet.py
      - zfnet.py
      - model_store.py
      - darknet53.py
      - resnext.py
      - seresnet.py
      - sepreresnet.py
      - senet.py
    - model_provider.py
    - __init__.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - LICENSE.txt
  - utils_tp.py
- sotabench.py
- eval_gl_det.py
- pytorch
  - dataset_utils.py
  - datasets
    - coco_hpe2_dataset.py
    - cityscapes_seg_dataset.py
    - mpii_hpe_dataset.py
    - hpatches_mch_dataset.py
    - coco_hpe1_dataset.py
    - svhn_cls_dataset.py
    - voc_seg_dataset.py
    - ade20k_seg_dataset.py
    - cifar10_cls_dataset.py
    - dataset_metainfo.py
    - coco_det_dataset.py
    - __init__.py
    - imagenet1k_cls_dataset.py
    - cifar100_cls_dataset.py
    - cub200_2011_cls_dataset.py
    - hpe_dataset.py
    - seg_dataset.py
    - coco_hpe3_dataset.py
    - coco_seg_dataset.py
  - setup.py
  - pytorchcv
    - models
      - pyramidnet_cifar.py
      - prnet.py
      - xdensenet.py
      - vgg.py
      - shakedropresnet_cifar.py
      - proxylessnas_cub.py
      - cbamresnet.py
      - spnasnet.py
      - irevnet.py
      - voca.py
      - seresnet_cub.py
      - sparsenet.py
      - alexnet.py
      - pnasnet.py
      - channelnet.py
      - shufflenet.py
      - simpleposemobile_coco.py
      - dpn.py
      - icnet.py
      - lffd.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet_cub.py
      - efficientnetedge.py
      - mobilenet.py
      - fcn8sd.py
      - mnasnet.py
      - proxylessnas.py
      - hrnet.py
      - darts.py
      - sknet.py
      - ibndensenet.py
      - mobilenetv2.py
      - squeezenet.py
      - fdmobilenet.py
      - wrn_cifar.py
      - centernet.py
      - resattnet.py
      - xception.py
      - ror_cifar.py
      - msdnet_cifar10.py
      - sepreresnet_cifar.py
      - lwopenpose_cmupan.py
      - seresnext.py
      - bninception.py
      - diaresnet_cifar.py
      - inceptionv3.py
      - pspnet.py
      - airnext.py
      - densenet_cifar.py
      - igcv3.py
      - resnet_cifar.py
      - bamresnet.py
      - shakeshakeresnet_cifar.py
      - pyramidnet.py
      - darknet.py
      - msdnet.py
      - preresnet_cifar.py
      - fractalnet_cifar.py
      - resnet.py
      - others
        - oth_lffd.py
        - oth_sinet.py
        - oth_ibppose.py
        - oth_bisenet1.py
        - oth_lwopenpose2d.py
        - oth_naivenet.py
        - oth_lwopenpose3d.py
        - __init__.py
        - oth_lffd25.py
        - oth_pose_resnet.py
        - oth_prnet.py
        - oth_ibppose1.py
      - isqrtcovresnet.py
      - nasnet.py
      - octresnet.py
      - xdensenet_cifar.py
      - diracnetv2.py
      - airnet.py
      - sharesnet.py
      - resnet_cub.py
      - diapreresnet_cifar.py
      - selecsls.py
      - resnext_cifar.py
      - superpointnet.py
      - shufflenetv2b.py
      - polynet.py
      - menet.py
      - peleenet.py
      - densenet.py
      - dla.py
      - fishnet.py
      - shufflenetv2.py
      - ghostnet.py
      - efficientnet.py
      - diapreresnet.py
      - common.py
      - ibnresnext.py
      - resnetd.py
      - __init__.py
      - resneta.py
      - espnetv2.py
      - preresnet.py
      - hardnet.py
      - resdropresnet_cifar.py
      - drn.py
      - ibnbresnet.py
      - zfnet.py
      - nin_cifar.py
      - model_store.py
      - fbnet.py
      - mixnet.py
      - darknet53.py
      - ibppose_coco.py
      - simplepose_coco.py
      - fastseresnet.py
      - wrn.py
      - alphapose_coco.py
      - revnet.py
      - wrn1bit_cifar.py
      - ibnresnet.py
      - seresnet_cifar.py
      - resnext.py
      - ntsnet_cub.py
      - diaresnet.py
      - seresnet.py
      - deeplabv3.py
      - condensenet.py
      - vovnet.py
      - bagnet.py
      - sepreresnet.py
      - inceptionresnetv2.py
      - inceptionv4.py
      - senet.py
      - bisenet.py
      - rir_cifar.py
      - sinet.py
    - model_provider.py
    - __init__.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - metrics
    - hpe_metrics.py
    - metric.py
    - ret_metrics.py
    - det_metrics.py
    - __init__.py
    - seg_metrics.py
    - cls_metrics.py
    - seg_metrics_np.py
  - LICENSE.txt
  - model_stats.py
- eval_tf2.py
- train_tf2.py
- eval_gl.py
- train_ch.py
- train_pt.py
- train_gl.py
- chainer_
  - dataset_utils.py
  - chainercv2
    - models
      - pyramidnet_cifar.py
      - xdensenet.py
      - vgg.py
      - shakedropresnet_cifar.py
      - proxylessnas_cub.py
      - cbamresnet.py
      - spnasnet.py
      - irevnet.py
      - voca.py
      - seresnet_cub.py
      - sparsenet.py
      - alexnet.py
      - pnasnet.py
      - channelnet.py
      - shufflenet.py
      - simpleposemobile_coco.py
      - dpn.py
      - icnet.py
      - lffd.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet_cub.py
      - efficientnetedge.py
      - mobilenet.py
      - fcn8sd.py
      - mnasnet.py
      - proxylessnas.py
      - hrnet.py
      - darts.py
      - sknet.py
      - mobilenetv2.py
      - squeezenet.py
      - fdmobilenet.py
      - wrn_cifar.py
      - centernet.py
      - resattnet.py
      - xception.py
      - ror_cifar.py
      - sepreresnet_cifar.py
      - lwopenpose_cmupan.py
      - seresnext.py
      - bninception.py
      - diaresnet_cifar.py
      - inceptionv3.py
      - pspnet.py
      - airnext.py
      - densenet_cifar.py
      - igcv3.py
      - resnet_cifar.py
      - bamresnet.py
      - shakeshakeresnet_cifar.py
      - pyramidnet.py
      - darknet.py
      - preresnet_cifar.py
      - resnet.py
      - others
        - __init__.py
      - nasnet.py
      - octresnet.py
      - xdensenet_cifar.py
      - diracnetv2.py
      - airnet.py
      - sharesnet.py
      - resnet_cub.py
      - diapreresnet_cifar.py
      - selecsls.py
      - resnext_cifar.py
      - shufflenetv2b.py
      - polynet.py
      - menet.py
      - peleenet.py
      - densenet.py
      - dla.py
      - fishnet.py
      - shufflenetv2.py
      - ghostnet.py
      - efficientnet.py
      - diapreresnet.py
      - common.py
      - resnetd.py
      - __init__.py
      - resneta.py
      - espnetv2.py
      - preresnet.py
      - hardnet.py
      - resdropresnet_cifar.py
      - drn.py
      - zfnet.py
      - nin_cifar.py
      - model_store.py
      - fbnet.py
      - mixnet.py
      - darknet53.py
      - ibppose_coco.py
      - simplepose_coco.py
      - fastseresnet.py
      - wrn.py
      - alphapose_coco.py
      - wrn1bit_cifar.py
      - seresnet_cifar.py
      - resnext.py
      - ntsnet_cub.py
      - diaresnet.py
      - seresnet.py
      - deeplabv3.py
      - condensenet.py
      - vovnet.py
      - bagnet.py
      - sepreresnet.py
      - inceptionresnetv2.py
      - inceptionv4.py
      - senet.py
      - bisenet.py
      - rir_cifar.py
      - sinet.py
    - model_provider.py
    - __init__.py
  - datasets
    - coco_hpe2_dataset.py
    - cityscapes_seg_dataset.py
    - coco_hpe1_dataset.py
    - svhn_cls_dataset.py
    - voc_seg_dataset.py
    - ade20k_seg_dataset.py
    - cifar10_cls_dataset.py
    - dataset_metainfo.py
    - __init__.py
    - imagenet1k_cls_dataset.py
    - cifar100_cls_dataset.py
    - cub200_2011_cls_dataset.py
    - seg_dataset.py
    - coco_hpe3_dataset.py
    - coco_seg_dataset.py
  - setup.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - metrics
    - hpe_metrics.py
    - metric.py
    - det_metrics.py
    - __init__.py
    - seg_metrics.py
    - cls_metrics.py
    - seg_metrics_np.py
  - LICENSE.txt
- train_ke.py
- __init__.py
- eval_pt.py
- .travis.yml
- README.md
- tests
  - convert_gl2pt_dense.py
  - convert_gl2tf2_conv2d_b.py
  - convert_gl2tf2_conv2d.py
  - convert_gl2tf_conv2d.py
  - convert_gl2tf_batchnorm.py
  - convert_gl2tf_dwconv2d.py
  - convert_gl2tf_dense.py
  - convert_gl2tf_conv1x1.py
  - convert_gl2tf2_batchnorm.py
  - __init__.py
  - convert_gl2pt_batchnorm.py
  - convert_gl2tf_avgpool2d.py
  - convert_gl2tf2_dwconv2d.py
  - convert_gl2pt_conv2d.py
  - convert_gl2tf2_avgpool2d.py
  - convert_gl2tf_maxpool2d.py
  - convert_gl2tf_gconv2d.py
- requirements.txt
- keras_
  - setup.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - LICENSE.txt
  - kerascv
    - models
      - vgg.py
      - alexnet.py
      - shufflenet.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet.py
      - mnasnet.py
      - mobilenetv2.py
      - squeezenet.py
      - seresnext.py
      - igcv3.py
      - darknet.py
      - resnet.py
      - others
        - __init__.py
      - shufflenetv2b.py
      - menet.py
      - densenet.py
      - shufflenetv2.py
      - efficientnet.py
      - common.py
      - __init__.py
      - preresnet.py
      - zfnet.py
      - model_store.py
      - darknet53.py
      - resnext.py
      - seresnet.py
      - sepreresnet.py
      - senet.py
    - model_provider.py
    - __init__.py
- .gitignore
- tensorflow2
  - dataset_utils.py
  - datasets
    - coco_hpe2_dataset.py
    - cityscapes_seg_dataset.py
    - coco_hpe1_dataset.py
    - svhn_cls_dataset.py
    - voc_seg_dataset.py
    - ade20k_seg_dataset.py
    - cifar10_cls_dataset.py
    - cls_dataset.py
    - dataset_metainfo.py
    - __init__.py
    - imagenet1k_cls_dataset.py
    - cifar100_cls_dataset.py
    - cub200_2011_cls_dataset.py
    - seg_dataset.py
    - coco_hpe3_dataset.py
    - coco_seg_dataset.py
  - tf2cv
    - models
      - pyramidnet_cifar.py
      - vgg.py
      - proxylessnas_cub.py
      - cbamresnet.py
      - spnasnet.py
      - voca.py
      - seresnet_cub.py
      - alexnet.py
      - pnasnet.py
      - shufflenet.py
      - simpleposemobile_coco.py
      - dpn.py
      - icnet.py
      - lffd.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet_cub.py
      - efficientnetedge.py
      - mobilenet.py
      - fcn8sd.py
      - mnasnet.py
      - proxylessnas.py
      - hrnet.py
      - sknet.py
      - ibndensenet.py
      - mobilenetv2.py
      - squeezenet.py
      - fdmobilenet.py
      - wrn_cifar.py
      - centernet.py
      - xception.py
      - sepreresnet_cifar.py
      - lwopenpose_cmupan.py
      - seresnext.py
      - bninception.py
      - inceptionv3.py
      - pspnet.py
      - airnext.py
      - densenet_cifar.py
      - igcv3.py
      - resnet_cifar.py
      - bamresnet.py
      - pyramidnet.py
      - darknet.py
      - preresnet_cifar.py
      - resnet.py
      - nasnet.py
      - diracnetv2.py
      - airnet.py
      - resnet_cub.py
      - selecsls.py
      - resnext_cifar.py
      - shufflenetv2b.py
      - polynet.py
      - menet.py
      - peleenet.py
      - densenet.py
      - dla.py
      - shufflenetv2.py
      - ghostnet.py
      - efficientnet.py
      - common.py
      - ibnresnext.py
      - resnetd.py
      - __init__.py
      - resneta.py
      - espnetv2.py
      - preresnet.py
      - hardnet.py
      - drn.py
      - ibnbresnet.py
      - zfnet.py
      - model_store.py
      - fbnet.py
      - mixnet.py
      - darknet53.py
      - ibppose_coco.py
      - simplepose_coco.py
      - fastseresnet.py
      - wrn.py
      - alphapose_coco.py
      - ibnresnet.py
      - seresnet_cifar.py
      - resnext.py
      - seresnet.py
      - grmiposelite_coco.py
      - deeplabv3.py
      - vovnet.py
      - bagnet.py
      - sepreresnet.py
      - inceptionresnetv2.py
      - inceptionv4.py
      - senet.py
      - bisenet.py
      - sinet.py
    - model_provider.py
    - __init__.py
  - setup.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - metrics
    - hpe_metrics.py
    - metric.py
    - det_metrics.py
    - __init__.py
    - seg_metrics.py
    - cls_metrics.py
    - seg_metrics_np.py
  - LICENSE.txt
- other
  - eval_pt_seg-.py
  - datasets
    - __init__.py
  - gluon
    - khpa
      - train_gl_khpa.py
      - khpa_utils.py
      - eval_gl_khpa.py
      - __init__.py
      - khpa_cls_dataset.py
    - __init__.py
    - seg_utils1.py
  - train_gl_cifar-.py
  - train_pt_cifar-.py
  - train_gl_seg.py
  - eval_gl_seg-.py
  - pytorch
    - cub200_2011_utils1.py
    - imagenet1k1.py
    - __init__.py
    - cifar1.py
    - seg_utils.py
  - eval_pt_mch.py
  - eval_ch_seg-.py
  - chainer_
    - imagenet1k1.py
    - train_ch_in1k.py
    - top_k_accuracy1.py
    - __init__.py
    - train_ch_cifar.py
    - cifar1.py
    - seg_utils1.py
  - __init__.py
  - eval_pt_cub-.py
  - eval_ch_cifar-.py
  - eval_gl_mch.py
  - eval_pt_cifar-.py
  - eval_ch_in1k-.py
- eval_tf.py

"""
    BiSeNet for CelebAMask-HQ, implemented in TensorFlow.
    Original paper: 'BiSeNet: Bilateral Segmentation Network for Real-time Semantic Segmentation,'
    https://arxiv.org/abs/1808.00897.
"""

# Names exported by `from <module> import *`: the model class and its CelebAMask-HQ constructor.
__all__ = ['BiSeNet', 'bisenet_resnet18_celebamaskhq']

import os
import tensorflow as tf
import tensorflow.keras.layers as nn
from .common import conv1x1, conv1x1_block, conv3x3_block, InterpolationBlock, MultiOutputSequential, get_channel_axis,\
    get_im_size, is_channels_first
from .resnet import resnet18


class PyramidPoolingZeroBranch(nn.Layer):
    """
    Zero branch of the pyramid pooling module: global average pooling, a 1x1 convolution block and a bilinear
    upsampling back to a given spatial size.

    Parameters:
    ----------
    in_channels : int
        Number of input channels.
    out_channels : int
        Number of output channels.
    in_size : tuple of 2 int or None
        Target spatial size for the upsampling operation. If None, the spatial size of the input tensor is used.
    data_format : str, default 'channels_last'
        The ordering of the dimensions in tensors.
    """
    def __init__(self,
                 in_channels,
                 out_channels,
                 in_size,
                 data_format="channels_last",
                 **kwargs):
        super().__init__(**kwargs)
        self.in_size = in_size
        self.data_format = data_format

        # NOTE: sub-layers are created in a fixed order (pool, conv, up); keep it stable.
        self.pool = nn.GlobalAveragePooling2D(data_format=data_format, name="pool")
        self.conv = conv1x1_block(
            in_channels=in_channels,
            out_channels=out_channels,
            data_format=data_format,
            name="conv")
        self.up = InterpolationBlock(
            scale_factor=None,
            interpolation="bilinear",
            data_format=data_format,
            name="up")

    def call(self, x, training=None):
        # Resolve the upsampling target before the input is replaced by its pooled version.
        target_size = self.in_size
        if target_size is None:
            target_size = get_im_size(x, data_format=self.data_format)

        pooled = self.pool(x)

        # The pooled tensor has no spatial axes; re-insert two singleton ones at the spatial position.
        spatial_axis = -1 if is_channels_first(self.data_format) else 1
        pooled = tf.expand_dims(pooled, axis=spatial_axis)
        pooled = tf.expand_dims(pooled, axis=spatial_axis)

        pooled = self.conv(pooled, training=training)
        return self.up(pooled, size=target_size)


class AttentionRefinementBlock(nn.Layer):
    """
    Attention refinement block: a 3x3 convolution block whose output is rescaled channel-wise by a sigmoid gate
    computed from its own globally pooled response.

    Parameters:
    ----------
    in_channels : int
        Number of input channels.
    out_channels : int
        Number of output channels.
    data_format : str, default 'channels_last'
        The ordering of the dimensions in tensors.
    """
    def __init__(self,
                 in_channels,
                 out_channels,
                 data_format="channels_last",
                 **kwargs):
        super().__init__(**kwargs)
        self.data_format = data_format

        self.conv1 = conv3x3_block(
            in_channels=in_channels,
            out_channels=out_channels,
            data_format=data_format,
            name="conv1")
        self.pool = nn.GlobalAveragePooling2D(data_format=data_format, name="pool")
        # Gate branch: 1x1 convolution block with a sigmoid activation.
        self.conv2 = conv1x1_block(
            in_channels=out_channels,
            out_channels=out_channels,
            activation="sigmoid",
            data_format=data_format,
            name="conv2")

    def call(self, x, training=None):
        features = self.conv1(x, training=training)

        # Build the gate from the pooled features, restoring two singleton spatial axes for the convolution.
        gate = self.pool(features)
        spatial_axis = -1 if is_channels_first(self.data_format) else 1
        gate = tf.expand_dims(gate, axis=spatial_axis)
        gate = tf.expand_dims(gate, axis=spatial_axis)
        gate = self.conv2(gate, training=training)

        return features * gate


class PyramidPoolingMainBranch(nn.Layer):
    """
    Main branch of the pyramid pooling module: attention refinement of the first input, addition of the second
    input, bilinear upsampling and a final 3x3 convolution block.

    Parameters:
    ----------
    in_channels : int
        Number of input channels.
    out_channels : int
        Number of output channels.
    scale_factor : float
        Multiplier for spatial size.
    data_format : str, default 'channels_last'
        The ordering of the dimensions in tensors.
    """
    def __init__(self,
                 in_channels,
                 out_channels,
                 scale_factor,
                 data_format="channels_last",
                 **kwargs):
        super().__init__(**kwargs)
        self.att = AttentionRefinementBlock(
            in_channels=in_channels,
            out_channels=out_channels,
            data_format=data_format,
            name="att")
        self.up = InterpolationBlock(
            scale_factor=scale_factor,
            interpolation="bilinear",
            data_format=data_format,
            name="up")
        self.conv = conv3x3_block(
            in_channels=out_channels,
            out_channels=out_channels,
            data_format=data_format,
            name="conv")

    def call(self, x, y, training=None):
        # `y` is added to the refined `x` before upsampling.
        merged = self.att(x, training=training) + y
        upsampled = self.up(merged)
        return self.conv(upsampled, training=training)


class FeatureFusion(nn.Layer):
    """
    Feature fusion block: concatenates two inputs along the channel axis, merges them with a 1x1 convolution
    block and adds a channel-attention-weighted copy of the merged features to the merged features.

    Parameters:
    ----------
    in_channels : int
        Number of input channels (of the concatenated tensor).
    out_channels : int
        Number of output channels.
    reduction : int, default 4
        Squeeze reduction value.
    data_format : str, default 'channels_last'
        The ordering of the dimensions in tensors.
    """
    def __init__(self,
                 in_channels,
                 out_channels,
                 reduction=4,
                 data_format="channels_last",
                 **kwargs):
        super().__init__(**kwargs)
        self.data_format = data_format
        squeezed_channels = out_channels // reduction

        self.conv_merge = conv1x1_block(
            in_channels=in_channels,
            out_channels=out_channels,
            data_format=data_format,
            name="conv_merge")
        self.pool = nn.GlobalAveragePooling2D(data_format=data_format, name="pool")
        # Attention branch: 1x1 conv -> ReLU -> 1x1 conv -> sigmoid.
        self.conv1 = conv1x1(
            in_channels=out_channels,
            out_channels=squeezed_channels,
            data_format=data_format,
            name="conv1")
        self.activ = nn.ReLU()
        self.conv2 = conv1x1(
            in_channels=squeezed_channels,
            out_channels=out_channels,
            data_format=data_format,
            name="conv2")
        self.sigmoid = tf.nn.sigmoid

    def call(self, x, y, training=None):
        channel_axis = get_channel_axis(self.data_format)
        merged = self.conv_merge(tf.concat([x, y], axis=channel_axis), training=training)

        # Channel attention computed from the globally pooled merged features.
        spatial_axis = -1 if is_channels_first(self.data_format) else 1
        attention = self.pool(merged)
        attention = tf.expand_dims(attention, axis=spatial_axis)
        attention = tf.expand_dims(attention, axis=spatial_axis)
        attention = self.sigmoid(self.conv2(self.activ(self.conv1(attention))))

        # Residual form: merged + merged * attention.
        return merged + merged * attention


class PyramidPooling(nn.Layer):
    """
    Pyramid Pooling module. Chains the zero branch (on x32) with two main branches (on x32 and x16) and fuses
    the result with x8.

    Parameters:
    ----------
    x16_in_channels : int
        Number of input channels for x16.
    x32_in_channels : int
        Number of input channels for x32.
    y_out_channels : int
        Number of output channels for y-outputs.
    y32_out_size : tuple of 2 int
        Spatial size of the y32 tensor.
    data_format : str, default 'channels_last'
        The ordering of the dimensions in tensors.
    """
    def __init__(self,
                 x16_in_channels,
                 x32_in_channels,
                 y_out_channels,
                 y32_out_size,
                 data_format="channels_last",
                 **kwargs):
        super().__init__(**kwargs)
        # The fusion block works on twice the y-branch width.
        fused_channels = 2 * y_out_channels

        self.pool32 = PyramidPoolingZeroBranch(
            in_channels=x32_in_channels,
            out_channels=y_out_channels,
            in_size=y32_out_size,
            data_format=data_format,
            name="pool32")
        self.pool16 = PyramidPoolingMainBranch(
            in_channels=x32_in_channels,
            out_channels=y_out_channels,
            scale_factor=2,
            data_format=data_format,
            name="pool16")
        self.pool8 = PyramidPoolingMainBranch(
            in_channels=x16_in_channels,
            out_channels=y_out_channels,
            scale_factor=2,
            data_format=data_format,
            name="pool8")
        self.fusion = FeatureFusion(
            in_channels=fused_channels,
            out_channels=fused_channels,
            data_format=data_format,
            name="fusion")

    def call(self, x8, x16, x32, training=None):
        # Each branch consumes the output of the previous, coarser one.
        ctx32 = self.pool32(x32, training=training)
        ctx16 = self.pool16(x32, ctx32, training=training)
        ctx8 = self.pool8(x16, ctx16, training=training)
        fused8 = self.fusion(x8, ctx8, training=training)
        return fused8, ctx8, ctx16


class BiSeHead(nn.Layer):
    """
    BiSeNet head (final) block: a 3x3 convolution block followed by a plain 1x1 convolution.

    Parameters:
    ----------
    in_channels : int
        Number of input channels.
    mid_channels : int
        Number of middle channels.
    out_channels : int
        Number of output channels.
    data_format : str, default 'channels_last'
        The ordering of the dimensions in tensors.
    """
    def __init__(self,
                 in_channels,
                 mid_channels,
                 out_channels,
                 data_format="channels_last",
                 **kwargs):
        super().__init__(**kwargs)
        self.conv1 = conv3x3_block(
            in_channels=in_channels,
            out_channels=mid_channels,
            data_format=data_format,
            name="conv1")
        self.conv2 = conv1x1(
            in_channels=mid_channels,
            out_channels=out_channels,
            data_format=data_format,
            name="conv2")

    def call(self, x, training=None):
        # Only the first block receives the `training` flag; the final 1x1 convolution is called without it.
        hidden = self.conv1(x, training=training)
        return self.conv2(hidden)


class BiSeNet(tf.keras.Model):
    """
    BiSeNet model from 'BiSeNet: Bilateral Segmentation Network for Real-time Semantic Segmentation,'
    https://arxiv.org/abs/1808.00897.

    Parameters:
    ----------
    backbone : func -> (feature extractor, list of int)
        Factory called with the `data_format` and `name` keyword arguments. It must return the feature extractor
        (producing the x8, x16 and x32 feature maps) and a list of channel counts, where item 0 is used as the
        width of the pooling branches and items 1 and 2 are the channel counts of x16 and x32.
    aux : bool, default True
        Whether to output an auxiliary results.
    fixed_size : bool, default True
        Whether to expect fixed spatial size of input image.
    in_channels : int, default 3
        Number of input channels (only 3 is accepted).
    in_size : tuple of two ints, default (640, 480)
        Spatial size of the expected input image.
    classes : int, default 19
        Number of segmentation classes.
    data_format : str, default 'channels_last'
        The ordering of the dimensions in tensors.
    """
    def __init__(self,
                 backbone,
                 aux=True,
                 fixed_size=True,
                 in_channels=3,
                 in_size=(640, 480),
                 classes=19,
                 data_format="channels_last",
                 **kwargs):
        super(BiSeNet, self).__init__(**kwargs)
        assert (in_channels == 3)
        self.in_size = in_size
        self.classes = classes
        self.data_format = data_format
        self.aux = aux
        self.fixed_size = fixed_size

        self.backbone, backbone_out_channels = backbone(
            data_format=data_format,
            name="backbone")

        y_out_channels = backbone_out_channels[0]
        z_out_channels = 2 * y_out_channels
        # With a fixed input size the x32 feature map size is known up front; otherwise the zero branch reads
        # it from its input at call time.
        y32_out_size = (self.in_size[0] // 32, self.in_size[1] // 32) if fixed_size else None
        self.pool = PyramidPooling(
            x16_in_channels=backbone_out_channels[1],
            x32_in_channels=backbone_out_channels[2],
            y_out_channels=y_out_channels,
            y32_out_size=y32_out_size,
            data_format=data_format,
            name="pool")
        self.head_z8 = BiSeHead(
            in_channels=z_out_channels,
            mid_channels=z_out_channels,
            out_channels=classes,
            data_format=data_format,
            name="head_z8")
        self.up8 = InterpolationBlock(
            scale_factor=(8 if fixed_size else None),
            data_format=data_format,
            name="up8")

        if self.aux:
            mid_channels = y_out_channels // 2
            self.head_y8 = BiSeHead(
                in_channels=y_out_channels,
                mid_channels=mid_channels,
                out_channels=classes,
                data_format=data_format,
                name="head_y8")
            self.head_y16 = BiSeHead(
                in_channels=y_out_channels,
                mid_channels=mid_channels,
                out_channels=classes,
                data_format=data_format,
                name="head_y16")
            self.up16 = InterpolationBlock(
                scale_factor=(16 if fixed_size else None),
                data_format=data_format,
                name="up16")

    @staticmethod
    def _upsample(block, x, out_size):
        """
        Apply an interpolation block, passing an explicit target size only when one is given.
        """
        if out_size is None:
            return block(x)
        return block(x, size=out_size)

    def call(self, x, training=None):
        # Both spatial dimensions must be divisible by 32 (the stride of the deepest feature map).
        assert is_channels_first(self.data_format) or ((x.shape[1] % 32 == 0) and (x.shape[2] % 32 == 0))
        assert (not is_channels_first(self.data_format)) or ((x.shape[2] % 32 == 0) and (x.shape[3] % 32 == 0))

        # When the input size is not fixed, `up8`/`up16` are created without a scale factor, so the target size
        # (the spatial size of the input) has to be supplied explicitly, as PyramidPoolingZeroBranch does.
        out_size = None if self.fixed_size else get_im_size(x, data_format=self.data_format)

        x8, x16, x32 = self.backbone(x, training=training)
        z8, y8, y16 = self.pool(x8, x16, x32, training=training)

        z8 = self.head_z8(z8, training=training)
        z8 = self._upsample(self.up8, z8, out_size)

        if self.aux:
            y8 = self.head_y8(y8, training=training)
            y16 = self.head_y16(y16, training=training)
            y8 = self._upsample(self.up8, y8, out_size)
            y16 = self._upsample(self.up16, y16, out_size)
            return z8, y8, y16
        else:
            return z8


def get_bisenet(model_name=None,
                pretrained=False,
                root=os.path.join("~", ".tensorflow", "models"),
                **kwargs):
    """
    Build a BiSeNet model and, on request, load pretrained weights into it.

    Parameters:
    ----------
    model_name : str or None, default None
        Model name for loading pretrained model.
    pretrained : bool, default False
        Whether to load the pretrained weights for model.
    root : str, default '~/.tensorflow/models'
        Location for keeping the model parameters.
    **kwargs
        Forwarded unchanged to the `BiSeNet` constructor.

    Raises:
    ------
    ValueError
        If `pretrained` is set but `model_name` is None or empty.
    """
    net = BiSeNet(**kwargs)
    if not pretrained:
        return net

    if not model_name:
        raise ValueError("Parameter `model_name` should be properly initialized for loading pretrained model.")
    from .model_store import get_model_file

    # The model is built for a single-sample batch of the expected input size before the weights are loaded.
    in_channels = kwargs.get("in_channels", 3)
    if net.data_format == "channels_first":
        input_shape = (1, in_channels) + net.in_size
    else:
        input_shape = (1,) + net.in_size + (in_channels,)
    net.build(input_shape=input_shape)

    weights_path = get_model_file(
        model_name=model_name,
        local_model_store_dir_path=root)
    net.load_weights(filepath=weights_path)
    return net


def bisenet_resnet18_celebamaskhq(pretrained_backbone=False, classes=19, **kwargs):
    """
    BiSeNet model on the base of ResNet-18 for face segmentation on CelebAMask-HQ from 'BiSeNet: Bilateral Segmentation
    Network for Real-time Semantic Segmentation,' https://arxiv.org/abs/1808.00897.

    Parameters:
    ----------
    pretrained_backbone : bool, default False
        Whether to load the pretrained weights for feature extractor.
    classes : int, default 19
        Number of classes.
    pretrained : bool, default False
        Whether to load the pretrained weights for model.
    root : str, default '~/.tensorflow/models'
        Location for keeping the model parameters.
    """
    def backbone(**bb_kwargs):
        # Take the ResNet-18 feature extractor and drop its trailing layer.
        raw_features = resnet18(pretrained=pretrained_backbone, **bb_kwargs).features
        raw_features._layers.pop()
        raw_layers = raw_features._layers

        features = MultiOutputSequential(return_last=False, name="backbone")
        features.add(raw_layers[0])
        # Every layer after the first of the remaining ones is flagged as an output of the backbone.
        for position, stage in enumerate(raw_layers[1:], start=1):
            if position > 1:
                stage.do_output = True
            features.add(stage)
        return features, [128, 256, 512]

    return get_bisenet(backbone=backbone, classes=classes, model_name="bisenet_resnet18_celebamaskhq", **kwargs)


def _test():
    """
    Smoke test: build each model, run one forward pass on random data and check the output shape and the number
    of trainable weights.
    """
    import numpy as np
    import tensorflow.keras.backend as K

    # Switch to "channels_first" to exercise the other tensor layout.
    data_format = "channels_last"
    in_size = (640, 480)
    aux = True
    pretrained = False
    batch = 14

    models = [
        bisenet_resnet18_celebamaskhq,
    ]

    channels_first = is_channels_first(data_format)
    if channels_first:
        input_shape = (batch, 3, in_size[0], in_size[1])
        channel_axis, height_axis, width_axis = 1, 2, 3
    else:
        input_shape = (batch, in_size[0], in_size[1], 3)
        channel_axis, height_axis, width_axis = 3, 1, 2

    # Expected number of trainable weights with and without the auxiliary heads.
    expected_weight_count = 13300416 if aux else 13150272

    for model in models:
        net = model(pretrained=pretrained, in_size=in_size, aux=aux, data_format=data_format)

        x = tf.random.normal(input_shape)
        outputs = net(x)
        y = outputs[0] if aux else outputs

        # The main output keeps the batch and spatial size of the input and has 19 channels.
        assert (y.shape[0] == x.shape[0])
        assert ((y.shape[channel_axis] == 19) and (y.shape[height_axis] == x.shape[height_axis]) and
                (y.shape[width_axis] == x.shape[width_axis]))

        weight_count = sum(np.prod(K.get_value(w).shape) for w in net.trainable_weights)
        print("m={}, {}".format(model.__name__, weight_count))
        assert (model != bisenet_resnet18_celebamaskhq or weight_count == expected_weight_count)


# Run the smoke test only when this module is executed directly, not when it is imported.
if __name__ == "__main__":
    _test()