Python source code of AlexNet

imgclsmob-master
- convert_models.py
- gluon
  - lr_scheduler.py
  - dataset_utils.py
  - datasets
    - coco_hpe2_dataset.py
    - cityscapes_seg_dataset.py
    - imagenet1k_rec_cls_dataset.py
    - hpatches_mch_dataset.py
    - coco_hpe1_dataset.py
    - svhn_cls_dataset.py
    - voc_seg_dataset.py
    - widerface_det_dataset.py
    - ade20k_seg_dataset.py
    - cifar10_cls_dataset.py
    - dataset_metainfo.py
    - coco_det_dataset.py
    - __init__.py
    - imagenet1k_cls_dataset.py
    - cifar100_cls_dataset.py
    - cub200_2011_cls_dataset.py
    - seg_dataset.py
    - coco_hpe3_dataset.py
    - coco_seg_dataset.py
  - weighted_random_sampler.py
  - losses.py
  - gluoncv2
    - models
      - pyramidnet_cifar.py
      - xdensenet.py
      - vgg.py
      - shakedropresnet_cifar.py
      - proxylessnas_cub.py
      - cbamresnet.py
      - spnasnet.py
      - irevnet.py
      - voca.py
      - seresnet_cub.py
      - crunet.py
      - sparsenet.py
      - alexnet.py
      - pnasnet.py
      - channelnet.py
      - shufflenet.py
      - simpleposemobile_coco.py
      - dpn.py
      - icnet.py
      - lffd.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet_cub.py
      - efficientnetedge.py
      - mobilenet.py
      - fcn8sd.py
      - mnasnet.py
      - proxylessnas.py
      - hrnet.py
      - darts.py
      - sknet.py
      - ibndensenet.py
      - mobilenetv2.py
      - squeezenet.py
      - fdmobilenet.py
      - wrn_cifar.py
      - centernet.py
      - resattnet.py
      - xception.py
      - ror_cifar.py
      - octresnet_cifar.py
      - sepreresnet_cifar.py
      - lwopenpose_cmupan.py
      - seresnext.py
      - bninception.py
      - diaresnet_cifar.py
      - inceptionv3.py
      - res2net.py
      - pspnet.py
      - airnext.py
      - densenet_cifar.py
      - igcv3.py
      - resnet_cifar.py
      - bamresnet.py
      - shakeshakeresnet_cifar.py
      - pyramidnet.py
      - darknet.py
      - msdnet.py
      - preresnet_cifar.py
      - fractalnet_cifar.py
      - resnet.py
      - others
        - oth_alpha_pose.py
        - oth_simple_pose_resnet.py
        - oth_icnet.py
        - oth_centernet.py
        - oth_mobile_pose.py
        - __init__.py
        - oth_centernet2.py
      - isqrtcovresnet.py
      - nasnet.py
      - octresnet.py
      - xdensenet_cifar.py
      - diracnetv2.py
      - airnet.py
      - sharesnet.py
      - crunetb.py
      - resnet_cub.py
      - diapreresnet_cifar.py
      - selecsls.py
      - resnext_cifar.py
      - superpointnet.py
      - shufflenetv2b.py
      - polynet.py
      - menet.py
      - peleenet.py
      - densenet.py
      - dla.py
      - fishnet.py
      - shufflenetv2.py
      - ghostnet.py
      - efficientnet.py
      - diapreresnet.py
      - common.py
      - ibnresnext.py
      - resnetd.py
      - __init__.py
      - resneta.py
      - espnetv2.py
      - preresnet.py
      - hardnet.py
      - resdropresnet_cifar.py
      - drn.py
      - ibnbresnet.py
      - zfnet.py
      - nin_cifar.py
      - model_store.py
      - fbnet.py
      - mixnet.py
      - darknet53.py
      - ibppose_coco.py
      - simplepose_coco.py
      - fastseresnet.py
      - wrn.py
      - alphapose_coco.py
      - wrn1bit_cifar.py
      - ibnresnet.py
      - seresnet_cifar.py
      - resnext.py
      - ntsnet_cub.py
      - diaresnet.py
      - seresnet.py
      - deeplabv3.py
      - condensenet.py
      - vovnet.py
      - bagnet.py
      - sepreresnet.py
      - inceptionresnetv2.py
      - inceptionv4.py
      - senet.py
      - bisenet.py
      - rir_cifar.py
      - sinet.py
    - model_provider.py
    - __init__.py
  - setup.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - metrics
    - hpe_metrics.py
    - seg_metrics_nd.py
    - det_metrics.py
    - __init__.py
    - seg_metrics.py
    - cls_metrics.py
    - seg_metrics_np.py
  - LICENSE.txt
  - model_stats.py
- eval_ch.py
- examples
  - convert_tf2_to_tfl.py
  - demo_gl.py
  - demo_tf2.py
  - demo_pt.py
- eval_ke.py
- train_tf.py
- LICENSE
- common
  - logger_utils.py
  - train_log_param_saver.py
  - __init__.py
  - env_stats.py
- deploy
  - bootstrap_eval.sh
  - bootstrap_train_gl.sh
  - Dockerfile
- tensorflow_
  - setup.py
  - tensorflowcv
    - models
      - vgg.py
      - alexnet.py
      - channelnet.py
      - shufflenet.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet.py
      - mnasnet.py
      - mobilenetv2.py
      - squeezenet.py
      - seresnext.py
      - igcv3.py
      - darknet.py
      - resnet.py
      - others
        - __init__.py
      - shufflenetv2b.py
      - menet.py
      - densenet.py
      - shufflenetv2.py
      - common.py
      - __init__.py
      - preresnet.py
      - zfnet.py
      - model_store.py
      - darknet53.py
      - resnext.py
      - seresnet.py
      - sepreresnet.py
      - senet.py
    - model_provider.py
    - __init__.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - LICENSE.txt
  - utils_tp.py
- sotabench.py
- eval_gl_det.py
- pytorch
  - dataset_utils.py
  - datasets
    - coco_hpe2_dataset.py
    - cityscapes_seg_dataset.py
    - mpii_hpe_dataset.py
    - hpatches_mch_dataset.py
    - coco_hpe1_dataset.py
    - svhn_cls_dataset.py
    - voc_seg_dataset.py
    - ade20k_seg_dataset.py
    - cifar10_cls_dataset.py
    - dataset_metainfo.py
    - coco_det_dataset.py
    - __init__.py
    - imagenet1k_cls_dataset.py
    - cifar100_cls_dataset.py
    - cub200_2011_cls_dataset.py
    - hpe_dataset.py
    - seg_dataset.py
    - coco_hpe3_dataset.py
    - coco_seg_dataset.py
  - setup.py
  - pytorchcv
    - models
      - pyramidnet_cifar.py
      - prnet.py
      - xdensenet.py
      - vgg.py
      - shakedropresnet_cifar.py
      - proxylessnas_cub.py
      - cbamresnet.py
      - spnasnet.py
      - irevnet.py
      - voca.py
      - seresnet_cub.py
      - sparsenet.py
      - alexnet.py
      - pnasnet.py
      - channelnet.py
      - shufflenet.py
      - simpleposemobile_coco.py
      - dpn.py
      - icnet.py
      - lffd.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet_cub.py
      - efficientnetedge.py
      - mobilenet.py
      - fcn8sd.py
      - mnasnet.py
      - proxylessnas.py
      - hrnet.py
      - darts.py
      - sknet.py
      - ibndensenet.py
      - mobilenetv2.py
      - squeezenet.py
      - fdmobilenet.py
      - wrn_cifar.py
      - centernet.py
      - resattnet.py
      - xception.py
      - ror_cifar.py
      - msdnet_cifar10.py
      - sepreresnet_cifar.py
      - lwopenpose_cmupan.py
      - seresnext.py
      - bninception.py
      - diaresnet_cifar.py
      - inceptionv3.py
      - pspnet.py
      - airnext.py
      - densenet_cifar.py
      - igcv3.py
      - resnet_cifar.py
      - bamresnet.py
      - shakeshakeresnet_cifar.py
      - pyramidnet.py
      - darknet.py
      - msdnet.py
      - preresnet_cifar.py
      - fractalnet_cifar.py
      - resnet.py
      - others
        - oth_lffd.py
        - oth_sinet.py
        - oth_ibppose.py
        - oth_bisenet1.py
        - oth_lwopenpose2d.py
        - oth_naivenet.py
        - oth_lwopenpose3d.py
        - __init__.py
        - oth_lffd25.py
        - oth_pose_resnet.py
        - oth_prnet.py
        - oth_ibppose1.py
      - isqrtcovresnet.py
      - nasnet.py
      - octresnet.py
      - xdensenet_cifar.py
      - diracnetv2.py
      - airnet.py
      - sharesnet.py
      - resnet_cub.py
      - diapreresnet_cifar.py
      - selecsls.py
      - resnext_cifar.py
      - superpointnet.py
      - shufflenetv2b.py
      - polynet.py
      - menet.py
      - peleenet.py
      - densenet.py
      - dla.py
      - fishnet.py
      - shufflenetv2.py
      - ghostnet.py
      - efficientnet.py
      - diapreresnet.py
      - common.py
      - ibnresnext.py
      - resnetd.py
      - __init__.py
      - resneta.py
      - espnetv2.py
      - preresnet.py
      - hardnet.py
      - resdropresnet_cifar.py
      - drn.py
      - ibnbresnet.py
      - zfnet.py
      - nin_cifar.py
      - model_store.py
      - fbnet.py
      - mixnet.py
      - darknet53.py
      - ibppose_coco.py
      - simplepose_coco.py
      - fastseresnet.py
      - wrn.py
      - alphapose_coco.py
      - revnet.py
      - wrn1bit_cifar.py
      - ibnresnet.py
      - seresnet_cifar.py
      - resnext.py
      - ntsnet_cub.py
      - diaresnet.py
      - seresnet.py
      - deeplabv3.py
      - condensenet.py
      - vovnet.py
      - bagnet.py
      - sepreresnet.py
      - inceptionresnetv2.py
      - inceptionv4.py
      - senet.py
      - bisenet.py
      - rir_cifar.py
      - sinet.py
    - model_provider.py
    - __init__.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - metrics
    - hpe_metrics.py
    - metric.py
    - ret_metrics.py
    - det_metrics.py
    - __init__.py
    - seg_metrics.py
    - cls_metrics.py
    - seg_metrics_np.py
  - LICENSE.txt
  - model_stats.py
- eval_tf2.py
- train_tf2.py
- eval_gl.py
- train_ch.py
- train_pt.py
- train_gl.py
- chainer_
  - dataset_utils.py
  - chainercv2
    - models
      - pyramidnet_cifar.py
      - xdensenet.py
      - vgg.py
      - shakedropresnet_cifar.py
      - proxylessnas_cub.py
      - cbamresnet.py
      - spnasnet.py
      - irevnet.py
      - voca.py
      - seresnet_cub.py
      - sparsenet.py
      - alexnet.py
      - pnasnet.py
      - channelnet.py
      - shufflenet.py
      - simpleposemobile_coco.py
      - dpn.py
      - icnet.py
      - lffd.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet_cub.py
      - efficientnetedge.py
      - mobilenet.py
      - fcn8sd.py
      - mnasnet.py
      - proxylessnas.py
      - hrnet.py
      - darts.py
      - sknet.py
      - mobilenetv2.py
      - squeezenet.py
      - fdmobilenet.py
      - wrn_cifar.py
      - centernet.py
      - resattnet.py
      - xception.py
      - ror_cifar.py
      - sepreresnet_cifar.py
      - lwopenpose_cmupan.py
      - seresnext.py
      - bninception.py
      - diaresnet_cifar.py
      - inceptionv3.py
      - pspnet.py
      - airnext.py
      - densenet_cifar.py
      - igcv3.py
      - resnet_cifar.py
      - bamresnet.py
      - shakeshakeresnet_cifar.py
      - pyramidnet.py
      - darknet.py
      - preresnet_cifar.py
      - resnet.py
      - others
        - __init__.py
      - nasnet.py
      - octresnet.py
      - xdensenet_cifar.py
      - diracnetv2.py
      - airnet.py
      - sharesnet.py
      - resnet_cub.py
      - diapreresnet_cifar.py
      - selecsls.py
      - resnext_cifar.py
      - shufflenetv2b.py
      - polynet.py
      - menet.py
      - peleenet.py
      - densenet.py
      - dla.py
      - fishnet.py
      - shufflenetv2.py
      - ghostnet.py
      - efficientnet.py
      - diapreresnet.py
      - common.py
      - resnetd.py
      - __init__.py
      - resneta.py
      - espnetv2.py
      - preresnet.py
      - hardnet.py
      - resdropresnet_cifar.py
      - drn.py
      - zfnet.py
      - nin_cifar.py
      - model_store.py
      - fbnet.py
      - mixnet.py
      - darknet53.py
      - ibppose_coco.py
      - simplepose_coco.py
      - fastseresnet.py
      - wrn.py
      - alphapose_coco.py
      - wrn1bit_cifar.py
      - seresnet_cifar.py
      - resnext.py
      - ntsnet_cub.py
      - diaresnet.py
      - seresnet.py
      - deeplabv3.py
      - condensenet.py
      - vovnet.py
      - bagnet.py
      - sepreresnet.py
      - inceptionresnetv2.py
      - inceptionv4.py
      - senet.py
      - bisenet.py
      - rir_cifar.py
      - sinet.py
    - model_provider.py
    - __init__.py
  - datasets
    - coco_hpe2_dataset.py
    - cityscapes_seg_dataset.py
    - coco_hpe1_dataset.py
    - svhn_cls_dataset.py
    - voc_seg_dataset.py
    - ade20k_seg_dataset.py
    - cifar10_cls_dataset.py
    - dataset_metainfo.py
    - __init__.py
    - imagenet1k_cls_dataset.py
    - cifar100_cls_dataset.py
    - cub200_2011_cls_dataset.py
    - seg_dataset.py
    - coco_hpe3_dataset.py
    - coco_seg_dataset.py
  - setup.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - metrics
    - hpe_metrics.py
    - metric.py
    - det_metrics.py
    - __init__.py
    - seg_metrics.py
    - cls_metrics.py
    - seg_metrics_np.py
  - LICENSE.txt
- train_ke.py
- __init__.py
- eval_pt.py
- .travis.yml
- README.md
- tests
  - convert_gl2pt_dense.py
  - convert_gl2tf2_conv2d_b.py
  - convert_gl2tf2_conv2d.py
  - convert_gl2tf_conv2d.py
  - convert_gl2tf_batchnorm.py
  - convert_gl2tf_dwconv2d.py
  - convert_gl2tf_dense.py
  - convert_gl2tf_conv1x1.py
  - convert_gl2tf2_batchnorm.py
  - __init__.py
  - convert_gl2pt_batchnorm.py
  - convert_gl2tf_avgpool2d.py
  - convert_gl2tf2_dwconv2d.py
  - convert_gl2pt_conv2d.py
  - convert_gl2tf2_avgpool2d.py
  - convert_gl2tf_maxpool2d.py
  - convert_gl2tf_gconv2d.py
- requirements.txt
- keras_
  - setup.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - LICENSE.txt
  - kerascv
    - models
      - vgg.py
      - alexnet.py
      - shufflenet.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet.py
      - mnasnet.py
      - mobilenetv2.py
      - squeezenet.py
      - seresnext.py
      - igcv3.py
      - darknet.py
      - resnet.py
      - others
        - __init__.py
      - shufflenetv2b.py
      - menet.py
      - densenet.py
      - shufflenetv2.py
      - efficientnet.py
      - common.py
      - __init__.py
      - preresnet.py
      - zfnet.py
      - model_store.py
      - darknet53.py
      - resnext.py
      - seresnet.py
      - sepreresnet.py
      - senet.py
    - model_provider.py
    - __init__.py
- .gitignore
- tensorflow2
  - dataset_utils.py
  - datasets
    - coco_hpe2_dataset.py
    - cityscapes_seg_dataset.py
    - coco_hpe1_dataset.py
    - svhn_cls_dataset.py
    - voc_seg_dataset.py
    - ade20k_seg_dataset.py
    - cifar10_cls_dataset.py
    - cls_dataset.py
    - dataset_metainfo.py
    - __init__.py
    - imagenet1k_cls_dataset.py
    - cifar100_cls_dataset.py
    - cub200_2011_cls_dataset.py
    - seg_dataset.py
    - coco_hpe3_dataset.py
    - coco_seg_dataset.py
  - tf2cv
    - models
      - pyramidnet_cifar.py
      - vgg.py
      - proxylessnas_cub.py
      - cbamresnet.py
      - spnasnet.py
      - voca.py
      - seresnet_cub.py
      - alexnet.py
      - pnasnet.py
      - shufflenet.py
      - simpleposemobile_coco.py
      - dpn.py
      - icnet.py
      - lffd.py
      - squeezenext.py
      - mobilenetv3.py
      - mobilenet_cub.py
      - efficientnetedge.py
      - mobilenet.py
      - fcn8sd.py
      - mnasnet.py
      - proxylessnas.py
      - hrnet.py
      - sknet.py
      - ibndensenet.py
      - mobilenetv2.py
      - squeezenet.py
      - fdmobilenet.py
      - wrn_cifar.py
      - centernet.py
      - xception.py
      - sepreresnet_cifar.py
      - lwopenpose_cmupan.py
      - seresnext.py
      - bninception.py
      - inceptionv3.py
      - pspnet.py
      - airnext.py
      - densenet_cifar.py
      - igcv3.py
      - resnet_cifar.py
      - bamresnet.py
      - pyramidnet.py
      - darknet.py
      - preresnet_cifar.py
      - resnet.py
      - nasnet.py
      - diracnetv2.py
      - airnet.py
      - resnet_cub.py
      - selecsls.py
      - resnext_cifar.py
      - shufflenetv2b.py
      - polynet.py
      - menet.py
      - peleenet.py
      - densenet.py
      - dla.py
      - shufflenetv2.py
      - ghostnet.py
      - efficientnet.py
      - common.py
      - ibnresnext.py
      - resnetd.py
      - __init__.py
      - resneta.py
      - espnetv2.py
      - preresnet.py
      - hardnet.py
      - drn.py
      - ibnbresnet.py
      - zfnet.py
      - model_store.py
      - fbnet.py
      - mixnet.py
      - darknet53.py
      - ibppose_coco.py
      - simplepose_coco.py
      - fastseresnet.py
      - wrn.py
      - alphapose_coco.py
      - ibnresnet.py
      - seresnet_cifar.py
      - resnext.py
      - seresnet.py
      - grmiposelite_coco.py
      - deeplabv3.py
      - vovnet.py
      - bagnet.py
      - sepreresnet.py
      - inceptionresnetv2.py
      - inceptionv4.py
      - senet.py
      - bisenet.py
      - sinet.py
    - model_provider.py
    - __init__.py
  - setup.py
  - setup.cfg
  - __init__.py
  - README.md
  - utils.py
  - metrics
    - hpe_metrics.py
    - metric.py
    - det_metrics.py
    - __init__.py
    - seg_metrics.py
    - cls_metrics.py
    - seg_metrics_np.py
  - LICENSE.txt
- other
  - eval_pt_seg-.py
  - datasets
    - __init__.py
  - gluon
    - khpa
      - train_gl_khpa.py
      - khpa_utils.py
      - eval_gl_khpa.py
      - __init__.py
      - khpa_cls_dataset.py
    - __init__.py
    - seg_utils1.py
  - train_gl_cifar-.py
  - train_pt_cifar-.py
  - train_gl_seg.py
  - eval_gl_seg-.py
  - pytorch
    - cub200_2011_utils1.py
    - imagenet1k1.py
    - __init__.py
    - cifar1.py
    - seg_utils.py
  - eval_pt_mch.py
  - eval_ch_seg-.py
  - chainer_
    - imagenet1k1.py
    - train_ch_in1k.py
    - top_k_accuracy1.py
    - __init__.py
    - train_ch_cifar.py
    - cifar1.py
    - seg_utils1.py
  - __init__.py
  - eval_pt_cub-.py
  - eval_ch_cifar-.py
  - eval_gl_mch.py
  - eval_pt_cifar-.py
  - eval_ch_in1k-.py
- eval_tf.py

"""
    AlexNet for ImageNet-1K, implemented in Keras.
    Original paper: 'One weird trick for parallelizing convolutional neural networks,'
    https://arxiv.org/abs/1404.5997.
"""

# Names exported by `from <module> import *`: the model builder and the two model constructors.
__all__ = ['alexnet_model', 'alexnet', 'alexnetb']

import os
from keras import layers as nn
from keras.models import Model
from .common import conv_block, maxpool2d, is_channels_first, flatten, lrn


def alex_conv(x,
              in_channels,
              out_channels,
              kernel_size,
              strides,
              padding,
              use_lrn,
              name="alex_conv"):
    """
    Convolution unit of AlexNet: a convolution block with bias and without batch normalization, optionally
    followed by the `lrn` helper.

    Parameters:
    ----------
    x : keras.backend tensor/variable/symbol
        Input tensor/variable/symbol.
    in_channels : int
        Number of channels entering the unit.
    out_channels : int
        Number of channels produced by the unit.
    kernel_size : int or tuple/list of 2 int
        Size of the convolution window.
    strides : int or tuple/list of 2 int
        Convolution strides.
    padding : int or tuple/list of 2 int
        Padding applied by the convolution layer.
    use_lrn : bool
        If true, the convolution output is additionally passed through LRN.
    name : str, default 'alex_conv'
        Name of the unit; the convolution block is registered as `<name>/conv`.

    Returns
    -------
    keras.backend tensor/variable/symbol
        Output tensor/variable/symbol of the unit.
    """
    conv_out = conv_block(
        x=x,
        in_channels=in_channels,
        out_channels=out_channels,
        kernel_size=kernel_size,
        strides=strides,
        padding=padding,
        use_bias=True,
        use_bn=False,
        name=name + "/conv")
    # Normalization is optional; without it the convolution output is returned untouched.
    return lrn(conv_out) if use_lrn else conv_out


def alex_dense(x,
               in_channels,
               out_channels,
               name="alex_dense"):
    """
    Fully-connected unit of AlexNet: dense layer, ReLU activation and dropout with rate 0.5.

    Parameters:
    ----------
    x : keras.backend tensor/variable/symbol
        Input tensor/variable/symbol.
    in_channels : int
        Number of input features (passed to the dense layer as `input_dim`).
    out_channels : int
        Number of units of the dense layer.
    name : str, default 'alex_dense'
        Name of the unit; sub-layers are named `<name>/fc`, `<name>/activ` and `<name>/dropout`.

    Returns
    -------
    keras.backend tensor/variable/symbol
        Output tensor/variable/symbol of the unit.
    """
    fc_layer = nn.Dense(
        units=out_channels,
        input_dim=in_channels,
        name=name + "/fc")
    x = fc_layer(x)

    activ_layer = nn.Activation("relu", name=name + "/activ")
    x = activ_layer(x)

    dropout_layer = nn.Dropout(
        rate=0.5,
        name=name + "/dropout")
    return dropout_layer(x)


def alex_output_block(x,
                      in_channels,
                      classes,
                      name="alex_output_block"):
    """
    Classifier head of AlexNet: two `alex_dense` units of width 4096 followed by a plain dense layer
    with one unit per class.

    Parameters:
    ----------
    x : keras.backend tensor/variable/symbol
        Input tensor/variable/symbol.
    in_channels : int
        Number of input features of the first dense unit.
    classes : int
        Number of classification classes (units of the final dense layer).
    name : str, default 'alex_output_block'
        Name of the block; sub-layers are named `<name>/fc1`, `<name>/fc2` and `<name>/fc3`.

    Returns
    -------
    keras.backend tensor/variable/symbol
        Output tensor/variable/symbol of the block.
    """
    hidden_units = 4096

    # The two hidden units differ only in their fan-in and name suffix.
    fan_in = in_channels
    for suffix in ("/fc1", "/fc2"):
        x = alex_dense(
            x=x,
            in_channels=fan_in,
            out_channels=hidden_units,
            name=name + suffix)
        fan_in = hidden_units

    # Final projection onto the classes; no activation is applied here.
    classifier = nn.Dense(
        units=classes,
        input_dim=hidden_units,
        name=name + "/fc3")
    return classifier(x)


def alexnet_model(channels,
                  kernel_sizes,
                  strides,
                  paddings,
                  use_lrn,
                  in_channels=3,
                  in_size=(224, 224),
                  classes=1000):
    """
    Assemble the AlexNet Keras model described in 'One weird trick for parallelizing convolutional neural
    networks,' https://arxiv.org/abs/1404.5997.

    The network is a sequence of stages; each stage is a run of `alex_conv` units followed by a max-pooling
    layer. The flattened features are then passed to `alex_output_block`.

    Parameters:
    ----------
    channels : list of list of int
        Output channels of every unit, grouped by stage.
    kernel_sizes : list of list of int
        Convolution window size of every unit, grouped by stage.
    strides : list of list of int or tuple/list of 2 int
        Convolution strides of every unit, grouped by stage.
    paddings : list of list of int or tuple/list of 2 int
        Convolution padding of every unit, grouped by stage.
    use_lrn : bool
        Whether to use LRN layer (applied only in the first two stages).
    in_channels : int, default 3
        Number of input channels.
    in_size : tuple of two ints, default (224, 224)
        Spatial size of the expected input image.
    classes : int, default 1000
        Number of classification classes.

    Returns
    -------
    keras.models.Model
        The assembled model, with `in_size` and `classes` stored as attributes.
    """
    # The layout of the input tensor depends on the backend image data format.
    if is_channels_first():
        input_shape = (in_channels, in_size[0], in_size[1])
    else:
        input_shape = (in_size[0], in_size[1], in_channels)
    net_input = nn.Input(shape=input_shape)

    x = net_input
    for stage_idx, stage_channels in enumerate(channels):
        # LRN may only be active in the first two stages.
        stage_use_lrn = use_lrn and (stage_idx < 2)
        for unit_idx, unit_channels in enumerate(stage_channels):
            unit_name = "features/stage{}/unit{}".format(stage_idx + 1, unit_idx + 1)
            x = alex_conv(
                x=x,
                in_channels=in_channels,
                out_channels=unit_channels,
                kernel_size=kernel_sizes[stage_idx][unit_idx],
                strides=strides[stage_idx][unit_idx],
                padding=paddings[stage_idx][unit_idx],
                use_lrn=stage_use_lrn,
                name=unit_name)
            # The next unit consumes what this one produced.
            in_channels = unit_channels
        pool_name = "features/stage{}/pool".format(stage_idx + 1)
        x = maxpool2d(
            x=x,
            pool_size=3,
            strides=2,
            padding=0,
            ceil_mode=True,
            name=pool_name)

    x = flatten(x, reshape=True)
    # The number of flattened features is taken as channels x 6 x 6 (hard-coded spatial size).
    flat_features = in_channels * 6 * 6
    x = alex_output_block(
        x=x,
        in_channels=flat_features,
        classes=classes,
        name="output")

    model = Model(inputs=net_input, outputs=x)
    model.in_size = in_size
    model.classes = classes
    return model


def get_alexnet(version="a",
                model_name=None,
                pretrained=False,
                root=os.path.join("~", ".keras", "models"),
                **kwargs):
    """
    Build an AlexNet model of the requested version and optionally load pretrained weights into it.

    Parameters:
    ----------
    version : str, default 'a'
        Version of AlexNet ('a' or 'b').
    model_name : str or None, default None
        Model name used to look up the pretrained weights.
    pretrained : bool, default False
        Whether to load the pretrained weights for model.
    root : str, default '~/.keras/models'
        Location for keeping the model parameters.
    **kwargs
        Extra keyword arguments forwarded to `alexnet_model`.

    Returns
    -------
    keras.models.Model
        The constructed model.

    Raises
    ------
    ValueError
        If `version` is not supported, or if `pretrained` is set while `model_name` is empty.
    """
    if version not in ("a", "b"):
        raise ValueError("Unsupported AlexNet version {}".format(version))

    # Kernel sizes and strides are common to both versions.
    kernel_sizes = [[11], [5], [3, 3, 3]]
    strides = [[4], [1], [1, 1, 1]]
    if version == "a":
        channels = [[96], [256], [384, 384, 256]]
        paddings = [[0], [2], [1, 1, 1]]
        use_lrn = True
    else:
        channels = [[64], [192], [384, 256, 256]]
        paddings = [[2], [2], [1, 1, 1]]
        use_lrn = False

    net = alexnet_model(
        channels=channels,
        kernel_sizes=kernel_sizes,
        strides=strides,
        paddings=paddings,
        use_lrn=use_lrn,
        **kwargs)

    if not pretrained:
        return net

    # Both None and an empty name are rejected.
    if not model_name:
        raise ValueError("Parameter `model_name` should be properly initialized for loading pretrained model.")
    # Imported lazily, only when weights actually have to be loaded.
    from .model_store import download_model
    download_model(
        net=net,
        model_name=model_name,
        local_model_store_dir_path=root)
    return net


def alexnet(**kwargs):
    """
    Construct the AlexNet model from 'One weird trick for parallelizing convolutional neural networks,'
    https://arxiv.org/abs/1404.5997.

    All keyword arguments are forwarded to `get_alexnet`, with the model name fixed to 'alexnet'.

    Parameters:
    ----------
    pretrained : bool, default False
        Whether to load the pretrained weights for model.
    root : str, default '~/.keras/models'
        Location for keeping the model parameters.
    """
    net = get_alexnet(model_name="alexnet", **kwargs)
    return net


def alexnetb(**kwargs):
    """
    Construct the AlexNet-b model (non-standard version) from 'One weird trick for parallelizing
    convolutional neural networks,' https://arxiv.org/abs/1404.5997.

    All keyword arguments are forwarded to `get_alexnet`, with the version fixed to 'b' and the model name
    fixed to 'alexnetb'.

    Parameters:
    ----------
    pretrained : bool, default False
        Whether to load the pretrained weights for model.
    root : str, default '~/.keras/models'
        Location for keeping the model parameters.
    """
    net = get_alexnet(version="b", model_name="alexnetb", **kwargs)
    return net


def _test():
    """
    Smoke test: build every model, check its number of trainable parameters and the shape of its prediction
    for a single all-zero 224x224 image.
    """
    import numpy as np
    import keras

    pretrained = False

    # Expected number of trainable parameters per model constructor.
    expected_weight_counts = {
        alexnet: 62378344,
        alexnetb: 61100840,
    }

    for model in (alexnet, alexnetb):
        net = model(pretrained=pretrained)
        weight_count = keras.utils.layer_utils.count_params(net.trainable_weights)
        print("m={}, {}".format(model.__name__, weight_count))
        assert weight_count == expected_weight_counts[model]

        # The layout of the dummy batch follows the backend image data format.
        batch_shape = (1, 3, 224, 224) if is_channels_first() else (1, 224, 224, 3)
        x = np.zeros(batch_shape, np.float32)
        y = net.predict(x)
        assert (y.shape == (1, 1000))


# Run the smoke test only when this module is executed as a script.
if __name__ == "__main__":
    _test()