import chainer
import chainer.backends
from chainer.backends.cuda import cupy
import chainer.links as L
import chainer.testing
import chainer.testing.attr
import chainermn
import numpy as np
import pytest


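# Wraps a test-parameter dict so that its entries (currently only 'dtype')
# are accessible as attributes.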
class Param(object):
    def __init__(self, param):
        self.dtype = None
        self.__dict__.update(param)


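# The models below are exercised with float16, float32, and Chainer's
# mixed16 (mixed-precision) dtype mode.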
params = [Param(p) for p in [
    {
        'dtype': np.float16,
    }, {
        'dtype': np.float32,
    }, {
        'dtype': chainer.mixed16
    }]]


class Cycle0SubA(chainer.Chain):
    def __init__(self, size):
        super(Cycle0SubA, self).__init__()
        with self.init_scope():
            self.f = L.Linear(size, size)

    def __call__(self, x):
        return self.f(x)


class Cycle0SubB(chainer.Chain):
    def __init__(self, size):
        super(Cycle0SubB, self).__init__()
        with self.init_scope():
            self.f = L.Linear(size, 2)

    def __call__(self, h):
        return self.f(h)


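# Cycle0 runs on rank 0: Cycle0SubA consumes the local input and sends its
# output to rank_next, while Cycle0SubB receives the result of the cycle
# from rank_prev and returns it locally to the classifier.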
class Cycle0(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_next, rank_prev):
        super(Cycle0, self).__init__(comm=comm)
        self.add_link(Cycle0SubA(size), rank_in=None, rank_out=rank_next)
        self.add_link(Cycle0SubB(size), rank_in=rank_prev, rank_out=None)


class Cycle1Sub(chainer.Chain):
    def __init__(self, size):
        super(Cycle1Sub, self).__init__()
        with self.init_scope():
            self.f = L.Linear(size, size)

    def __call__(self, h):
        return self.f(h)


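# Cycle1 runs on every other rank: it receives from rank_prev, applies one
# linear layer, and forwards the result to rank_next.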
class Cycle1(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_next, rank_prev):
        super(Cycle1, self).__init__(comm=comm)
        self.add_link(Cycle1Sub(size), rank_in=rank_prev, rank_out=rank_next)


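# Cross0 and Cross1 register the same send/receive links in opposite order,
# so the communication patterns of neighbouring ranks cross each other.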
class Cross0(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_next, rank_prev):
        super(Cross0, self).__init__(comm=comm)
        self.add_link(Cycle0SubA(size), rank_in=None, rank_out=rank_next)
        self.add_link(Cycle0SubB(size), rank_in=rank_prev, rank_out=None)


class Cross1(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_next, rank_prev):
        super(Cross1, self).__init__(comm=comm)
        self.add_link(Cycle0SubB(size), rank_in=rank_prev, rank_out=None)
        self.add_link(Cycle0SubA(size), rank_in=None, rank_out=rank_next)


class BranchSubA(chainer.Chain):
    def __init__(self, size):
        super(BranchSubA, self).__init__()
        with self.init_scope():
            self.f = L.Linear(size, size)

    def __call__(self, x):
        return self.f(x)


class BranchSubB(chainer.Chain):
    def __init__(self, size):
        super(BranchSubB, self).__init__()
        with self.init_scope():
            self.f = L.Linear(size, size)

    def __call__(self, *xs):
        x = xs[0]
        for _x in xs[1:]:
            x = x + _x
        return self.f(x)


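# The BranchParent* variants broadcast the output of a BranchSubA link to
# all children (the 2/3/4 variants also route one branch through the parent
# itself); BranchSubB then sums the branches that come back.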
class BranchParent1(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_children):
        super(BranchParent1, self).__init__(comm=comm)
        self.add_link(BranchSubA(size), rank_in=None, rank_out=rank_children)
        self.add_link(BranchSubB(size), rank_in=rank_children, rank_out=None)


class BranchParent2(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_children):
        super(BranchParent2, self).__init__(comm=comm)
        ranks = [comm.rank] + rank_children
        self.add_link(BranchSubA(size), rank_in=None, rank_out=ranks)
        self.add_link(BranchSubA(size), rank_in=comm.rank, rank_out=comm.rank)
        self.add_link(BranchSubB(size), rank_in=ranks, rank_out=None)


class BranchParent3(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_children):
        super(BranchParent3, self).__init__(comm=comm)
        ranks = rank_children + [comm.rank]
        self.add_link(BranchSubA(size), rank_in=None, rank_out=ranks)
        self.add_link(BranchSubA(size), rank_in=comm.rank, rank_out=comm.rank)
        self.add_link(BranchSubB(size), rank_in=ranks, rank_out=None)


class BranchParent4(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_children):
        super(BranchParent4, self).__init__(comm=comm)
        ranks = rank_children + [comm.rank]
        ranks = ranks[1:] + ranks[0:1]
        self.add_link(BranchSubA(size), rank_in=None, rank_out=ranks)
        self.add_link(BranchSubA(size), rank_in=comm.rank, rank_out=comm.rank)
        self.add_link(BranchSubB(size), rank_in=ranks, rank_out=None)


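# BranchChild receives one branch from the parent, applies a linear layer,
# and sends the result straight back.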
class BranchChild(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_parent):
        super(BranchChild, self).__init__(comm=comm)
        self.add_link(
            BranchSubA(size),
            rank_in=rank_parent,
            rank_out=rank_parent)


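# The Twist* models exchange activations in both directions: the end ranks
# trade data with their single neighbour, while every intermediate rank
# sends its local input to both neighbours and merges the activations it
# receives from them.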
class TwistFirst(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_next):
        super(TwistFirst, self).__init__(comm=comm)
        self.add_link(BranchSubA(size), rank_in=None, rank_out=rank_next)
        self.add_link(BranchSubA(size), rank_in=rank_next, rank_out=None)


class Twist(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_prev, rank_next):
        super(Twist, self).__init__(comm=comm)
        self.add_link(BranchSubA(size), rank_in=rank_prev, rank_out=comm.rank)
        self.add_link(BranchSubA(size), rank_in=None, rank_out=rank_prev)
        self.add_link(BranchSubA(size), rank_in=None, rank_out=rank_next)
        self.add_link(BranchSubA(size), rank_in=rank_next, rank_out=comm.rank)
        self.add_link(
            BranchSubB(size),
            rank_in=[comm.rank, comm.rank],
            rank_out=None)


class TwistLast(chainermn.MultiNodeChainList):
    def __init__(self, size, comm, rank_prev):
        super(TwistLast, self).__init__(comm=comm)
        self.add_link(BranchSubA(size), rank_in=rank_prev, rank_out=None)
        self.add_link(BranchSubA(size), rank_in=None, rank_out=rank_prev)


class TupleDataSubA(chainer.Chain):
    def __init__(self, size):
        super(TupleDataSubA, self).__init__()
        with self.init_scope():
            self.f0 = L.Linear(size, size)
            self.f1 = L.Linear(size, size)

    def __call__(self, x):
        y0 = self.f0(x)
        y1 = self.f1(x)
        return y0, y1


class TupleDataSubB(chainer.Chain):
    def __init__(self, size):
        super(TupleDataSubB, self).__init__()
        with self.init_scope():
            self.f0 = L.Linear(size, size)
            self.f1 = L.Linear(size, size)

    def __call__(self, x):
        # TupleDataSubB receives a two-element tuple from TupleDataSubA.
        x0, x1 = x
        y0 = self.f0(x0)
        y1 = self.f1(x1)
        return y0 + y1


class TupleDataSubC(chainer.Chain):
    def __init__(self, size):
        super(TupleDataSubC, self).__init__()
        with self.init_scope():
            self.f = L.Linear(size, size)

    def __call__(self, x):
        return self.f(x)


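# TupleDataParent sends the two-element tuple produced by TupleDataSubA to
# the child rank; the child merges it with TupleDataSubB and sends a single
# variable back, which TupleDataSubC consumes.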
class TupleDataParent(chainermn.MultiNodeChainList):
    def __init__(self, comm, size, rank_child):
        super(TupleDataParent, self).__init__(comm=comm)
        self.add_link(TupleDataSubA(size), rank_in=None, rank_out=rank_child)
        self.add_link(TupleDataSubC(size), rank_in=rank_child, rank_out=None)


class TupleDataChild(chainermn.MultiNodeChainList):
    def __init__(self, comm, size, rank_parent):
        super(TupleDataChild, self).__init__(comm=comm)
        self.add_link(
            TupleDataSubB(size), rank_in=rank_parent, rank_out=rank_parent)


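# Creates the communicator ('flat' for GPU runs, 'naive' for CPU runs),
# binds the process to its GPU, skips the test when run on a single
# process, and returns the ranks of the neighbouring processes.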
def create_communicator(gpu):
    if gpu:
        communicator = chainermn.create_communicator('flat')
        chainer.backends.cuda.get_device_from_id(
            communicator.intra_rank).use()
    else:
        communicator = chainermn.create_communicator('naive')

    if communicator.size < 2:
        pytest.skip('This test is for multinode only')

    rank_next = (communicator.rank + 1) % communicator.size
    rank_prev = (communicator.rank - 1) % communicator.size
    return communicator, rank_next, rank_prev


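# Rank 0 trains a classifier over the cycle model; every other rank only
# pumps activations through Cycle1, so its forward pass takes no local data.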
def check_cycle_model(gpu, param):
    communicator, rank_next, rank_prev = create_communicator(gpu)

    n, d = 100, 10

    with chainer.using_config('dtype', param.dtype):
        if communicator.rank == 0:
            X = np.random.randn(n, d).astype(param.dtype)
            Y = (np.random.rand(n) * 2).astype(np.int32)
            model = L.Classifier(
                Cycle0(d, communicator, rank_next, rank_prev))

            if gpu:
                model.to_device(cupy.cuda.Device())
                X = chainer.backends.cuda.to_gpu(X)
                Y = chainer.backends.cuda.to_gpu(Y)

            for i in range(n):
                err = model(X[i:i + 1], Y[i:i + 1])
                err.backward()
        else:
            model = Cycle1(
                d, communicator, rank_next, rank_prev)
            if gpu:
                model.to_device(cupy.cuda.Device())

            for i in range(n):
                err = model()
                err.backward()


@pytest.mark.parametrize('param', params)
def test_cycle_model_cpu(param):
    check_cycle_model(False, param)


@pytest.mark.parametrize('param', params)
@chainer.testing.attr.gpu
def test_cycle_model_gpu(param):
    check_cycle_model(True, param)


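# Every rank holds a full classifier: each forward pass sends the local
# activation to one neighbour and classifies the activation received from
# the other.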
def check_crossing_model(gpu, param):
    communicator, rank_next, rank_prev = create_communicator(gpu)

    n, d = 100, 10
    X = np.random.randn(n, d).astype(param.dtype)
    Y = (np.random.rand(n) * 2).astype(np.int32)

    with chainer.using_config('dtype', param.dtype):
        if communicator.rank == 0:
            model = L.Classifier(Cross0(
                d, communicator, rank_next, rank_prev))
        else:
            model = L.Classifier(Cross1(
                d, communicator, rank_next, rank_prev))

        if gpu:
            model.to_device(cupy.cuda.Device())
            X = chainer.backends.cuda.to_gpu(X)
            Y = chainer.backends.cuda.to_gpu(Y)

        for i in range(n):
            err = model(X[i:i + 1], Y[i:i + 1])
            err.backward()


@pytest.mark.parametrize('param', params)
def test_crossing_model_cpu(param):
    check_crossing_model(False, param)


@pytest.mark.parametrize('param', params)
@chainer.testing.attr.gpu
def test_crossing_model_gpu(param):
    check_crossing_model(True, param)


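# Rank 0 acts as the parent of every other rank for the given BranchParent
# variant; the children run BranchChild and therefore take no local data.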
def check_branching_model(gpu, communicator, rank_next, rank_prev,
                          parent_model, param):
    n, d = 100, 10
    X = np.random.randn(n, d).astype(param.dtype)
    Y = (np.random.rand(n) * 2).astype(np.int32)

    with chainer.using_config('dtype', param.dtype):
        if communicator.rank == 0:
            rank_children = [rank for rank in range(1, communicator.size)]
            model = L.Classifier(parent_model(
                d, communicator, rank_children))
            if gpu:
                model.to_device(cupy.cuda.Device())
                X = chainer.backends.cuda.to_gpu(X)
                Y = chainer.backends.cuda.to_gpu(Y)

            for i in range(n):
                err = model(X[i:i + 1], Y[i:i + 1])
                err.backward()
        else:
            model = BranchChild(d, communicator, 0)
            if gpu:
                model.to_device(cupy.cuda.Device())

            for i in range(n):
                err = model()
                err.backward()


def check_branching_models(gpu, param):
    communicator, rank_next, rank_prev = create_communicator(gpu)
    check_branching_model(gpu, communicator, rank_next, rank_prev,
                          BranchParent1, param)

    check_branching_model(gpu, communicator, rank_next, rank_prev,
                          BranchParent2, param)

    check_branching_model(gpu, communicator, rank_next, rank_prev,
                          BranchParent3, param)

    check_branching_model(gpu, communicator, rank_next, rank_prev,
                          BranchParent4, param)


@pytest.mark.parametrize('param', params)
def test_branching_models_cpu(param):
    check_branching_models(False, param)


@pytest.mark.parametrize('param', params)
@chainer.testing.attr.gpu
def test_branching_models_gpu(param):
    check_branching_models(True, param)


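# The first, last, and intermediate ranks use TwistFirst, TwistLast, and
# Twist respectively; every rank holds a classifier fed with its own data.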
def check_twisting_model(gpu, param):
    communicator, rank_next, rank_prev = create_communicator(gpu)

    n, d = 100, 10
    X = np.random.randn(n, d).astype(param.dtype)
    Y = (np.random.rand(n) * 2).astype(np.int32)

    with chainer.using_config('dtype', param.dtype):
        if communicator.rank == 0:
            model = L.Classifier(
                TwistFirst(d, communicator, rank_next))
        elif communicator.rank == communicator.size - 1:
            model = L.Classifier(
                TwistLast(d, communicator, rank_prev))
        else:
            model = L.Classifier(Twist(
                d, communicator, rank_prev, rank_next))

        if gpu:
            model.to_device(cupy.cuda.Device())
            X = chainer.backends.cuda.to_gpu(X)
            Y = chainer.backends.cuda.to_gpu(Y)

        for i in range(n):
            err = model(X[i:i + 1], Y[i:i + 1])
            err.backward()


@pytest.mark.parametrize('param', params)
def test_twisting_model_cpu(param):
    check_twisting_model(False, param)


@pytest.mark.parametrize('param', params)
@chainer.testing.attr.gpu
def test_twisting_model_gpu(param):
    check_twisting_model(True, param)


def check_tuple_data_model(gpu, param):
    # This test pairs up ranks (0, 1), (2, 3), ..., (2m, 2m+1): each even
    # rank acts as the parent and the following odd rank as its child.
    communicator, rank_next, rank_prev = create_communicator(gpu)

    n, d = 100, 10
    X = np.random.randn(n, d).astype(param.dtype)
    Y = (np.random.rand(n) * 2).astype(np.int32)

    with chainer.using_config('dtype', param.dtype):
        if communicator.rank % 2 == 0:
            if communicator.rank == communicator.size - 1:
                # the last even rank has no child when the world size is odd
                return
            model = L.Classifier(
                TupleDataParent(communicator, d, rank_next))
        elif communicator.rank % 2 == 1:
            model = TupleDataChild(communicator, d, rank_prev)

        assert model is not None
        if gpu:
            model.to_device(cupy.cuda.Device())
            X = chainer.backends.cuda.to_gpu(X)
            Y = chainer.backends.cuda.to_gpu(Y)

        for i in range(n):
            if communicator.rank % 2 == 0:
                err = model(X[i:i + 1], Y[i:i + 1])
            elif communicator.rank % 2 == 1:
                err = model()
            assert err is not None
            err.backward()


@pytest.mark.parametrize('param', params)
def test_tuple_data_model_cpu(param):
    check_tuple_data_model(False, param)


@pytest.mark.parametrize('param', params)
@chainer.testing.attr.gpu
def test_tuple_data_model_gpu(param):
    check_tuple_data_model(True, param)