"""Encoder for sentence classification with 1D convolutions and max-pooling.""" from typing import Dict, List, Tuple from typeguard import check_argument_types import tensorflow as tf from neuralmonkey.dataset import Dataset from neuralmonkey.decorators import tensor from neuralmonkey.model.feedable import FeedDict from neuralmonkey.model.parameterized import InitializerSpecs from neuralmonkey.model.model_part import ModelPart from neuralmonkey.model.stateful import Stateful from neuralmonkey.nn.utils import dropout from neuralmonkey.vocabulary import Vocabulary, pad_batch, sentence_mask from neuralmonkey.tf_utils import get_variable class SequenceCNNEncoder(ModelPart, Stateful): """Encoder processing a sequence using a CNN.""" # pylint: disable=too-many-arguments def __init__(self, name: str, vocabulary: Vocabulary, data_id: str, embedding_size: int, filters: List[Tuple[int, int]], max_input_len: int = None, dropout_keep_prob: float = 1.0, reuse: ModelPart = None, save_checkpoint: str = None, load_checkpoint: str = None, initializers: InitializerSpecs = None) -> None: """Create a new instance of the CNN sequence encoder. Based on: Yoon Kim: Convolutional Neural Networks for Sentence Classification (http://emnlp2014.org/papers/pdf/EMNLP2014181.pdf) Arguments: vocabulary: Input vocabulary data_id: Identifier of the data series fed to this encoder name: An unique identifier for this encoder max_input_len: Maximum length of an encoded sequence embedding_size: The size of the embedding vector assigned to each word filters: Specification of CNN filters. It is a list of tuples specifying the filter size and number of channels. dropout_keep_prob: The dropout keep probability (default 1.0) """ check_argument_types() ModelPart.__init__(self, name, reuse, save_checkpoint, load_checkpoint, initializers) self.vocabulary = vocabulary self.data_id = data_id self.max_input_len = max_input_len self.embedding_size = embedding_size self.dropout_keep_prob = dropout_keep_prob self.filters = filters @property def input_types(self) -> Dict[str, tf.DType]: return {self.data_id: tf.string} @property def input_shapes(self) -> Dict[str, tf.TensorShape]: return {self.data_id: tf.TensorShape([None, None])} @tensor def inputs(self) -> tf.Tensor: return self.vocabulary.strings_to_indices(self.input_tokens) @tensor def input_tokens(self) -> tf.Tensor: return self.dataset[self.data_id] @tensor def input_mask(self) -> tf.Tensor: return sentence_mask(self.inputs) @tensor def embedded_inputs(self) -> tf.Tensor: with tf.variable_scope("input_projection"): embedding_matrix = get_variable( "word_embeddings", [len(self.vocabulary), self.embedding_size], initializer=tf.variance_scaling_initializer( mode="fan_avg", distribution="uniform")) return dropout( tf.nn.embedding_lookup(embedding_matrix, self.inputs), self.dropout_keep_prob, self.train_mode) @tensor def output(self) -> tf.Tensor: pooled_outputs = [] for filter_size, num_filters in self.filters: with tf.variable_scope("conv-maxpool-%s" % filter_size): # Convolution Layer filter_shape = [filter_size, self.embedding_size, num_filters] w_filter = get_variable( "conv_W", filter_shape, initializer=tf.variance_scaling_initializer( mode="fan_avg", distribution="uniform")) b_filter = get_variable( "conv_bias", [num_filters], initializer=tf.zeros_initializer()) conv = tf.nn.conv1d( self.embedded_inputs, w_filter, stride=1, padding="VALID", name="conv") # Apply nonlinearity conv_relu = tf.nn.relu(tf.nn.bias_add(conv, b_filter)) # Max-pooling over the outputs pooled = 
tf.reduce_max(conv_relu, 1) pooled_outputs.append(pooled) # Combine all the pooled features return tf.concat(pooled_outputs, axis=1) def feed_dict(self, dataset: Dataset, train: bool = False) -> FeedDict: """Populate the feed dictionary with the encoder inputs. Arguments: dataset: The dataset to use train: Boolean flag telling whether it is training time """ fd = ModelPart.feed_dict(self, dataset, train) sentences = dataset.get_series(self.data_id) fd[self.input_tokens] = pad_batch(list(sentences), self.max_input_len) return fd
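
# ---------------------------------------------------------------------------
# Usage sketch (illustrative only, not part of the module). In Neural Monkey,
# model parts like this one are normally instantiated from an INI
# configuration file rather than constructed directly; the Python call below
# is an assumption showing how the constructor arguments map onto the Kim
# (2014) setup. `vocabulary` stands for an already-built neuralmonkey
# Vocabulary object.
#
#     encoder = SequenceCNNEncoder(
#         name="cnn_encoder",
#         vocabulary=vocabulary,      # a neuralmonkey Vocabulary instance
#         data_id="source",           # data series holding the input tokens
#         embedding_size=300,
#         filters=[(3, 100), (4, 100), (5, 100)],  # (filter size, channels)
#         max_input_len=50,
#         dropout_keep_prob=0.5)
#
# With this configuration, `encoder.output` is a tensor of shape
# [batch, 300]: each filter width contributes one max-pooled 100-dimensional
# feature vector, and the three vectors are concatenated along axis 1.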