from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

from tensorflow.contrib.layers.python.layers import initializers

import tensorflow as tf

slim = tf.contrib.slim

epsilon = 1e-9


def _matmul_broadcast(x, y, name):
  """Compute x @ y, broadcasting over the first `N - 2` ranks.
  """
  with tf.variable_scope(name) as scope:
    # Expand x to [..., I, J, 1] and y to [..., 1, J, K], multiply, and sum
    # over the shared J axis; this is a batched matmul with broadcasting.
    return tf.reduce_sum(
      x[..., tf.newaxis] * y[..., tf.newaxis, :, :], axis=-2
    )


def _get_variable_wrapper(
  name, shape=None, dtype=None, initializer=None, regularizer=None,
  trainable=True, collections=None, caching_device=None, partitioner=None,
  validate_shape=True, custom_getter=None
):
  """Wrapper over tf.get_variable() that places variables on the CPU.
  """
  with tf.device('/cpu:0'):
    var = tf.get_variable(
      name, shape=shape, dtype=dtype, initializer=initializer,
      regularizer=regularizer, trainable=trainable,
      collections=collections, caching_device=caching_device,
      partitioner=partitioner, validate_shape=validate_shape,
      custom_getter=custom_getter
    )
  return var


def _get_weights_wrapper(
  name, shape, dtype=tf.float32,
  initializer=initializers.xavier_initializer(),
  weights_decay_factor=None
):
  """Wrapper over _get_variable_wrapper() to get weights, with an optional
  weight-decay term added to the 'losses' collection.
  """
  weights = _get_variable_wrapper(
    name=name, shape=shape, dtype=dtype, initializer=initializer
  )
  if weights_decay_factor is not None and weights_decay_factor > 0.0:
    weights_wd = tf.multiply(
      tf.nn.l2_loss(weights), weights_decay_factor, name=name + '/l2loss'
    )
    tf.add_to_collection('losses', weights_wd)
  return weights


def _get_biases_wrapper(
  name, shape, dtype=tf.float32, initializer=tf.constant_initializer(0.0)
):
  """Wrapper over _get_variable_wrapper() to get biases.
  """
  biases = _get_variable_wrapper(
    name=name, shape=shape, dtype=dtype, initializer=initializer
  )
  return biases


def _conv2d_wrapper(
  inputs, shape, strides, padding, add_bias, activation_fn, name, stddev=0.1
):
  """Wrapper over tf.nn.conv2d().
  """
  with tf.variable_scope(name) as scope:
    kernel = _get_weights_wrapper(
      name='weights', shape=shape, weights_decay_factor=0.0,
      # initializer=tf.truncated_normal_initializer(stddev=stddev, dtype=tf.float32)
    )
    output = tf.nn.conv2d(
      inputs, filter=kernel, strides=strides, padding=padding, name='conv'
    )
    if add_bias:
      biases = _get_biases_wrapper(
        name='biases', shape=[shape[-1]]
      )
      output = tf.add(
        output, biases, name='biasAdd'
      )
    if activation_fn is not None:
      output = activation_fn(
        output, name='activation'
      )
  return output


def _separable_conv2d_wrapper(
  inputs, depthwise_shape, pointwise_shape, strides, padding, add_bias,
  activation_fn, name
):
  """Wrapper over tf.nn.separable_conv2d().
  """
  with tf.variable_scope(name) as scope:
    dkernel = _get_weights_wrapper(
      name='depthwise_weights', shape=depthwise_shape, weights_decay_factor=0.0
    )
    pkernel = _get_weights_wrapper(
      name='pointwise_weights', shape=pointwise_shape, weights_decay_factor=0.0
    )
    output = tf.nn.separable_conv2d(
      input=inputs, depthwise_filter=dkernel, pointwise_filter=pkernel,
      strides=strides, padding=padding, name='conv'
    )
    if add_bias:
      biases = _get_biases_wrapper(
        name='biases', shape=[pointwise_shape[-1]]
      )
      output = tf.add(
        output, biases, name='biasAdd'
      )
    if activation_fn is not None:
      output = activation_fn(
        output, name='activation'
      )
  return output


def _depthwise_conv2d_wrapper(
  inputs, shape, strides, padding, add_bias, activation_fn, name
):
  """Wrapper over tf.nn.depthwise_conv2d().
  """
  with tf.variable_scope(name) as scope:
    dkernel = _get_weights_wrapper(
      name='depthwise_weights', shape=shape, weights_decay_factor=0.0
    )
    output = tf.nn.depthwise_conv2d(
      inputs, filter=dkernel, strides=strides, padding=padding, name='conv'
    )
    if add_bias:
      # Depthwise output channels = in_channels * channel_multiplier.
      d_ = output.get_shape()[-1].value
      biases = _get_biases_wrapper(
        name='biases', shape=[d_]
      )
      output = tf.add(
        output, biases, name='biasAdd'
      )
    if activation_fn is not None:
      output = activation_fn(
        output, name='activation'
      )
  return output