python source code of compute

models-master
- Makefile
- requirements-test.txt
- third_party
  - licenses.txt
- LICENSE
- models
  - language_translation
    - __init__.py
    - tensorflow
      - mlperf_gnmt
        __init__.py
        fp32
        nmt_utils.py
        evaluation_utils.py
        rouge.py
        __init__.py
        misc_utils.py
        run_inference.py
        hparam.py
        bleu.py
      - transformer_mlperf
        training
        bfloat16
        run_and_time.sh
        run_preprocessing.sh
        transformer
        utils
        tokenizer.py
        metrics.py
        tokenizer_test.py
        __init__.py
        dataset.py
        compute_bleu_test.py
        compute_bleu.py
        __init__.py
        data_download.py
        README.md
        model
        embedding_layer.py
        transformer.py
        model_utils_test.py
        attention_layer.py
        __init__.py
        model_params.py
        ffn_layer.py
        model_utils.py
        beam_search.py
        beam_search_test.py
        translate.py
        transformer_main.py
        vocab
        process_data.py
        fp32
        run_and_time.sh
        run_preprocessing.sh
        transformer
        utils
        tokenizer.py
        metrics.py
        tokenizer_test.py
        __init__.py
        dataset.py
        compute_bleu_test.py
        compute_bleu.py
        __init__.py
        data_download.py
        README.md
        model
        embedding_layer.py
        transformer.py
        model_utils_test.py
        attention_layer.py
        __init__.py
        model_params.py
        ffn_layer.py
        model_utils.py
        beam_search.py
        beam_search_test.py
        translate.py
        transformer_main.py
        vocab
        process_data.py
      - __init__.py
      - transformer_lt_official
        inference
        fp32
        utils
        tokenizer.py
        metrics.py
        tokenizer_test.py
        __init__.py
        official
        utils
        hyperparams_flags.py
        __init__.py
        logs
        hooks_helper_test.py
        cloud_lib_test.py
        metric_hook_test.py
        metric_hook.py
        guidelines.md
        mlperf_helper.py
        hooks.py
        logger.py
        hooks_test.py
        logger_test.py
        __init__.py
        cloud_lib.py
        hooks_helper.py
        flags
        flags_test.py
        guidelines.md
        _misc.py
        __init__.py
        README.md
        _benchmark.py
        _performance.py
        core.py
        _base.py
        _conventions.py
        _device.py
        _distribution.py
        compute_bleu.py
        infer_ab.py
  - reinforcement
    - __init__.py
    - tensorflow
      - minigo
        training
        __init__.py
        requirements.txt
        fp32
        bazel-clean-large-scale.patch
        avoid-repeated-clone-singlenode.patch
        get-data.patch
        mlperf_split.patch
        bazel-clean-single-node.patch
        large-scale-no-bg.patch
        minigo_mlperf.patch
        avoid-repeated-clone-multinode.patch
        tune_for_many_core.patch
        __init__.py
      - __init__.py
  - recommendation
    - __init__.py
    - tensorflow
      - wide_deep
        __init__.py
        inference
        __init__.py
        fp32
        wide_deep_inference.py
        __init__.py
      - wide_deep_large_ds
        training
        train.py
        __init__.py
        dataset
        featurecolumn_graph_optimization.py
        preprocess_csv_tfrecords.py
        __init__.py
        inference
        parallel_inference.py
        __init__.py
        inference.py
      - __init__.py
      - ncf
        training
        neumf_model.py
        ncf_common.py
        __init__.py
        ncf_estimator_main.py
  - common
    - __init__.py
    - tensorflow
      - mlperf_compliance
        tf_mlperf_log.py
        _transformer_tags.py
        _maskrcnn_tags.py
        mlperf_log.py
        _gnmt_tags.py
        _ncf_tags.py
        _resnet_tags.py
        resnet_log_helper.py
        tags.py
        __init__.py
        _ssd_tags.py
        test_tag_set.py
      - mlperf_utils
        misc
        __init__.py
        model_helpers.py
        export
        export.py
        __init__.py
        arg_parsers
        __init__.py
        parsers.py
        __init__.py
        logs
        metric_hook.py
        benchmark_uploader.py
        hooks.py
        logger.py
        __init__.py
        hooks_helper.py
      - __init__.py
  - image_recognition
    - __init__.py
    - tensorflow
      - inceptionv4
        inference
        cnn_util.py
        preprocessing.py
        accuracy.py
        datasets.py
        __init__.py
        benchmark.py
      - inceptionv3
        fp32
        eval_image_classifier_inference.py
        preprocessing.py
        datasets.py
        __init__.py
        int8
        cnn_util.py
        preprocessing.py
        accuracy.py
        datasets.py
        __init__.py
        preprocessing_benchmark.py
        calibration.py
        benchmark.py
      - resnet101
        __init__.py
        inference
        vgg_preprocessing.py
        eval_image_classifier_inference.py
        preprocessing.py
        datasets.py
        __init__.py
        int8
        vgg_preprocessing.py
        cnn_util.py
        preprocessing.py
        datasets.py
        __init__.py
        calibration.py
      - resnet50v1_5
        training
        mlperf_compliance
        tf_mlperf_log.py
        _transformer_tags.py
        _maskrcnn_tags.py
        mlperf_log.py
        _gnmt_tags.py
        _ncf_tags.py
        _resnet_tags.py
        resnet_log_helper.py
        tags.py
        __init__.py
        _ssd_tags.py
        test_tag_set.py
        mlperf_utils
        misc
        __init__.py
        model_helpers.py
        export
        export.py
        __init__.py
        arg_parsers
        __init__.py
        parsers.py
        __init__.py
        logs
        metric_hook.py
        benchmark_uploader.py
        hooks.py
        logger.py
        __init__.py
        hooks_helper.py
        __init__.py
        mlperf_resnet
        resnet_run_loop.py
        resnet_model.py
        __init__.py
        imagenet_main.py
        imagenet_preprocessing.py
        __init__.py
        inference
        eval_image_classifier_inference.py
        preprocessing.py
        datasets.py
        __init__.py
        int8
        generate_calibration_data.py
        cnn_util.py
        preprocessing.py
        datasets.py
        __init__.py
        preprocessing_benchmark.py
        benchmark.py
      - resnet50
        __init__.py
        inference
        eval_image_classifier_inference.py
        preprocessing.py
        datasets.py
        __init__.py
        int8
        generate_calibration_data.py
        cnn_util.py
        preprocessing.py
        datasets.py
        __init__.py
        preprocessing_benchmark.py
        benchmark.py
      - mobilenet_v1
        inference
        fp32
        cnn_util.py
        accuracy.py
        accuracy_preprocessing.py
        eval_image_classifier.py
        benchmark.py
        accuracy_datasets.py
        int8
        cnn_util.py
        preprocessing.py
        accuracy.py
        datasets.py
        __init__.py
        calibration.py
        benchmark.py
      - __init__.py
      - densenet169
        inference
        fp32
        image_preprocessing.py
        cnn_util.py
        accuracy.py
        densenet_preprocessing.py
        dataset.py
        benchmark.py
  - __init__.py
  - object_detection
    - __init__.py
    - tensorflow
      - ssd-mobilenet
        __init__.py
        inference
        coco_label_map.py
        coco_detection_evaluator.py
        __init__.py
        ssdmobilenet_preprocess.pb
        fp32
        infer_detections.py
        __init__.py
        coco_tools.py
        int8
        infer_detections.py
        __init__.py
      - __init__.py
      - ssd-resnet34
        training
        bfloat16
        benchmark-tf-2.0.diff
        __init__.py
        benchmark-bfloat16.diff
        __init__.py
        fp32
        benchmark-tf-2.0.diff
        __init__.py
        __init__.py
        inference
        tensorflow_models_tf2.0.patch
        __init__.py
        fp32
        infer_detections.py
        __init__.py
        coco_constants.py
        tensorflow_benchmarks_tf2.0.patch
        int8
        infer_detections.py
        __init__.py
        coco_constants.py
      - rfcn
        __init__.py
        inference
        tf-2.0.patch
        __init__.py
        fp32
        evaluator.py
        eval.py
        run_rfcn_inference.py
        dataset_util.py
        __init__.py
        eval_util.py
        coco_mAP.sh
        int8
        run_rfcn_inference.py
        __init__.py
        coco_mAP.sh
  - language_modeling
    - tensorflow
      - bert_large
        training
        bfloat16
        run_pretraining.py
        modeling_test.py
        run_pretraining_ckppoint.sh
        run_classifier_with_tfhub.py
        modeling.py
        sample_text.txt
        optimization_test.py
        create_pretraining_data.py
        optimization.py
        run_squad.py
        CONTRIBUTING.md
        run_classifier.py
        multilingual.md
        predicting_movie_reviews_with_bert_on_tf_hub.ipynb
        __init__.py
        README.md
        create_pretraining_data.sh
        tokenization.py
        requirements.txt
        tokenization_test.py
        generic_ops.py
        extract_features.py
        __init__.py
        fp32
        run_pretraining.py
        run_classifier.sh
        run_pretraining.sh
        modeling_test.py
        run_pretraining_ckppoint.sh
        run_classifier_with_tfhub.py
        modeling.py
        sample_text.txt
        optimization_test.py
        LICENSE
        create_pretraining_data.py
        optimization.py
        run_squad.py
        CONTRIBUTING.md
        run_classifier.py
        multilingual.md
        predicting_movie_reviews_with_bert_on_tf_hub.ipynb
        __init__.py
        README.md
        create_pretraining_data.sh
        tokenization.py
        requirements.txt
        tokenization_test.py
        run_squad_large.sh
        generic_ops.py
        extract_features.py
        __init__.py
        inference
        run_pretraining.py
        modeling_test.py
        evaluate-v1.1.py
        run_pretraining_ckppoint.sh
        run_classifier_with_tfhub.py
        modeling.py
        sample_text.txt
        optimization_test.py
        create_pretraining_data.py
        optimization.py
        run_squad.py
        CONTRIBUTING.md
        run_classifier.py
        multilingual.md
        predicting_movie_reviews_with_bert_on_tf_hub.ipynb
        __init__.py
        README.md
        create_pretraining_data.sh
        tokenization.py
        requirements.txt
        tokenization_test.py
        generic_ops.py
        extract_features.py
      - __init__.py
- benchmarks
  - language_translation
    - __init__.py
    - tensorflow
      - mlperf_gnmt
        __init__.py
        README.md
        requirements.txt
        inference
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
      - transformer_mlperf
        training
        bfloat16
        config.json
        model_init.py
        __init__.py
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        README.md
      - __init__.py
      - transformer_lt_official
        __init__.py
        README.md
        requirements.txt
        inference
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
  - reinforcement
    - __init__.py
    - tensorflow
      - minigo
        training
        __init__.py
        fp32
        model_init.py
        __init__.py
        __init__.py
        README.md
        requirements.txt
      - __init__.py
  - recommendation
    - __init__.py
    - tensorflow
      - wide_deep
        __init__.py
        README.md
        inference
        __init__.py
        fp32
        model_init.py
        __init__.py
        data_download.py
      - wide_deep_large_ds
        training
        __init__.py
        fp32
        model_init.py
        __init__.py
        readme.txt
        __init__.py
        README.md
        inference
        readme.txt
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        int8
        config.json
        model_init.py
        __init__.py
      - __init__.py
      - ncf
        training
        bfloat16
        config.json
        model_init.py
        __init__.py
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
  - common
    - utils
      - __init__.py
      - validators.py
      - multi_instance.py
    - base_benchmark_util.py
    - base_model_init.py
    - __init__.py
    - platform_util.py
    - tensorflow
      - run_tf_benchmark.py
      - __init__.py
      - start.sh
  - image_recognition
    - __init__.py
    - tensorflow
      - inceptionv4
        __init__.py
        README.md
        inference
        config.json
        inceptionv4_model_init.py
        __init__.py
        fp32
        model_init.py
        __init__.py
        int8
        model_init.py
        __init__.py
      - inceptionv3
        __init__.py
        README.md
        inference
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        int8
        config.json
        model_init.py
        __init__.py
      - resnet101
        __init__.py
        README.md
        inference
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        int8
        config.json
        model_init.py
        __init__.py
      - resnet50v1_5
        training
        bfloat16
        model_init.py
        __init__.py
        __init__.py
        common_resnet50
        config.json
        __init__.py
        resnet50_model_init.py
        fp32
        model_init.py
        __init__.py
        __init__.py
        README.md
        inference
        bfloat16
        config.json
        model_init.py
        __init__.py
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        int8
        config.json
        model_init.py
        __init__.py
      - resnet50
        __init__.py
        README.md
        inference
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        int8
        config.json
        model_init.py
        __init__.py
      - mobilenet_v1
        __init__.py
        README.md
        inference
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        int8
        config.json
        model_init.py
        __init__.py
      - __init__.py
      - densenet169
        __init__.py
        README.md
        inference
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
  - __init__.py
  - README.md
  - object_detection
    - __init__.py
    - tensorflow
      - ssd-mobilenet
        __init__.py
        README.md
        requirements.txt
        inference
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        int8
        config.json
        model_init.py
        __init__.py
      - __init__.py
      - ssd-resnet34
        training
        bfloat16
        config.json
        model_init.py
        __init__.py
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        __init__.py
        README.md
        requirements.txt
        inference
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        int8
        config.json
        model_init.py
        __init__.py
      - rfcn
        __init__.py
        README.md
        requirements.txt
        inference
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        int8
        config.json
        model_init.py
        __init__.py
  - launch_benchmark.py
  - language_modeling
    - tensorflow
      - bert_large
        training
        bfloat16
        config.json
        model_init.py
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
        __init__.py
        README.md
        inference
        bfloat16
        config.json
        model_init.py
        __init__.py
        __init__.py
        fp32
        config.json
        model_init.py
        __init__.py
- __init__.py
- Contribute.md
- README.md
- tests
  - test_utils
    - platform_config.py
    - io.py
    - __init__.py
  - __init__.py
  - README.md
  - unit
    - test_launch_benchmark.py
    - common
      - utils
        test_validators.py
        files
        sorted_membind_info.json
        inference_prefix_exception.json
        membind_info.json
        inference_prefix_ht.json
        inference_prefix_no_ht.json
        test_multi_instance.py
      - test_platform_util.py
      - test_base_model_init.py
      - __init__.py
      - tensorflow
        test_run_tf_benchmarks.py
        tf_model_args
        tf_resnet50_args.json
        tf_resnet50v1_5_args.json
        tf_mobilenet_v1_args.json
        tf_inceptionv3_args.json
        tf_densenet169_args.json
        tf_rfcn_args.json
        tf_gnmt_args.json
        tf_ssd_resnet34_args.json
        tf_resnet101_args.json
        tf_wide_deep_large_ds_args.json
        tf_bert_args.json
        tf_ssd_mobilenet_args.json
        tf_inceptionv4_args.json
        tf_wide_deep_args.json
        __init__.py
    - __init__.py
  - conftest.py
- CODEOWNERS
- .gitignore
- Jenkinsfile
- docs
  - language_translation
    - tensorflow
      - Tutorial.md
  - recommendation
    - tensorflow
      - Tutorial.md
  - image_recognition
    - quantization
      - Tutorial.md
    - tensorflow
      - Tutorial.md
  - README.md
  - general
    - tensorflow
      - LaunchBenchmark.md
      - BuildContainer.md
      - GeneralBestPractices.md
  - language_modeling
    - tensorflow
      - Tutorial.md
- tox.ini

# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Script to compute official BLEU score.

Source:
https://github.com/tensorflow/tensor2tensor/blob/master/tensor2tensor/utils/bleu_hook.py
"""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import re
import sys
import unicodedata

# pylint: disable=g-bad-import-order
import six
from absl import app as absl_app
from absl import flags
import tensorflow as tf
# pylint: enable=g-bad-import-order

from utils import metrics
from utils import tokenizer
from official.utils.flags import core as flags_core


class UnicodeRegex(object):
  """Compiled regexes that recognize Unicode punctuation and symbols.

  The character classes are built by enumerating code points and keeping
  those whose `unicodedata` category starts with "P" (punctuation) or
  "S" (symbol).

  Attributes:
    nondigit_punct_re: matches a non-digit character followed by a
      punctuation character (two groups).
    punct_nondigit_re: matches a punctuation character followed by a
      non-digit character (two groups).
    symbol_re: matches a single symbol character (one group).
  """

  def __init__(self):
    # NOTE(review): the characters are spliced into the bracket expressions
    # without escaping, so a backslash that precedes "]" in code point order
    # is parsed as an escape rather than as a member of the class. Left
    # unchanged here so tokenization results stay the same -- confirm whether
    # that is intended.
    punct_class = "[" + self.property_chars("P") + "]"
    symbol_class = "[" + self.property_chars("S") + "]"

    self.nondigit_punct_re = re.compile(r"([^\d])(" + punct_class + r")")
    self.punct_nondigit_re = re.compile(r"(" + punct_class + r")([^\d])")
    self.symbol_re = re.compile("(" + symbol_class + ")")

  def property_chars(self, prefix):
    """Collect every character whose Unicode category starts with `prefix`.

    Args:
      prefix: leading part of a `unicodedata.category` value, e.g. "P" or "S".

    Returns:
      A single string holding the matching characters for the code points in
      `range(sys.maxunicode)`, in increasing code point order.
    """
    matching = []
    for code_point in range(sys.maxunicode):
      char = six.unichr(code_point)
      if unicodedata.category(char).startswith(prefix):
        matching.append(char)
    return "".join(matching)


# Shared module-level instance: the regexes are compiled once, at import time
# (the constructor enumerates code points, see UnicodeRegex.property_chars),
# and are then reused by every bleu_tokenize call.
uregex = UnicodeRegex()


def bleu_tokenize(string):
  r"""Split a string into tokens the way the official BLEU script does.

  Reference implementation:
  https://github.com/moses-smt/mosesdecoder/blob/master/scripts/generic/mteval-v14.pl#L954-L983

  The input is expected to be a single line that needs no HTML entity
  de-escaping, so tokenization only separates punctuation and symbols.
  Punctuation that sits between two digits (e.g. a comma or dot used as a
  thousand/decimal separator) is left attached.

  Note that a number (e.g. a year) followed by a dot at the end of a sentence
  is NOT split: the dot stays with the number because
  `s/(\p{P})(\P{N})/ $1 $2/g` does not match that case (unless a space is
  appended to each sentence). This quirk already exists in the original
  mteval-v14.pl and is kept for consistency with it.

  Args:
    string: the input string

  Returns:
    a list of tokens
  """
  # Applied in this exact order; each pass pads the matched punctuation or
  # symbol with spaces so the final whitespace split isolates it.
  substitutions = (
      (uregex.nondigit_punct_re, r"\1 \2 "),
      (uregex.punct_nondigit_re, r" \1 \2"),
      (uregex.symbol_re, r" \1 "),
  )
  for pattern, replacement in substitutions:
    string = pattern.sub(replacement, string)
  return string.split()


def _read_unicode_lines(filename):
  """Read `filename` and return its stripped contents split into lines."""
  # The context manager closes the file handle as soon as it has been read,
  # instead of leaving it open until garbage collection.
  with tf.io.gfile.GFile(filename) as handle:
    contents = handle.read()
  return tokenizer.native_to_unicode(contents).strip().splitlines()


def bleu_wrapper(ref_filename, hyp_filename, case_sensitive=False):
  """Compute BLEU for two files (reference and hypothesis translation).

  Args:
    ref_filename: path of the file holding the reference translation.
    hyp_filename: path of the file holding the translation to score.
    case_sensitive: if False (the default), both files are lower-cased
      before tokenization.

  Returns:
    The result of `metrics.compute_bleu` on the tokenized lines, multiplied
    by 100.

  Raises:
    ValueError: if the two files do not contain the same number of lines
      after leading/trailing whitespace has been stripped from their contents.
  """
  ref_lines = _read_unicode_lines(ref_filename)
  hyp_lines = _read_unicode_lines(hyp_filename)

  if len(ref_lines) != len(hyp_lines):
    raise ValueError("Reference and translation files have different number of "
                     "lines. If training only a few steps (100-200), the "
                     "translation may be empty.")
  if not case_sensitive:
    ref_lines = [x.lower() for x in ref_lines]
    hyp_lines = [x.lower() for x in hyp_lines]
  ref_tokens = [bleu_tokenize(x) for x in ref_lines]
  hyp_tokens = [bleu_tokenize(x) for x in hyp_lines]
  return metrics.compute_bleu(ref_tokens, hyp_tokens) * 100


def main(unused_argv):
  """Log the BLEU variant(s) selected by the `bleu_variant` flag.

  Args:
    unused_argv: positional arguments handed over by `absl_app.run`; ignored.
  """
  variant = FLAGS.bleu_variant
  # (flag values that enable the report, case_sensitive argument, log template)
  reports = (
      (("both", "uncased"), False, "Case-insensitive results: %f"),
      (("both", "cased"), True, "Case-sensitive results: %f"),
  )
  for enabling_values, case_sensitive, template in reports:
    if variant in enabling_values:
      score = bleu_wrapper(FLAGS.reference, FLAGS.translation, case_sensitive)
      tf.compat.v1.logging.info(template % score)


def define_compute_bleu_flags():
  """Register the command-line flags used to compute the BLEU score.

  Defines the required string flags `translation` and `reference`, and the
  enum flag `bleu_variant` (short name `bv`, default "both").
  """
  # Both file flags have no default and are marked as required.
  required_file_flags = (
      ("translation", "File containing translated text."),
      ("reference", "File containing reference translation."),
  )
  for flag_name, description in required_file_flags:
    flags.DEFINE_string(
        name=flag_name, default=None,
        help=flags_core.help_wrap(description))
    flags.mark_flag_as_required(flag_name)

  variant_help = flags_core.help_wrap(
      "Specify one or more BLEU variants to calculate. Variants: \"cased\""
      ", \"uncased\", or \"both\".")
  flags.DEFINE_enum(
      name="bleu_variant", short_name="bv", default="both",
      enum_values=["both", "uncased", "cased"], case_sensitive=False,
      help=variant_help)


if __name__ == "__main__":
  # Show INFO-level messages, which is the level main() logs the scores at.
  tf.compat.v1.logging.set_verbosity(tf.compat.v1.logging.INFO)
  # Register the flags before handing control to absl_app.run.
  define_compute_bleu_flags()
  # main() reads FLAGS as a module-level name; it is only bound here, i.e.
  # when this file is executed as a script.
  FLAGS = flags.FLAGS
  absl_app.run(main)