python source code of video

fine-lm-master
- src
  - tensor2tensor
    - AUTHORS
    - tensor2tensor
      - serving
        export.py
        query.py
        __init__.py
        README.md
        serving_utils.py
      - utils
        video2gif.py
        avg_checkpoints.py
        expert_utils_test.py
        data_reader_test.py
        quantization.py
        trainer_lib_test.py
        modality.py
        cloud_tpu.py
        usr_dir.py
        get_rouge.py
        metrics_test.py
        learning_rate.py
        devices.py
        yellowfin_test.py
        metrics.py
        cloud_mlengine.py
        decoding.py
        adv_attack_utils.py
        rouge.py
        video_metrics.py
        diet_test.py
        flags.py
        adafactor.py
        get_ende_bleu.sh
        diet.py
        data_reader.py
        rouge_test.py
        registry.py
        restore_hook.py
        checkpoint_compatibility_test.py
        t2t_model.py
        yellowfin.py
        __init__.py
        multistep_optimizer_test.py
        registry_test.py
        bleu_hook_test.py
        optimize.py
        expert_utils.py
        compute_video_metrics.py
        metrics_hook_test.py
        beam_search.py
        beam_search_test.py
        trainer_lib.py
        get_cnndm_rouge.sh
        metrics_hook.py
        multistep_optimizer.py
        bleu_hook.py
      - layers
        discretization.py
        latent_layers.py
        discretization_test.py
        rev_block_test.py
        common_hparams.py
        modalities_test.py
        common_image_attention.py
        rev_block.py
        common_message_passing_attention.py
        common_layers.py
        common_attention.py
        common_attention_test.py
        common_image_attention_test.py
        __init__.py
        modalities.py
        common_layers_test.py
      - models
        revnet_test.py
        slicenet.py
        distillation.py
        transformer.py
        basic_test.py
        slicenet_test.py
        neural_gpu.py
        basic.py
        bytenet_test.py
        image_transformer_2d.py
        xception.py
        bytenet.py
        image_transformer_2d_test.py
        resnet.py
        lstm_test.py
        image_transformer.py
        lstm.py
        xception_test.py
        __init__.py
        README.md
        shake_shake.py
        transformer_test.py
        resnet_test.py
        research
        universal_transformer_util.py
        rl.py
        autoencoders.py
        transformer_moe.py
        cycle_gan.py
        autoencoders_test.py
        gene_expression.py
        multimodel.py
        attention_lm_moe.py
        transformer_vae_test.py
        gene_expression_test.py
        transformer_revnet.py
        adafactor_experiments.py
        transformer_nat.py
        transformer_revnet_test.py
        transformer_vae.py
        attention_lm.py
        universal_transformer_test.py
        next_frame.py
        lm_experiments.py
        transformer_symshard.py
        super_lm.py
        transformer_sketch.py
        multimodel_test.py
        __init__.py
        universal_transformer.py
        next_frame_test.py
        aligned.py
        neural_gpu_test.py
        revnet.py
        image_transformer_test.py
        vanilla_gan.py
      - rl
        model_rl_experiment_test.py
        rl_trainer_lib_test.py
        ppo.py
        model_rl_experiment_stochastic_test.py
        t2t_rl_trainer.py
        model_rl_experiment.py
        rl_trainer_lib.py
        __init__.py
        README.md
        collect.py
        envs
        py_func_batch_env.py
        batch_env_factory.py
        tf_atari_wrappers.py
        in_graph_batch_env.py
        batch_env.py
        __init__.py
        utils.py
        simulated_batch_env.py
      - test_data
        example_usr_dir
        my_submodule.py
        __init__.py
        requirements.txt
        vocab.ende.8192
        transformer_test_ckpt
        flags.txt
        model.ckpt-1.index
        hparams.json
        checkpoint
        model.ckpt-1.data-00000-of-00002
      - notebooks
        hello_t2t-rl.ipynb
        asr_transformer.ipynb
      - data_generators
        translate_test.py
        translate_enmk.py
        snli.py
        translate_enzh.py
        gym_utils.py
        twentybn.py
        mscoco_test.py
        speech_recognition.py
        audio_test.py
        gym_problems.py
        imdb.py
        gym_problems_specs.py
        timeseries_data_generator.py
        desc2code.py
        wsj_parsing.py
        tokenizer.py
        cipher.py
        gene_expression.py
        wikitext103.py
        mnist.py
        celeba.py
        librispeech.py
        translate_ende.py
        timeseries.py
        gene_expression_test.py
        ptb.py
        problem_hparams.py
        dna_encoder_test.py
        translate_enid.py
        text_encoder_test.py
        lm1b.py
        generator_utils.py
        dna_encoder.py
        cnn_dailymail.py
        wnli.py
        fsns.py
        mscoco.py
        celeba_test.py
        imagenet_test.py
        babi_qa.py
        desc2code_test.py
        text_encoder_build_subword.py
        algorithmic_test.py
        tokenizer_test.py
        video_generated.py
        program_search.py
        image_utils.py
        audio.py
        ice_parsing.py
        image_lsun.py
        algorithmic_math.py
        style_transfer.py
        test_data
        vocab-1.txt
        vocab-2.txt
        corpus-1.txt
        corpus-2.txt
        multi_problem.py
        algorithmic.py
        rte.py
        video_utils.py
        ocr.py
        problem.py
        subject_verb_agreement.py
        timeseries_data_generator_test.py
        bair_robot_pushing.py
        sst_binary.py
        image_utils_test.py
        gym_problems_test.py
        text_problems.py
        translate_enet.py
        generator_utils_test.py
        gh_function_docstring_encoder.py
        __init__.py
        text_problems_test.py
        common_voice.py
        README.md
        google_robot_pushing.py
        timeseries_test.py
        text_encoder.py
        program_search_test.py
        wikisum
        delete_instances.sh
        validate_data.py
        wikisum.py
        utils_test.py
        parallel_launch.py
        get_references_web_single_group.py
        test_data
        para_good1.txt
        para_bad1.txt
        get_references_commoncrawl.py
        get_references_web.py
        produce_examples.py
        __init__.py
        README.md
        utils.py
        generate_vocab.py
        translate_envi.py
        multinli.py
        all_problems.py
        algorithmic_math_test.py
        translate.py
        lm1b_imdb.py
        inspect_tfrecord.py
        cola.py
        imagenet.py
        cifar.py
        lambada.py
        wiki.py
        qnli.py
        translate_enfr.py
        quora_qpairs.py
        translate_encs.py
        squad.py
      - __init__.py
      - visualization
        visualization_test.py
        attention.py
        TransformerVisualization.ipynb
        attention.js
        __init__.py
        visualization.py
      - bin
        t2t-trainer
        t2t_trainer.py
        t2t_translate_all.py
        t2t-translate-all
        t2t_datagen.py
        t2t-decoder
        t2t-make-tf-configs
        t2t-avg-all
        make_tf_configs.py
        t2t_avg_all.py
        t2t_trainer_test.py
        t2t_distill.py
        t2t_attack.py
        t2t-exporter
        t2t-bleu
        __init__.py
        t2t-insights-server
        t2t_bleu.py
        t2t_decoder.py
        t2t-datagen
        t2t-query-server
      - problems_test.py
      - problems.py
      - insights
        query_processor.py
        graph.py
        insight_configuration.proto
        server.py
        polymer
        explore_view
        explore-view.js
        explore-view.html
        query_card
        query-card.js
        query-card.html
        insights_app
        insights-app.html
        insights-app.js
        language_selector
        language-selector-content.html
        language-selector-content.js
        language-selector.html
        language-selector.js
        attention_visualization
        attention-visualization.js
        attention-visualization.html
        processing_visualization
        processing-visualization.js
        processing-visualization.html
        bower.json
        translation_result
        translation-result.html
        translation-result.js
        common-types.js
        graph_visualization
        graph-visualization.html
        graph-visualization.js
        .bowerrc
        tensor2tensor.html
        index.html
        __init__.py
        README.md
        transformer_model.py
    - LICENSE
    - CONTRIBUTING.md
    - ISSUE_TEMPLATE.md
    - setup.py
    - .travis.yml
    - README.md
    - pylintrc
    - .gitignore
    - docs
      - new_model.md
      - walkthrough.md
      - cloud_mlengine.md
      - index.md
      - overview.md
      - tutorials
        asr_with_transformer.md
      - distributed_training.md
      - new_problem.md
      - cloud_tpu.md
  - README.md
  - scripts
    - opennmt-unmt
      - train.sh
      - train.py
      - inference.py
    - en-lm.sh
    - gcloud-ctpu-startup.sh
- LICENSE
- imgs
- presentations
  - intro
    - xaringan-themer.css
    - libs
      - dt-core
        js
        jquery.dataTables.min.js
        css
        jquery.dataTables.min.css
        jquery.dataTables.extra.css
      - jquery
        jquery.min.js
        LICENSE.txt
      - crosstalk
        js
        crosstalk.min.js.map
        crosstalk.js.map
        crosstalk.min.js
        crosstalk.js
        css
        crosstalk.css
      - datatables-css
        datatables-crosstalk.css
      - datatables-binding
        datatables.js
      - htmlwidgets
        htmlwidgets.js
    - imgs
      - stupendousman.jpeg
    - intro-slides_files
      - figure-html
        cars-1.svg
    - index.html
    - intro-slides.html
    - index.Rmd
  - lit
    - delayed-impact
      - xaringan-themer.css
      - imgs
      - icml.html
      - icml.Rmd
  - progress
    - xaringan-themer.css
    - libs
      - dt-core
        js
        jquery.dataTables.min.js
        css
        jquery.dataTables.min.css
        jquery.dataTables.extra.css
      - jquery
        jquery.min.js
        LICENSE.txt
      - crosstalk
        js
        crosstalk.min.js.map
        crosstalk.js.map
        crosstalk.min.js
        crosstalk.js
        css
        crosstalk.css
      - datatables-css
        datatables-crosstalk.css
      - datatables-binding
        datatables.js
      - htmlwidgets
        htmlwidgets.js
    - imgs
      - stupendousman.jpeg
    - index.html
    - index.Rmd
- README.md
- .gitignore
- docs
  - xaringan-themer.css
  - libs
    - dt-core
      - js
        jquery.dataTables.min.js
      - css
        jquery.dataTables.min.css
        jquery.dataTables.extra.css
    - jquery
      - jquery.min.js
      - LICENSE.txt
    - crosstalk
      - js
        crosstalk.min.js.map
        crosstalk.js.map
        crosstalk.min.js
        crosstalk.js
      - css
        crosstalk.css
    - datatables-css
      - datatables-crosstalk.css
    - datatables-binding
      - datatables.js
    - htmlwidgets
      - htmlwidgets.js
  - imgs
    - stupendousman.jpeg
  - index_files
    - figure-html
  - index.html
  - index.Rmd
- fine-lm.Rproj

# coding=utf-8
# Copyright 2018 The Tensor2Tensor Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Computes the metrics for video prediction and generation."""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import os
import numpy as np
import six
import tensorflow as tf


def load_image_map_function(filename, frame_shape):
  """Reads a PNG file and returns it as a frame with a fixed static shape.

  Args:
    filename: name of the PNG file to read.
    frame_shape: shape assigned to the returned frame; its first two entries
      are used as the resize target.

  Returns:
    The decoded image, resized to `frame_shape[0:2]` and with its static shape
    set to `frame_shape`.
  """
  png_bytes = tf.read_file(filename)
  decoded = tf.image.decode_png(png_bytes)
  target_size = frame_shape[0:2]
  frame = tf.image.resize_images(decoded, target_size)
  frame.set_shape(frame_shape)
  return frame


def load_videos(template, video_length, frame_shape):
  """Builds a dataset of videos from the image files matching a glob.

  The matching files are sorted by name, loaded one by one and grouped into
  batches of `video_length` frames; a trailing incomplete batch is dropped.

  Args:
    template: glob pattern used to list the image files.
    video_length: number of frames batched together into one video.
    frame_shape: shape of each frame.

  Returns:
    dataset: the tf dataset whose elements are batches of `video_length`
      frames.
    dataset_len: number of image files matched by `template`.

  Raises:
    ValueError: if no files found.
  """
  matched_files = sorted(tf.gfile.Glob(template))
  if not matched_files:
    raise ValueError("no files found.")
  num_files = len(matched_files)

  def _load_frame(filename):
    return load_image_map_function(filename, frame_shape)

  frame_paths = tf.data.Dataset.from_tensor_slices(tf.constant(matched_files))
  to_videos = tf.contrib.data.map_and_batch(
      _load_frame, video_length, drop_remainder=True)
  return frame_paths.apply(to_videos), num_files


def file_pattern(output_dir, problem_name, prefix):
  """Returns the glob `<output_dir>/<problem_name>_<prefix>*.png`."""
  basename_glob = "{}_{}*.png".format(problem_name, prefix)
  return os.path.join(output_dir, basename_glob)


def get_target_and_output_filepatterns(output_dir, problem_name):
  """Returns the glob patterns of the saved output and target frames.

  Note that, despite the function name, the returned tuple is ordered
  (outputs pattern, targets pattern).

  Args:
    output_dir: directory containing the saved frames.
    problem_name: prefix of the saved frame file names.

  Returns:
    A tuple (outputs pattern, targets pattern).
  """
  outputs_pattern = file_pattern(output_dir, problem_name, "outputs")
  targets_pattern = file_pattern(output_dir, problem_name, "targets")
  return outputs_pattern, targets_pattern


def get_zipped_dataset_from_png_files(
    output_files, target_files, video_length, frame_shape):
  """Creates a zipped (outputs, targets) dataset from PNG frames on disk.

  Args:
    output_files: glob pattern matching the predicted frames.
    target_files: glob pattern matching the target frames.
    video_length: number of frames per video.
    frame_shape: shape of each frame.

  Returns:
    iterator: one-shot iterator yielding (output video, target video) pairs.
    feed_dict: always None; a one-shot iterator needs no feed dict.
    num_videos: number of complete video pairs the iterator can yield.

  Raises:
    ValueError: if either pattern matches no files (raised by load_videos).
  """
  outputs, num_output_frames = load_videos(
      output_files, video_length, frame_shape)
  targets, num_target_frames = load_videos(
      target_files, video_length, frame_shape)
  zipped_dataset = tf.data.Dataset.zip((outputs, targets))
  # The zipped dataset ends with the shorter of its two inputs, so the number
  # of pairs is bounded by the smaller frame count. Using only the target
  # count would make consumers iterate past the end when outputs are missing.
  num_videos = min(num_output_frames, num_target_frames) // video_length
  iterator = zipped_dataset.make_one_shot_iterator()
  return iterator, None, num_videos

def save_results(results, output_dir, problem_name):
  """Saves each array of `results` to `<output_dir>/<problem_name>_<name>.npy`.

  Args:
    results: dictionary mapping a name to the array to save.
    output_dir: directory the .npy files are written to.
    problem_name: prefix of the written file names.
  """
  for metric_name, values in six.iteritems(results):
    npy_path = os.path.join(
        output_dir, "{}_{}.npy".format(problem_name, metric_name))
    with tf.gfile.Open(npy_path, "wb") as npy_file:
      np.save(npy_file, values)


def compute_metrics(output_video, target_video):
  """Computes PSNR and SSIM between an output video and a target video.

  Both inputs are cast to float and compared with a maximum pixel value
  of 255.

  Args:
    output_video: the predicted video.
    target_video: the ground-truth video.

  Returns:
    Dictionary with the "PSNR" and "SSIM" tensors.
  """
  max_pixel_value = 255.0
  predicted = tf.to_float(output_video)
  expected = tf.to_float(target_video)
  return {
      "PSNR": tf.image.psnr(predicted, expected, max_pixel_value),
      "SSIM": tf.image.ssim(predicted, expected, max_pixel_value),
  }


def stack_data_given_key(predictions, key):
  """Stacks the `key` entry of every prediction along a new leading axis.

  Args:
    predictions: sequence of dictionaries that all contain `key`.
    key: the dictionary key whose values are stacked.

  Returns:
    A numpy array whose first dimension indexes the predictions.
  """
  return np.stack([prediction[key] for prediction in predictions], axis=0)


def get_zipped_dataset_from_predictions(predictions):
  """Creates dataset from in-memory predictions.

  Args:
    predictions: sequence of dictionaries, each holding the arrays stored
      under the "targets" and "outputs" keys.

  Returns:
    iterator: initializable iterator yielding (output, target) pairs.
    feed_dict: feed dict that must be passed when initializing the iterator.
    num_videos: number of predictions, i.e. number of pairs in the dataset.
  """
  targets = stack_data_given_key(predictions, "targets")
  outputs = stack_data_given_key(predictions, "outputs")
  num_videos = len(targets)

  # Placeholders keep the (possibly large) arrays out of the graph definition.
  targets_placeholder = tf.placeholder(targets.dtype, targets.shape)
  outputs_placeholder = tf.placeholder(outputs.dtype, outputs.shape)
  # Yield (outputs, targets): this is the order produced by
  # get_zipped_dataset_from_png_files and the order in which
  # compute_one_decoding_video_metrics unpacks each element.
  dataset = tf.data.Dataset.from_tensor_slices(
      (outputs_placeholder, targets_placeholder))
  iterator = dataset.make_initializable_iterator()
  feed_dict = {targets_placeholder: targets,
               outputs_placeholder: outputs}

  return iterator, feed_dict, num_videos


def compute_one_decoding_video_metrics(iterator, feed_dict, num_videos):
  """Averages every video metric over the videos of a single decoding.

  Args:
    iterator: dataset iterator yielding (output, target) pairs.
    feed_dict: feed dict used when running the iterator initializer.
    num_videos: number of videos, i.e. how many update steps are run.

  Returns:
    Dictionary mapping each metric name to its mean over the videos.
  """
  predicted, ground_truth = iterator.get_next()

  per_video_metrics = compute_metrics(predicted, ground_truth)
  names, tensors = zip(*six.iteritems(per_video_metrics))
  running_mean, accumulate_op = tf.metrics.mean_tensor(tensors)

  with tf.Session() as session:
    # The streaming mean keeps its state in local variables.
    session.run(tf.local_variables_initializer())
    iterator_init = iterator._initializer  # pylint: disable=protected-access
    if iterator_init is not None:
      session.run(iterator_init, feed_dict=feed_dict)

    # Each run consumes one dataset element and folds it into the mean.
    for video_index in range(num_videos):
      print("Computing video: %d" % video_index)
      session.run(accumulate_op)
    mean_values = session.run(running_mean)

  return dict(zip(names, mean_values))


def compute_all_metrics_statistics(all_results):
  """Computes mean, std, min and max of each metric across decodings.

  Args:
    all_results: non-empty list of dictionaries, one per decoding, that share
      the keys of the first dictionary.

  Returns:
    Dictionary with the entries `<key>_MEAN`, `<key>_STD`, `<key>_MIN` and
    `<key>_MAX` for every key, each reduced over the decodings (axis 0).
  """
  reducers = (
      ("_MEAN", np.mean),
      ("_STD", np.std),
      ("_MIN", np.min),
      ("_MAX", np.max),
  )
  summary = {}
  for metric_name in all_results[0].keys():
    # One row per decoding.
    stacked = np.vstack([decoding[metric_name] for decoding in all_results])
    for suffix, reduce_fn in reducers:
      summary[metric_name + suffix] = reduce_fn(stacked, axis=0)
  return summary


def compute_video_metrics_from_predictions(predictions):
  """Computes metric statistics across several in-memory decodings.

  Args:
    predictions: list of decodings; each decoding is the list of prediction
      dictionaries passed to get_zipped_dataset_from_predictions.

  Returns:
    Dictionary with the statistics of each metric across the decodings.
  """
  per_decoding_results = [
      compute_one_decoding_video_metrics(
          *get_zipped_dataset_from_predictions(decoding))
      for decoding in predictions]
  return compute_all_metrics_statistics(per_decoding_results)


def compute_video_metrics_from_png_files(
    output_dirs, problem_name, video_length, frame_shape):
  """Computes the metrics of every decoding and their overall statistics.

  This function assumes that all the predicted and target frames
  have been saved on the disk and that sorting them by name yields
  consecutive frames in order.

  Args:
    output_dirs: directories with the saved frames, one per decoding.
    problem_name: prefix of the saved frames usually name of the problem.
    video_length: length of the videos.
    frame_shape: shape of each frame in HxWxC format.

  Returns:
    statistics: dictionary with the statistics of each metric across the
      decodings.
    all_results: list with the averaged metrics dictionary of each decoding,
      in the order of `output_dirs`.
  """
  per_decoding_results = []
  for decode_dir in output_dirs:
    outputs_glob, targets_glob = get_target_and_output_filepatterns(
        decode_dir, problem_name)
    iterator, feed_dict, num_videos = get_zipped_dataset_from_png_files(
        outputs_glob, targets_glob, video_length, frame_shape)
    per_decoding_results.append(
        compute_one_decoding_video_metrics(iterator, feed_dict, num_videos))
  return (compute_all_metrics_statistics(per_decoding_results),
          per_decoding_results)


def compute_and_save_video_metrics(
    output_dirs, problem_name, video_length, frame_shape):
  """Computes and saves the video metrics.

  The metrics of each decoding are saved into its own directory, and the
  statistics across all decodings are saved into a "decode" directory next to
  the first output directory.

  Args:
    output_dirs: directories with the saved frames, one per decoding.
    problem_name: prefix of the saved frames and of the written .npy files.
    video_length: length of the videos.
    frame_shape: shape of each frame.
  """
  statistics, all_results = compute_video_metrics_from_png_files(
      output_dirs, problem_name, video_length, frame_shape)
  for results, output_dir in zip(all_results, output_dirs):
    save_results(results, output_dir, problem_name)

  parent_dir = os.path.join(output_dirs[0], os.pardir)
  final_dir = os.path.join(parent_dir, "decode")
  # Create the directory the statistics are written to. Creating only
  # parent_dir leaves "decode" missing, so the save fails on filesystems
  # that require the directory to exist.
  tf.gfile.MakeDirs(final_dir)

  save_results(statistics, final_dir, problem_name)