python source code of export_kitti

lingvo-master
- codelabs
  - introduction.ipynb
- pip_package
  - build.Dockerfile
  - setup.py
  - build_pip_pkg.sh
  - README.md
  - build.sh
  - MANIFEST.in
- third_party
  - BUILD
  - toolchains
    - preconfig
      - ubuntu16.04
        gcc7_manylinux2010-nvcc-cuda10.0
        BUILD
        clang
        bin
        crosstool_wrapper_driver_is_not_gcc
        windows
        msvc_wrapper_for_nvcc.py
        cc_toolchain_config.bzl
  - auditwheel.sh
  - __init__.py
  - icu
    - BUILD
    - BUILD.system
    - udata.patch
    - BUILD.bazel
    - LICENSE
    - data
      - icu_conversion_data.c.gz.aj
      - icu_conversion_data.c.gz.aa
      - BUILD.bazel
      - icu_conversion_data.c.gz.ab
      - icu_conversion_data.c.gz.ac
      - LICENSE
      - icu_conversion_data.c.gz.ai
      - icu_conversion_data.c.gz.ad
      - icu_conversion_data.c.gz.ah
      - icu_conversion_data.c.gz.ag
      - icu_conversion_data.c.gz.af
      - icu_conversion_data.c.gz.ae
  - repo.bzl
- lingvo
  - BUILD
  - ipython_kernel.py
  - base_trial.py
  - model_registry_test.py
  - executor.py
  - model_import_test.py
  - models_test_helper.py
  - models_test.py
  - datasets.py
  - tasks
    - BUILD
    - asr
      - model_test_input_generator.py
      - frontend.py
      - BUILD
      - wpm_16k_librispeech.vocab
      - input_generator_test.py
      - fusion.py
      - decoder.py
      - model_test.py
      - decoder_test.py
      - encoder.py
      - decoder_utils_test.py
      - model.py
      - frontend_test.py
      - params
        BUILD
        librispeech.py
        params.py
      - decoder_utils.py
      - __init__.py
      - tools
        BUILD
        librispeech_get_data.sh
        librispeech_lib.sh
        librispeech.02.download_devtest.sh
        simple_wer_v2_test.py
        simple_wer_v2.py
        __init__.py
        simple_wer_test.py
        librispeech.04.parameterize_devtest.sh
        librispeech.03.parameterize_train.sh
        simple_wer.py
        librispeech.01.download_train.sh
      - encoder_test.py
      - input_generator.py
      - contextualizer_base.py
    - car
      - BUILD
      - point_detector.py
      - calibration_processing_test.py
      - summary_test.py
      - car_lib.py
      - kitti_decoder.py
      - input_extractor.py
      - ap_metric.py
      - base_extractor.py
      - input_preprocessors.py
      - pillars.py
      - kitti_metadata.py
      - breakdown_metric_test.py
      - detection_3d_lib.py
      - detection_3d_metrics.py
      - testdata
        BUILD
        kitti_raw_label_testdata.txt
        kitti_raw_calib_testdata.txt
      - car_layers_test.py
      - summary.py
      - detection_3d_lib_test.py
      - geometry_test.py
      - pointnet_test.py
      - transform_util_test.py
      - base_decoder.py
      - geometry.py
      - builder_lib_test.py
      - transform_util.py
      - lr_util_test.py
      - lr_util.py
      - detection_decoder.py
      - kitti_input_generator.py
      - pointnet.py
      - car_layers.py
      - kitti_ap_metric.py
      - evaluation_metadata.py
      - params
        BUILD
        kitti.py
        params.py
        waymo.py
      - waymo
        BUILD
        waymo_metadata.py
        waymo_open_input_generator.py
        waymo_ap_metric_test.py
        waymo_ap_metric.py
        waymo_decoder.py
        export_to_submission_format.py
        __init__.py
        tools
        BUILD
        generate_waymo_tf.py
        waymo_proto_to_tfe.py
        __init__.py
        waymo_open_input_generator_test.py
      - __init__.py
      - detection_3d_metrics_test.py
      - README.md
      - ops
        BUILD
        ps_utils.h
        image_metrics.h
        sampling_ops_test.py
        nms_3d_op_test.py
        ps_utils_test.cc
        box_util.h
        box_util.cc
        sampling_ops.cc
        nms_3d_op.cc
        image_metrics.cc
        point_grid_op_test.py
        average_precision_3d_op.cc
        car_ops.cc
        ps_utils.cc
        point_grid_op.cc
        __init__.py
        average_precision_3d_op_test.py
        pairwise_iou_op.cc
      - tools
        BUILD
        export_kitti_detection.py
        kitti_exporter.py
        kitti_data_test.py
        kitti_data.py
        create_kitti_crop_dataset.py
        __init__.py
        compare_params_main.py
      - input_extractor_test.py
      - detection_decoder_test.py
      - calibration_processing.py
      - breakdown_metric.py
      - car_lib_test.py
      - builder_lib.py
      - starnet.py
    - lm
      - layers_test.py
      - BUILD
      - input_generator_test.py
      - testdata
        BUILD
        lm1b_100.txt
        small_word_vocab.txt
      - model_test.py
      - model.py
      - layers.py
      - params
        BUILD
        params.py
        one_billion_wds.py
      - __init__.py
      - tools
        BUILD
        download_lm1b.py
        __init__.py
      - input_generator.py
    - punctuator
      - BUILD
      - input_generator_test.py
      - model_test.py
      - model.py
      - params
        BUILD
        codelab.py
        params.py
        brown_corpus_wpm.16000.vocab
      - __init__.py
      - tools
        BUILD
        download_brown_corpus.py
        __init__.py
      - input_generator.py
    - mt
      - layers_test.py
      - BUILD
      - data_augmenter.py
      - base_config.py
      - input_generator_test.py
      - decoder.py
      - data_augmenter_test.py
      - testdata
        BUILD
        en_fr.tfrecord
        wmt14_ende_wpm_32k_test.tfrecord
        en_de.text
      - model_test.py
      - decoder_test.py
      - encoder.py
      - model.py
      - layers.py
      - wpm-ende-2k.voc
      - params
        BUILD
        wmtm16_en_de.py
        params.py
        wmt14_en_de.py
      - __init__.py
      - README.md
      - tools
        wmt14.05.unpack_devtest.sh
        wmt14.07.tokenize_devtest.sh
        wmt14_get_data.sh
        wmt14.03.download_devtest.sh
        wmtm16_get_data.sh
        wmt14.02.download_train.sh
        wmtm16.02.download_data.sh
        wmtm16.04.tokenize_data.sh
        wmtm16.03.unpack_data.sh
        wmtm16_lib.sh
        wmt14.09.wpm_encode_devtest.sh
        wmt14_lib.sh
        __init__.py
        wmt14.04.unpack_train.sh
        wmtm16.01.download_moses_scripts.sh
        wmt14.01.download_moses_scripts.sh
        wmt14.08.wpm_encode_train.sh
        wmt14.06.tokenize_train.sh
        wmtm16.05.wpm_encode_data.sh
      - text_input.proto
      - encoder_test.py
      - input_generator.py
    - __init__.py
    - image
      - BUILD
      - input_generator_test.py
      - params
        BUILD
        mnist.py
        params.py
      - __init__.py
      - classifier.py
      - classifier_test.py
      - input_generator.py
  - model_registry.py
  - __init__.py
  - compat_test.py
  - base_runner.py
  - tools
    - BUILD
    - generate_proto_def.cc
    - compare_params_test.py
    - audio_lib_test.py
    - create_asr_features.py
    - wpm_encode_file.py
    - compare_params.py
    - beam_utils_test.py
    - print_tf_records.py
    - compute_stats.py
    - keras2ckpt.py
    - testdata
      - BUILD
      - gan_or_vae.16k.wav
      - gan_or_vae.flac
      - gan_or_vae.wav
    - gke_launch.py
    - generate_tf_dot_protos.sh
    - bpe_word_tokenizer.py
    - __init__.py
    - beam_utils.py
    - audio_lib.py
  - core
    - predictor.py
    - scorers_test.py
    - checkpointer.py
    - layers_test.py
    - gpipe_test.py
    - conv_layers_with_time_padding_test.py
    - trainer_test_utils.py
    - BUILD
    - symbolic_test.py
    - matrix_functions.py
    - optimizer.py
    - layers_with_gpipe.py
    - target_sequence_sampler.py
    - learner_test.py
    - base_layer.py
    - insertion.py
    - recurrent_gpu_test.py
    - base_model_params.py
    - early_stop.py
    - cluster_factory.py
    - test_utils.py
    - predictor_test.py
    - builder_layers.py
    - builder_layers_test.py
    - tshape.py
    - generic_input.py
    - hyperparams.proto
    - adagraft.py
    - spectrum_augmenter_on_device_test.py
    - reversible_layers_test.py
    - rnn_layers_test.py
    - inference_graph_exporter.py
    - target_sequence_sampler_test.py
    - quant_utils_test.py
    - inference_graph.proto
    - adagraft_test.py
    - metrics_test.py
    - inspect_utils.py
    - relative_atten_util.py
    - py_utils.py
    - testdata
      - BUILD
      - lenet_test_model.index
    - metrics.py
    - attention_test.py
    - scorers.py
    - plot_test.py
    - beam_search_helper.py
    - inspect_utils_test.py
    - layers_with_attention_test.py
    - datasource.py
    - checkpointer_test.py
    - decoder_lib.py
    - input_generator_helper.py
    - base_model.py
    - base_model_params_test.py
    - inference_graph_exporter_test.py
    - base_decoder.py
    - self_attention_layer.py
    - self_attention_layer_test.py
    - attention.py
    - lstm_frnn_layer.py
    - rnn_layers.py
    - cluster_test.py
    - symbolic.py
    - quant_utils.py
    - rnn_cell.py
    - wpm_tokenizer_test.py
    - bfloat16_variables.py
    - batch_major_attention.py
    - test_utils_test.py
    - input_generator_helper_test.py
    - summary_utils.py
    - plot.py
    - wpm_encoder.py
    - step.py
    - recurrent.py
    - base_model_test.py
    - relative_atten_util_test.py
    - ml_perf_log.py
    - task_scheduler_test.py
    - sendrecv_test.py
    - build_data.py
    - ml_perf_bleu_metric.py
    - test_helper.py
    - constants.py
    - ml_perf_log_test.py
    - layers.py
    - matrix_functions_test.py
    - hyperparams.py
    - spectrum_augmenter.py
    - conv_layers_builder.py
    - multitask_model.py
    - base_input_generator_test.py
    - builder_test.py
    - step_test.py
    - distributed_shampoo_test.py
    - lstm_frnn_layer_test.py
    - gpipe.py
    - spectrum_augmenter_on_device.py
    - __init__.py
    - steps
      - BUILD
      - embedding_steps.py
      - attention_steps.py
      - rnn_steps.py
      - rnn_steps_test.py
      - __init__.py
      - attention_steps_test.py
      - embedding_steps_test.py
    - layers_with_gpipe_test.py
    - base_input_generator.py
    - ml_perf_tokenizer.py
    - retry_test.py
    - layers_with_attention.py
    - sendrecv.py
    - cluster.py
    - ops
      - mass_op_test.py
      - chain_record_yielder.cc
      - weighted_mix_record_yielder_test.cc
      - hyps.proto
      - weighted_mix_record_yielder.h
      - mass_op.cc
      - BUILD
      - ascii_tokenizer.cc
      - beam_search_step_op_test.py
      - versioned_file_set.proto
      - assert_kernels.cc
      - preconditioner_op_kernels.cc
      - ascii_tokenizer.h
      - record_debug.cc
      - chain_record_yielder.h
      - generic_input_op_kernels.cc
      - record_batcher.h
      - weighted_mix_record_yielder.cc
      - static_map_op_test.py
      - functional_ops_test.py
      - input_common.cc
      - preconditioner_captain.h
      - tokenizer_op_headers.h
      - testdata
        BUILD
        bpe_words.vocab
        bpe_codes.vocab
        wmt
        history.txt
        test_vocab.txt
        test_ngrams.txt
        history_bleu.txt
        events.out.tfevents.test
      - ml_perf_subword_op.cc
      - best_step_op_kernels.cc
      - simple_vocab.cc
      - functional_ops_kernels.cc
      - static_map_op.cc
      - simple_vocab.h
      - yielder_test_helper.h
      - simple_vocab_test.py
      - best_step_op_test.py
      - record_yielder.cc
      - record_yielder_test.cc
      - text_packing.h
      - preconditioner_captain.cc
      - record_batcher.cc
      - ml_perf_subword_op.h
      - record_yielder.h
      - tokenizer_ops_kernels.cc
      - chain_record_yielder_test.cc
      - text_packing_test.cc
      - input_common.h
      - __init__.py
      - x_ops_helper.h
      - rope.h
      - record_batcher_test.cc
      - pack_ops.cc
      - tokenizer_ops_test.py
      - pack_ops_test.py
      - random_ops_test.py
      - sequential_record_yielder.cc
      - beam_search_step_op_kernels.cc
      - assert_ops_test.py
      - beam_search_step_op_top_k_test.cc
      - preconditioner_op_kernels_test.py
      - yielder_test_helper.cc
      - beam_search_step_op_kernels.h
      - sequential_record_yielder.h
      - text_packing.cc
      - record.proto
      - x_ops.cc
      - random_ops_kernels.cc
    - conv_layers_builder_test.py
    - hyperparams_test.py
    - reversible_layers.py
    - saver_test.py
    - tshape_test.py
    - retry.py
    - conv_layers_with_time_padding.py
    - base_layer_test.py
    - batch_major_attention_test.py
    - schedule_test.py
    - task_scheduler.py
    - beam_search_helper_test.py
    - ml_perf_bleu_metric_test.py
    - summary_utils_test.py
    - generic_input_test.py
    - learner.py
    - predictor_runner_base.py
    - builder.py
    - optimizer_test.py
    - bfloat16_variables_test.py
    - datasource_test.py
    - py_utils_test.py
    - distributed_shampoo.py
    - spectrum_augmenter_test.py
    - bn_layers.py
    - schedule.py
    - multitask_model_test.py
    - egdd.py
    - recurrent_test.py
    - saver.py
    - model_helper.py
    - program.py
    - early_stop_test.py
    - egdd_test.py
    - insertion_test.py
    - rnn_cell_test.py
    - ema_test.py
    - test_trainer_utils.py
    - wpm_encoder_test.py
    - computation_cost.py
    - tokenizers.py
  - lingvo.bzl
  - model_imports.py
  - trainer_test.py
  - trainer.py
  - compat.py
  - repo.bzl
- LICENSE
- CONTRIBUTING.md
- .bazelrc
- docker
  - run_distributed.py
  - dev.dockerfile
  - lib.dockerfile
  - __init__.py
- tf_env_collect.sh
- publications.bib
- README.md
- WORKSPACE
- .gitignore
- docs
  - generate_apidoc.sh
  - apidoc
    - index.rst
    - conf.py
- update_publications.sh
- PUBLICATIONS.md

# Lint as: python2, python3
# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
r"""Read saved Decoder's outputs and convert to KITTI text format.

First, obtain a KITTI camera calibration file.

To export all detections from a single model:

python export_kitti_detection.py \
--decoder_path=/path/to/decoder_out_000103000 \
--calib_file=/tmp/kitti_test_calibs.npz \
--output_dir=/tmp/my-kitti-export-directory \
--logtostderr

--- OR ---

Export combined detections selected from multiple models:

python export_kitti_detection.py \
--car_decoder_path=/path/to/car_decoder_out \
--ped_decoder_path=/path/to/ped_decoder_out \
--cyc_decoder_path=/path/to/cyc_decoder_out \
--calib_file=/tmp/kitti_test_calibs.npz \
--output_dir=/tmp/my-kitti-export-directory \
--logtostderr
"""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

from absl import flags
from lingvo import compat as tf
from lingvo.core.ops import record_pb2
from lingvo.tasks.car import kitti_metadata
from lingvo.tasks.car.tools import kitti_data
import numpy as np
from six.moves import zip


FLAGS = flags.FLAGS
# Decoder inputs: supply either --decoder_path alone, or all three of the
# per-class paths (--car_decoder_path, --ped_decoder_path, --cyc_decoder_path).
# The combination is validated in main().
flags.DEFINE_string(
    "decoder_path", None, "Paths to decoder file containing output "
    "of decoder for everything. Either supply this argument or individual "
    "decoder paths for cars, pedestrians and cyclists.")
flags.DEFINE_string(
    "car_decoder_path", None,
    "Paths to decoder file containing output of decoder for cars. "
    "Either supply plus cyclists and pedestrians or supply one "
    "decoder for all labels.")
flags.DEFINE_string(
    "ped_decoder_path", None,
    "Paths to decoder file containing output of decoder for "
    "pedestrians. Either supply plus cyclists and cars or "
    "supply one decoder for all labels.")
flags.DEFINE_string(
    "cyc_decoder_path", None,
    "Paths to decoder file containing output of decoder for cyclist. "
    "Either supply plus cars and pedestrians or supply one "
    "decoder for all labels.")
# Calibration input and export destination.
flags.DEFINE_string(
    "calib_file", None,
    "Path to a npz file that contains all calibration matrices.")
flags.DEFINE_string("output_dir", None, "Place to write detections.")
# Detections whose score is below this value are dropped at export time.
flags.DEFINE_float("score_threshold", 0, "Ignore detections with lower score.")


def LoadCalibData(fname):
  """Load and parse per-scene calibration data from an NPZ file.

  Args:
    fname: a path or an open binary file object; passed straight to `np.load`.

  Returns:
    A dict mapping each entry of the archive's "scene_id" array to the value
    returned by `kitti_data.ParseCalibrationDict` for that scene.
  """
  calib_keys = ("P0", "P1", "P2", "P3", "R0_rect", "Tr_velo_to_cam",
                "Tr_imu_to_velo")
  # If this throws an error, make sure the npz file was generated from
  # the same version of python as this binary.
  with np.load(fname) as npz:
    # An NpzFile reads a member array from the archive on every `npz[key]`
    # access, so fetch each array exactly once here instead of once per scene.
    scene_ids = npz["scene_id"]
    calib_arrays = {key: npz[key] for key in calib_keys}

  scene_to_calib = {}
  for idx, scene_id in enumerate(scene_ids):
    tf.logging.info("Processing %s", scene_id)
    # Slice out this scene's row from every calibration array.
    raw_calib = {key: values[idx] for key, values in calib_arrays.items()}
    scene_to_calib[scene_id] = kitti_data.ParseCalibrationDict(raw_calib)
  return scene_to_calib


def ExtractNpContent(np_dict, calib):
  """Unpack saved decoder arrays and convert 3D boxes to KITTI camera form.

  Args:
    np_dict: a dict of numpy arrays with at least the keys "bboxes", "scores",
      "class_ids" and "bboxes_2d".
    calib: a parsed calibration dictionary, as accepted by
      `kitti_data.VeloToCameraTransformation`.

  Returns:
    A tuple of 6 ndarrays, where N is the number of entries in "bboxes":

    - location_cam: [N, 3]. [x, y, z] in camera0 coordinate.
    - dimension_cam: [N, 3]. The [height, width, length] of objects.
    - rotation_cam: [N, 1]. Rotation around y-axis in camera0 coordinate.
    - bboxes_2d: the "bboxes_2d" entry of `np_dict`, returned unchanged.
    - scores: the "scores" entry of `np_dict`, returned unchanged.
    - class_ids: the "class_ids" entry of `np_dict`, returned unchanged.
  """
  boxes_3d = np_dict["bboxes"]
  box_scores = np_dict["scores"]
  box_class_ids = np_dict["class_ids"]
  boxes_2d = np_dict["bboxes_2d"]

  # One velodyne -> camera transform is shared by every box of this scene.
  transform = kitti_data.VeloToCameraTransformation(calib)

  num_boxes = len(boxes_3d)
  location_cam = np.zeros((num_boxes, 3))
  dimension_cam = np.zeros((num_boxes, 3))
  rotation_cam = np.zeros((num_boxes, 1))
  for row, box in enumerate(boxes_3d):
    location, dimension, rotation = kitti_data.BBox3DToKITTIObject(
        box, transform)
    location_cam[row, :] = location
    dimension_cam[row, :] = dimension
    rotation_cam[row, :] = rotation

  return (location_cam, dimension_cam, rotation_cam, boxes_2d, box_scores,
          box_class_ids)


# Class names that get exported. The order matters: when separate per-class
# decoder files are used, main() pairs the i-th decoder path (car, pedestrian,
# cyclist) with the i-th name in this list.
_INCLUDED_KITTI_CLASS_NAMES = ["Car", "Pedestrian", "Cyclist"]


def ExportKITTIDetection(out_dir, source_id, location_cam, dimension_cam,
                         rotation_cam, bboxes_2d, scores, class_name, is_first):
  """Append detections of one class to a KITTI-format text file.

  The file is `<out_dir>/<source_id>.txt`. It is opened in append mode, so
  successive calls for the same `source_id` accumulate lines in that file.

  Args:
    out_dir: directory in which the text file is written.
    source_id: string used as the file name stem.
    location_cam: per-box sequences of 3 location values.
    dimension_cam: per-box sequences of 3 dimension values.
    rotation_cam: per-box rotation; each entry may be a scalar or a
      single-element array.
    bboxes_2d: per-box sequences of 4 2D bounding box values.
    scores: per-box scores. Boxes scoring below `FLAGS.score_threshold` are
      skipped.
    class_name: string written as the first field of every line.
    is_first: if True, an empty string is written before any detection so that
      the file is created even when no detection is exported.
  """
  tf.logging.info("Exporting %s for %s", class_name, source_id)
  fname = out_dir + "/" + source_id + ".txt"
  # 1 string field followed by 15 numeric fields.
  kitti_format_string = ("%s %lf %lf %lf %lf %lf %lf %lf %lf %lf %lf %lf "
                         "%lf %lf %lf %lf")
  with tf.io.gfile.GFile(fname, "a") as fid:
    # Ensure we always create a file even when there's no detection.
    # TODO(shlens): Test whether this is actually necessary on the KITTI
    # eval server.
    if is_first:
      fid.write("")
    for location, dimension, ry, bbox_2d, score in zip(
        location_cam, dimension_cam, rotation_cam, bboxes_2d, scores):
      if score < FLAGS.score_threshold:
        continue
      # Each rotation may arrive as a single-element array. Convert it to a
      # plain Python scalar explicitly instead of relying on the implicit
      # array -> float conversion inside "%lf", which NumPy has deprecated for
      # arrays with ndim > 0.
      rotation_y = np.asarray(ry).item()
      # class_name, three ignored placeholder fields, bbox2D x 4,
      # dimension x 3, location x 3, rotation_y x 1, score x 1
      fill = tuple([class_name, -1, -1, -10] + list(bbox_2d) +
                   list(dimension) + list(location) + [rotation_y, score])
      fid.write(kitti_format_string % fill + "\n")


def main(argv):
  """Read decoder outputs named by the flags and export KITTI text files.

  Either `--decoder_path` (one file holding all classes) or all three of
  `--car_decoder_path`, `--ped_decoder_path` and `--cyc_decoder_path` must be
  given. One `<img_id>.txt` file per image id is written to `--output_dir`.

  Args:
    argv: positional command-line arguments; only the program name is allowed.

  Raises:
    tf.app.UsageError: if extra positional arguments are given, or if the
      decoder path flags are combined inconsistently.
  """
  if len(argv) > 1:
    raise tf.app.UsageError("Too many command-line arguments.")

  # Note the correspondence between _INCLUDED_KITTI_CLASS_NAMES ordering and
  # this list.
  per_class_decoder_paths = [
      FLAGS.car_decoder_path, FLAGS.ped_decoder_path, FLAGS.cyc_decoder_path
  ]
  # Use the same truthiness test for validation and for mode selection, so an
  # empty --decoder_path is treated as "not supplied" in both places.
  is_single_decoder_file = bool(FLAGS.decoder_path)
  # Raise explicitly rather than assert: asserts are stripped under `python -O`.
  if is_single_decoder_file:
    if any(per_class_decoder_paths):
      raise tf.app.UsageError("Either provide decoder_path or "
                              "individual decoders but not both.")
    list_of_decoder_paths = [FLAGS.decoder_path]
  else:
    if not all(per_class_decoder_paths):
      raise tf.app.UsageError("No decoder_path specified. Please supply all "
                              "individual decoder_paths for labels.")
    list_of_decoder_paths = per_class_decoder_paths

  # A list of dictionaries mapping img ids to a dictionary of numpy tensors.
  table_data = []

  img_ids = set()
  for table_path in list_of_decoder_paths:
    img_id_dict = {}
    for serialized in tf.io.tf_record_iterator(table_path):
      record = record_pb2.Record()
      record.ParseFromString(serialized)
      img_id = str(tf.make_ndarray(record.fields["img_id"]))
      img_ids.add(img_id)
      np_dict = {k: tf.make_ndarray(v) for k, v in record.fields.items()}
      img_id_dict[img_id] = np_dict
    table_data.append(img_id_dict)

  # makedirs also creates missing parent directories and succeeds when the
  # directory already exists.
  tf.io.gfile.makedirs(FLAGS.output_dir)

  all_kitti_class_names = kitti_metadata.KITTIMetadata().ClassNames()
  # LoadCalibData reads everything it needs before returning, so the file
  # handle can be released as soon as it is done.
  with tf.io.gfile.GFile(FLAGS.calib_file, "rb") as calib_fid:
    calib_data = LoadCalibData(calib_fid)

  count = 0
  # Sorted so that the processing (and logging) order is reproducible.
  for img_id in sorted(img_ids):
    # Ignore padded samples where the img_ids are empty.
    if not img_id:
      continue
    for table_index, img_id_dict in enumerate(table_data):
      if img_id not in img_id_dict:
        continue
      np_dict = img_id_dict[img_id]

      # Calibration entries are keyed by "<img_id>.txt".
      (location_cam, dimension_cam, rotation_cam, bboxes_2d, scores,
       class_ids) = ExtractNpContent(np_dict, calib_data[img_id + ".txt"])
      if is_single_decoder_file:
        valid_labels = _INCLUDED_KITTI_CLASS_NAMES
      else:
        # Each per-class decoder file only contributes its own class.
        valid_labels = [_INCLUDED_KITTI_CLASS_NAMES[table_index]]
      is_first = table_index == 0
      for class_name in valid_labels:
        class_mask = (class_ids == all_kitti_class_names.index(class_name))
        ExportKITTIDetection(FLAGS.output_dir, img_id,
                             location_cam[class_mask],
                             dimension_cam[class_mask],
                             rotation_cam[class_mask], bboxes_2d[class_mask],
                             scores[class_mask], class_name, is_first)
    count += 1
  tf.logging.info("Total example exported: %d", count)


# Script entry point: hand main() to tf.app.run when executed directly.
if __name__ == "__main__":
  tf.app.run(main)