python source code of file_2

visual_foresight-master
- examples
  - dataset_reader.py
- LICENSE
- data_collection
  - kuka
    - head_cam
      - collection_params_dict.json
      - hparams.py
    - 3_View
      - collection_params_dict.json
      - hparams.py
  - sim
    - cartgripper_pusher
      - cube_objects
        hparams.py
    - cartgripper_xz_grasp
      - cube_objects
        hparams.py
    - sawyer_grasp
      - hparams.py
    - cartgripper_grasp
      - grasp_reflex_lblocks
        hparams.py
      - grasp_reflex_cubes
        hparams.py
  - widowx
    - hparams.py
  - sawyer
    - towel_data
      - hparams.py
      - get_examples.py
    - five_view
      - collection_params_dict.json
      - hparams.py
      - hparams_eps.py
    - grasp
      - collection_params_dict.json
      - hparams.py
      - hparams_eps.py
    - multi_env
      - hparams.py
    - hard_object_data
      - hparams.py
    - correlated_noise_bottombias
      - collection_params_dict.json
      - hparams.py
  - baxter
    - head_cam
      - collection_params_dict.json
      - hparams.py
    - 3_View
      - collection_params_dict.json
      - hparams.py
- visual_mpc
  - utils
    - check_dataset.py
    - file_2_record.py
    - file_2_hdf5.py
    - im_utils.py
    - sync.py
    - summarize_dataset.py
    - logger.py
    - __init__.py
  - video_prediction
    - vpred_model_interface.py
    - checkpoint_matcher.py
    - pred_util.py
    - setup_predictor.py
    - __init__.py
  - policy
    - utils
      - controller_utils.py
      - __init__.py
    - policy.py
    - handcrafted
      - lifting_policy.py
      - __init__.py
      - playback_policy.py
    - cem_controllers
      - register_gtruth_controller.py
      - pixel_cost_controller.py
      - cem_base_controller.py
      - goal_im_controller.py
      - human_cem_controller.py
      - variants
        ensemble_vidpred.py
        classifier_controller.py
        nce_cost_controller.py
        __init__.py
      - __init__.py
      - visualizer
        construct_html.py
        __init__.py
        plot_helper.py
      - samplers
        cem_sampler.py
        folding_sampler.py
        autograsp_epsilon.py
        correlated_noise.py
        autograsp_sampler.py
        __init__.py
        gaussian_sampler.py
    - inverse_models
      - __init__.py
      - inverse_model_base_controller.py
    - __init__.py
    - interactive
      - classifier_collector.py
      - __init__.py
    - random
      - random_fold_policy.py
      - __init__.py
      - gaussian.py
      - sampler_policy.py
  - foresight_rospkg
    - src
      - log_cameras.py
      - utils
        camera_calib
        setup_calibrated_sawyer_cams.py
        calibrated_camera.py
        __init__.py
        get_points.py
        __init__.py
        record_motion.py
      - run_robot.py
      - __init__.py
      - video_stream.cpp
    - package.xml
    - CMakeLists.txt
    - __init__.py
    - launch
      - start_impedance.sh
      - start_cameras.py
      - camera.launch
      - start_gripper.launch
  - agent
    - general_agent.py
    - utils
      - raw_saver.py
      - hdf5_saver.py
      - file_saver.py
      - record_saver.py
      - traj_saver.py
      - __init__.py
    - benchmarking_agent.py
    - __init__.py
    - offline_agent.py
  - sim
    - run.py
    - simulator.py
    - util
      - config_agent.py
      - combine_score.py
      - __init__.py
      - synchronize_tfrecs.py
    - __init__.py
    - benchmarks.py
  - __init__.py
  - envs
    - base_env.py
    - mujoco_env
      - cartgripper_env
        base_cartgripper.py
        cartgripper_xz_grasp.py
        cartgripper_pusher.py
        cartgripper_xyz.py
        cartgripper_rot_grasp.py
        util
        sensor_util.py
        __init__.py
        __init__.py
        autograsp_env.py
      - util
        create_xml.py
        __init__.py
      - __init__.py
      - base_mujoco_env.py
      - sawyer_env
        base_sawyer_env.py
        robosuite_wrappers
        BinArena.py
        SawyerIKEnv.py
        __init__.py
        bin_arena.xml
        __init__.py
    - robot_envs
      - base_env.py
      - recorded_trajectories
        README.txt
      - grippers
        kuka
        default_kuka_gripper.py
        __init__.py
        __init__.py
        gripper.py
        sawyer
        default_sawyer_gripper.py
        __init__.py
        weiss
        __init__.py
        wsg50_gripper.py
        wsg50_xml
        wsg_50_mod.urdf
        wsg_50_dependent_joints.yaml
        wsg_50.urdf.xacro
        wsg_50.urdf
        baxter
        default_baxter_gripper.py
        __init__.py
      - kuka
        save_images_from_topic.py
        kuka_interface.py
        inverse_kinematics.py
        __init__.py
        control_util.py
        kuka_impedance.py
      - util
        camera_recorder.py
        __init__.py
        topic_utils.py
        user_interface.py
      - file2hdf5.py
      - vanilla_env.py
      - __init__.py
      - robot_controller_interface.py
      - robot_configs.json
      - widowx
        __init__.py
        widowx
        widowx.urdf
        meshes
        wrist_2_link.stl
        shoulder_link.stl
        base_link.stl
        wrist_1_link.stl
        biceps_link.stl
        gripper_rail_link.stl
        forearm_link.stl
        gripper_hand_fixed_link.stl
        bsd_license.txt
        widowx_controller.py
      - autograsp_env.py
      - sawyer
        sawyer_impedance.py
        register_wsg.py
        inverse_kinematics.py
        __init__.py
        control_util.py
      - franka
        franka_impedance.py
        __init__.py
      - baxter
        inverse_kinematics.py
        __init__.py
        control_util.py
        baxter_impedance.py
    - mjc_models
      - styrofoam_cup
        Shape_IndexedFaceSet_031.stl
        Shape_IndexedFaceSet_016.stl
        Shape_IndexedFaceSet_015.stl
        Shape_IndexedFaceSet_026.stl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_027.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_019.stl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_025.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_024.stl
        Shape_IndexedFaceSet_014.stl
        Shape_IndexedFaceSet_023.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_030.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Shape_IndexedFaceSet_032.stl
        Shape_IndexedFaceSet_022.stl
        Camera.stl
        Shape_IndexedFaceSet_029.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_028.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_020.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_012.stl
        Shape_IndexedFaceSet_021.stl
        Shape_IndexedFaceSet_018.stl
        Shape_IndexedFaceSet_017.stl
      - fox
        Shape_IndexedFaceSet.stl
        Fox.off
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Fox.wrl
        Fox.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Fox_GM.stl
      - GlassBowl
        Shape_IndexedFaceSet_031.stl
        Shape_IndexedFaceSet_016.stl
        Shape_IndexedFaceSet_015.stl
        Shape_IndexedFaceSet_026.stl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_027.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_019.stl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_025.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_024.stl
        Shape_IndexedFaceSet_014.stl
        Shape_IndexedFaceSet_023.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_030.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Shape_IndexedFaceSet_032.stl
        Shape_IndexedFaceSet_033.stl
        Shape_IndexedFaceSet_022.stl
        Shape_IndexedFaceSet_034.stl
        Camera.stl
        Shape_IndexedFaceSet_029.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_028.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_020.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_012.stl
        Shape_IndexedFaceSet_021.stl
        GlassBowl.wrl
        Shape_IndexedFaceSet_018.stl
        Shape_IndexedFaceSet_017.stl
      - sawyer_assets
        meshes
        sawyer
        l5.stl
        l6.stl
        GUIDE_WSG50_110.stl
        l3.stl
        sawyer_ft
        l5.stl
        l3.DAE
        l6.stl
        l0.DAE
        l2.DAE
        l3.stl
        l1.stl
        l0.stl
        l4.DAE
        l2.stl
        l1.DAE
        base.stl
        l4.stl
        WSG50_110.stl
        l2.stl
        sawyer_mp1
        sawyer_pv
        l5.stl
        l6.stl
        l3.stl
        l1.stl
        l0.stl
        l2.stl
        WSG-FMF.stl
        sawyer_mp3
        sawyer_xyz
        sawyer_wsg_base.xml
        shared_config.xml
        sawyer_grasp.xml
      - Fork
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_006.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
        Fork.wrl
      - Rook
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_006.stl
        Lamp.stl
        Rook.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Rook_GM.stl
      - Elephant
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
      - cartgripper_assets
        cartgripper_pusher.xml
        cartgripper_updown_2cam.xml
        __init__.py
        cartgripper_grasp.xml
        cartgripper_xz_grasp.xml
      - Knife
        Shape_IndexedFaceSet.stl
        Lamp.stl
        Camera.stl
        Knife.wrl
      - cupcake
        Shape_IndexedFaceSet.stl
        Lamp.stl
        Camera.stl
      - __init__.py
      - Bowl
        Shape_IndexedFaceSet_031.stl
        Shape_IndexedFaceSet_016.stl
        Shape_IndexedFaceSet_015.stl
        Shape_IndexedFaceSet_026.stl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_027.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_019.stl
        Shape_IndexedFaceSet_010.stl
        Bowl.wrl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_035.stl
        Shape_IndexedFaceSet_025.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_024.stl
        Shape_IndexedFaceSet_014.stl
        Shape_IndexedFaceSet_023.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_030.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Shape_IndexedFaceSet_032.stl
        Shape_IndexedFaceSet_033.stl
        Shape_IndexedFaceSet_022.stl
        Shape_IndexedFaceSet_034.stl
        Camera.stl
        Shape_IndexedFaceSet_029.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_028.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_020.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_012.stl
        Shape_IndexedFaceSet_021.stl
        Shape_IndexedFaceSet_018.stl
        Shape_IndexedFaceSet_017.stl
      - LotusBowl01
        Shape_IndexedFaceSet_031.stl
        Shape_IndexedFaceSet_016.stl
        Shape_IndexedFaceSet_015.stl
        Shape_IndexedFaceSet_026.stl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_027.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_019.stl
        LotusBowl01.wrl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_025.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_024.stl
        Shape_IndexedFaceSet_014.stl
        Shape_IndexedFaceSet_023.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_030.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Shape_IndexedFaceSet_032.stl
        Shape_IndexedFaceSet_033.stl
        Shape_IndexedFaceSet_022.stl
        Shape_IndexedFaceSet_034.stl
        Camera.stl
        Shape_IndexedFaceSet_029.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_028.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_020.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_012.stl
        Shape_IndexedFaceSet_021.stl
        Shape_IndexedFaceSet_018.stl
        Shape_IndexedFaceSet_017.stl
      - RuggedBowl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        RuggedBowl.wrl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_012.stl
        RuggedBowl.off
      - ElephantBowl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_004.stl
        ElephantBowl.wrl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        ElephantBowl.off
      - Queen
        Queen_GM.stl
        Shape_IndexedFaceSet.stl
        Queen.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
      - ServingBowl
        Shape_IndexedFaceSet_031.stl
        Shape_IndexedFaceSet_016.stl
        Shape_IndexedFaceSet_015.stl
        Shape_IndexedFaceSet_026.stl
        Shape_IndexedFaceSet_047.stl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_027.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_019.stl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_035.stl
        Shape_IndexedFaceSet_049.stl
        Shape_IndexedFaceSet_046.stl
        Shape_IndexedFaceSet_025.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_036.stl
        Shape_IndexedFaceSet_024.stl
        Shape_IndexedFaceSet_040.stl
        Shape_IndexedFaceSet_042.stl
        Shape_IndexedFaceSet_014.stl
        Shape_IndexedFaceSet_045.stl
        Shape_IndexedFaceSet_023.stl
        Shape_IndexedFaceSet_041.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_030.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Shape_IndexedFaceSet_032.stl
        Shape_IndexedFaceSet_033.stl
        Shape_IndexedFaceSet_022.stl
        Shape_IndexedFaceSet_034.stl
        Camera.stl
        Shape_IndexedFaceSet_029.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_028.stl
        ServingBowl.wrl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_020.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_037.stl
        Shape_IndexedFaceSet_044.stl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_039.stl
        Shape_IndexedFaceSet_048.stl
        Shape_IndexedFaceSet_012.stl
        Shape_IndexedFaceSet_021.stl
        Shape_IndexedFaceSet_038.stl
        ServingBowl.off
        Shape_IndexedFaceSet_043.stl
        Shape_IndexedFaceSet_018.stl
        Shape_IndexedFaceSet_017.stl
      - Pawn
        Pawn_GM.stl
        Shape_IndexedFaceSet.stl
        Pawn.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
      - Spoon
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Spoon.wrl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
    - util
      - interpolation.py
      - action_util.py
      - __init__.py
    - offline_env.py
    - __init__.py
- setup.py
- experiments
  - robonet
    - pixel_cost
      - hparams.py
      - conf.py
    - robotiq
      - fine_tune_start_all.py
      - fine_tune_start_sawyer.py
      - from_scratch.py
      - zero_shot.py
    - new_bin_inlay
      - sawyer_only.py
      - all_robots.py
    - inverse_model
      - sawyer_one_step.py
      - sawyer_two_step.py
      - multibot_one_step.py
      - franka_inverse_conf.py
    - view_generalization
      - single_view.py
      - all_views.py
    - franka
      - franka.py
    - baxter_fine_tune
      - baxter_fine_tune.py
      - sawyer_baxter_fine_tune.py
      - baxter_scratch.py
  - offline_exp
    - towel_classifier
      - hparams.py
      - conf.py
  - sim
    - cartgripper_2d_grasping
      - generate_tasks
        hparams.py
      - pixel_cost
        hparams.py
        conf.py
      - nce_experiments
        hparams.py
        conf.py
    - ensemble_grasping
      - hparams.py
      - generate_tasks.py
      - conf.py
  - sawyer
    - pixel_cost
      - hparams.py
      - conf.py
    - registration_experiments
      - hparams.py
      - gdnconf.py
      - conf.py
    - towel_classifier
      - hparams.py
      - conf.py
    - human_cem
      - hparams.py
      - conf.py
    - mixed_objects
      - hparams_deformable_objects.py
      - conf.py
      - hparams_hardobjects.py
- docker
  - vendor
    - Xdummy
    - 10_nvidia.json
  - Dockerfile
- README.md
- requirements.txt
- .gitignore

import h5py
import cv2
import numpy as np
import copy
import os
import imageio
import io
from multiprocessing import Pool, Manager
from visual_mpc.utils.sync import ManagedSyncCounter
import random
import functools
from tqdm import tqdm


MANDATORY_KEYS = ['camera_configuration', 'policy_desc', 'bin_type', 'bin_insert', 'contains_annotation',
                                'robot', 'gripper', 'background', 'action_space', 'object_classes', 'primitives', 'camera_type']


def serialize_image(img):
    assert img.dtype == np.uint8, "Must be uint8!"
    return cv2.imencode('.jpg', img)[1]


def serialize_video(imgs, temp_name_append):
    mp4_name = './temp{}.mp4'.format(temp_name_append)
    try:
        assert imgs.dtype == np.uint8, "Must be uint8 array!"
        assert not os.path.exists(mp4_name), "file {} exists!".format(mp4_name)
        # this is a hack to ensure imageio succesfully saves as a mp4 (instead of getting encoding confused)
        writer = imageio.get_writer(mp4_name)
        [writer.append_data(i[:, :, ::-1]) for i in imgs]
        writer.close()

        f = open(mp4_name, 'rb')
        buf = f.read()
        f.close()
    finally:
        if os.path.exists(mp4_name):
            os.remove(mp4_name)

    return np.frombuffer(buf, dtype=np.uint8)


def save_dict(data_container, dict_group, video_encoding, t_index):
    for k, d in data_container.items():
                    if 'images' == k:
                        T, n_cams = d.shape[:2]
                        dict_group.attrs['n_cams'] = n_cams

                        for n in range(n_cams):
                            dict_group.attrs['cam_encoding'] = video_encoding
                            cam_group = dict_group.create_group("cam{}_video".format(n))
                            if video_encoding == 'mp4':
                                data = cam_group.create_dataset("frames", data=serialize_video(d[:, n], t_index))
                                data.attrs['shape'] = d[0, n].shape
                                data.attrs['T'] = d.shape[0]
                                data.attrs['image_format'] = 'RGB'
                            elif video_encoding == 'jpeg':
                                for t in range(T):
                                    data = cam_group.create_dataset("frame{}".format(t), data=serialize_image(d[t, n]))
                                    data.attrs['shape'] = d[t, n].shape
                                    data.attrs['image_format'] = 'RGB'
                            else:
                                raise ValueError
                    elif 'image' in k:
                        data = dict_group.create_dataset(k, data=serialize_image(d))
                        data.attrs['shape'] = d.shape
                    else:
                        dict_group.create_dataset(k, data=d)


def save_hdf5(filename, env_obs, policy_out, agent_data, meta_data, video_encoding='mp4', t_index=None):
    if t_index is None:
        t_index = random.randint(0, 9999999)
    # meta-data includes calibration "number", policy "type" descriptor, environment bounds
    with h5py.File(filename, 'w') as f:
        f.create_dataset('file_version', data='0.1.0')
        [save_dict(data_container, f.create_group(name), video_encoding, t_index) for data_container, name in zip([env_obs, agent_data], ['env', 'misc'])]

        policy_dict = {}
        first_keys = list(policy_out[0].keys())
        for k in first_keys:
            assert all([k in p for p in policy_out[1:]]), "hdf5 format requires keys must be uniform across time!"
            policy_dict[k] = np.concatenate([p[k][None] for p in policy_out], axis=0)
        save_dict(policy_dict, f.create_group('policy'), video_encoding, t_index)

        meta_data_group = f.create_group('metadata')
        for mandatory_key in MANDATORY_KEYS:
            meta_data_group.attrs[mandatory_key] = meta_data.pop(mandatory_key)
        
        for k in meta_data.keys():
            meta_data_group.attrs[k] = meta_data[k]
            

def save_worker(traj_data, cntr, group_name=''):
    t_index = random.randint(0, 9999999)
    t, meta_data = traj_data

    try:
        env_obs = pkl.load(open('{}/obs_dict.pkl'.format(t), 'rb'), encoding='latin1')
        if meta_data['contains_annotation']:
            env_obs['bbox_annotations'] = pkl.load(open('{}/annotation_array.pkl'.format(t), 'rb'), encoding='latin1')
        n_cams = len(glob.glob('{}/images*'.format(t)))
        if n_cams:
            T = min([len(glob.glob('{}/images{}/*.jpg'.format(t, i))) for i in range(n_cams)])
            height, width = cv2.imread('{}/images0/im_0.jpg'.format(t)).shape[:2]
            env_obs['images'] = np.zeros((T, n_cams, height, width, 3), dtype=np.uint8)

            for n in range(n_cams):
                for time in range(T):
                    env_obs['images'][time, n] = cv2.imread('{}/images{}/im_{}.jpg'.format(t, n, time))

        policy_out = pkl.load(open('{}/policy_out.pkl'.format(t), 'rb'), encoding='latin1')
        agent_data = pkl.load(open('{}/agent_data.pkl'.format(t), 'rb'), encoding='latin1')

        def store_in_metadata_if_exists(key):  
            if key in agent_data:
                meta_data[key] = agent_data.pop(key)
        [store_in_metadata_if_exists(k) for k in ['goal_reached', 'term_t']]

        c = cntr.ret_increment
        save_hdf5('{}/{}traj{}.hdf5'.format(args.output_folder, group_name, c), env_obs, policy_out, agent_data, meta_data, video_encoding, t_index)
        return True
    except (FileNotFoundError, NotADirectoryError):
        return False


if __name__ == '__main__':
    import argparse
    import glob
    import json
    import random
    import sys
    import os
    import shutil
    import math
    if sys.version_info[0] == 2:
        import cPickle as pkl
        input_fn = raw_input
    else:
        import pickle as pkl
        input_fn = input

    parser = argparse.ArgumentParser(description="converts dataset from pkl format to hdf5")
    parser.add_argument('input_folder', type=str, help='where raw files are stored')
    parser.add_argument('output_folder', type=str, help='where to save')
    parser.add_argument('--output_group_name', type=str, default='', help='name to prepend in front of trajs')
    parser.add_argument('--video_jpeg_encoding', action='store_true', default=False, help='uses jpeg encoding for video frames instead of mp4')
    parser.add_argument('--counter', type=int, help='where to start counter', default=0)
    parser.add_argument('--n_workers', type=int, help='number of multi-threaded workers', default=1)
    args = parser.parse_args()

    assert args.n_workers >= 1, "can't have less than 1 worker thread!"
    args.input_folder, args.output_folder = [os.path.expanduser(x) for x in (args.input_folder, args.output_folder)]
    if not os.path.exists(args.output_folder):
        os.makedirs(args.output_folder)
    elif input_fn('path {} exists, should folder be deleted? (y/n): '.format(args.output_folder)) == 'y':
        shutil.rmtree(args.output_folder)
        os.makedirs(args.output_folder)   
    
    if args.video_jpeg_encoding:
        video_encoding = 'jpeg'
    else:
        video_encoding = 'mp4'
        if len(glob.glob('./temp*.mp4')) != 0:
            print("Please delete all temp*.mp4 files! (needed for saving)")
            raise EnvironmentError
    
    traj_groups = glob.glob(args.input_folder + "/*")
    print('found {} traj groups!'.format(len(traj_groups)))

    trajs, annotations_loaded = [], 0
    for group in traj_groups:
        meta_data_dict = json.load(open('{}/hparams.json'.format(group), 'r'))
        group_trajs = glob.glob('{}/*'.format(group))
        for t in group_trajs:
            traj_meta_data = copy.deepcopy(meta_data_dict)
            traj_meta_data['object_batch'] = group
            if os.path.exists('{}/annotation_array.pkl'.format(t)):
                traj_meta_data['contains_annotation'] = True
                annotations_loaded += 1
            else:
                traj_meta_data['contains_annotation'] = False
            
            if isinstance(traj_meta_data['object_classes'], str):
                traj_meta_data['object_classes'] = traj_meta_data['object_classes'].split("+")
            
            assert all([k in traj_meta_data for k in MANDATORY_KEYS]), 'metadata for {} is missing keys!'.format(t)
            assert isinstance(traj_meta_data['object_classes'], list), "did not split object classes!"
            assert all([isinstance(x, str) for x in traj_meta_data['object_classes']]), 'object classes is not a string!'

            trajs.append((t, traj_meta_data))
    random.shuffle(trajs)
    
    print('Loaded {} trajectories with {} annotations!'.format(len(trajs), annotations_loaded))

    cntr = ManagedSyncCounter(Manager(), args.counter)
    if args.n_workers == 1:
        saved = 0
        for t in tqdm(trajs):
            saved += save_worker(t, cntr, args.output_group_name)
        
        print('saved {} total trajs'.format(saved))
    else:
        map_fn = functools.partial(save_worker, cntr=cntr, group_name=args.output_group_name)
        p = Pool(args.n_workers)
        print('saved {} total trajs'.format(sum(tqdm(p.imap_unordered(map_fn, trajs), total=len(trajs)))))