Python source code of goal_im_controller.py (visual_mpc/policy/cem_controllers), preceded by the repository file tree

visual_foresight-master
- examples
  - dataset_reader.py
- LICENSE
- data_collection
  - kuka
    - head_cam
      - collection_params_dict.json
      - hparams.py
    - 3_View
      - collection_params_dict.json
      - hparams.py
  - sim
    - cartgripper_pusher
      - cube_objects
        hparams.py
    - cartgripper_xz_grasp
      - cube_objects
        hparams.py
    - sawyer_grasp
      - hparams.py
    - cartgripper_grasp
      - grasp_reflex_lblocks
        hparams.py
      - grasp_reflex_cubes
        hparams.py
  - widowx
    - hparams.py
  - sawyer
    - towel_data
      - hparams.py
      - get_examples.py
    - five_view
      - collection_params_dict.json
      - hparams.py
      - hparams_eps.py
    - grasp
      - collection_params_dict.json
      - hparams.py
      - hparams_eps.py
    - multi_env
      - hparams.py
    - hard_object_data
      - hparams.py
    - correlated_noise_bottombias
      - collection_params_dict.json
      - hparams.py
  - baxter
    - head_cam
      - collection_params_dict.json
      - hparams.py
    - 3_View
      - collection_params_dict.json
      - hparams.py
- visual_mpc
  - utils
    - check_dataset.py
    - file_2_record.py
    - file_2_hdf5.py
    - im_utils.py
    - sync.py
    - summarize_dataset.py
    - logger.py
    - __init__.py
  - video_prediction
    - vpred_model_interface.py
    - checkpoint_matcher.py
    - pred_util.py
    - setup_predictor.py
    - __init__.py
  - policy
    - utils
      - controller_utils.py
      - __init__.py
    - policy.py
    - handcrafted
      - lifting_policy.py
      - __init__.py
      - playback_policy.py
    - cem_controllers
      - register_gtruth_controller.py
      - pixel_cost_controller.py
      - cem_base_controller.py
      - goal_im_controller.py
      - human_cem_controller.py
      - variants
        ensemble_vidpred.py
        classifier_controller.py
        nce_cost_controller.py
        __init__.py
      - __init__.py
      - visualizer
        construct_html.py
        __init__.py
        plot_helper.py
      - samplers
        cem_sampler.py
        folding_sampler.py
        autograsp_epsilon.py
        correlated_noise.py
        autograsp_sampler.py
        __init__.py
        gaussian_sampler.py
    - inverse_models
      - __init__.py
      - inverse_model_base_controller.py
    - __init__.py
    - interactive
      - classifier_collector.py
      - __init__.py
    - random
      - random_fold_policy.py
      - __init__.py
      - gaussian.py
      - sampler_policy.py
  - foresight_rospkg
    - src
      - log_cameras.py
      - utils
        camera_calib
        setup_calibrated_sawyer_cams.py
        calibrated_camera.py
        __init__.py
        get_points.py
        __init__.py
        record_motion.py
      - run_robot.py
      - __init__.py
      - video_stream.cpp
    - package.xml
    - CMakeLists.txt
    - __init__.py
    - launch
      - start_impedance.sh
      - start_cameras.py
      - camera.launch
      - start_gripper.launch
  - agent
    - general_agent.py
    - utils
      - raw_saver.py
      - hdf5_saver.py
      - file_saver.py
      - record_saver.py
      - traj_saver.py
      - __init__.py
    - benchmarking_agent.py
    - __init__.py
    - offline_agent.py
  - sim
    - run.py
    - simulator.py
    - util
      - config_agent.py
      - combine_score.py
      - __init__.py
      - synchronize_tfrecs.py
    - __init__.py
    - benchmarks.py
  - __init__.py
  - envs
    - base_env.py
    - mujoco_env
      - cartgripper_env
        base_cartgripper.py
        cartgripper_xz_grasp.py
        cartgripper_pusher.py
        cartgripper_xyz.py
        cartgripper_rot_grasp.py
        util
        sensor_util.py
        __init__.py
        __init__.py
        autograsp_env.py
      - util
        create_xml.py
        __init__.py
      - __init__.py
      - base_mujoco_env.py
      - sawyer_env
        base_sawyer_env.py
        robosuite_wrappers
        BinArena.py
        SawyerIKEnv.py
        __init__.py
        bin_arena.xml
        __init__.py
    - robot_envs
      - base_env.py
      - recorded_trajectories
        README.txt
      - grippers
        kuka
        default_kuka_gripper.py
        __init__.py
        __init__.py
        gripper.py
        sawyer
        default_sawyer_gripper.py
        __init__.py
        weiss
        __init__.py
        wsg50_gripper.py
        wsg50_xml
        wsg_50_mod.urdf
        wsg_50_dependent_joints.yaml
        wsg_50.urdf.xacro
        wsg_50.urdf
        baxter
        default_baxter_gripper.py
        __init__.py
      - kuka
        save_images_from_topic.py
        kuka_interface.py
        inverse_kinematics.py
        __init__.py
        control_util.py
        kuka_impedance.py
      - util
        camera_recorder.py
        __init__.py
        topic_utils.py
        user_interface.py
      - file2hdf5.py
      - vanilla_env.py
      - __init__.py
      - robot_controller_interface.py
      - robot_configs.json
      - widowx
        __init__.py
        widowx
        widowx.urdf
        meshes
        wrist_2_link.stl
        shoulder_link.stl
        base_link.stl
        wrist_1_link.stl
        biceps_link.stl
        gripper_rail_link.stl
        forearm_link.stl
        gripper_hand_fixed_link.stl
        bsd_license.txt
        widowx_controller.py
      - autograsp_env.py
      - sawyer
        sawyer_impedance.py
        register_wsg.py
        inverse_kinematics.py
        __init__.py
        control_util.py
      - franka
        franka_impedance.py
        __init__.py
      - baxter
        inverse_kinematics.py
        __init__.py
        control_util.py
        baxter_impedance.py
    - mjc_models
      - styrofoam_cup
        Shape_IndexedFaceSet_031.stl
        Shape_IndexedFaceSet_016.stl
        Shape_IndexedFaceSet_015.stl
        Shape_IndexedFaceSet_026.stl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_027.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_019.stl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_025.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_024.stl
        Shape_IndexedFaceSet_014.stl
        Shape_IndexedFaceSet_023.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_030.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Shape_IndexedFaceSet_032.stl
        Shape_IndexedFaceSet_022.stl
        Camera.stl
        Shape_IndexedFaceSet_029.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_028.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_020.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_012.stl
        Shape_IndexedFaceSet_021.stl
        Shape_IndexedFaceSet_018.stl
        Shape_IndexedFaceSet_017.stl
      - fox
        Shape_IndexedFaceSet.stl
        Fox.off
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Fox.wrl
        Fox.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Fox_GM.stl
      - GlassBowl
        Shape_IndexedFaceSet_031.stl
        Shape_IndexedFaceSet_016.stl
        Shape_IndexedFaceSet_015.stl
        Shape_IndexedFaceSet_026.stl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_027.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_019.stl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_025.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_024.stl
        Shape_IndexedFaceSet_014.stl
        Shape_IndexedFaceSet_023.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_030.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Shape_IndexedFaceSet_032.stl
        Shape_IndexedFaceSet_033.stl
        Shape_IndexedFaceSet_022.stl
        Shape_IndexedFaceSet_034.stl
        Camera.stl
        Shape_IndexedFaceSet_029.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_028.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_020.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_012.stl
        Shape_IndexedFaceSet_021.stl
        GlassBowl.wrl
        Shape_IndexedFaceSet_018.stl
        Shape_IndexedFaceSet_017.stl
      - sawyer_assets
        meshes
        sawyer
        l5.stl
        l6.stl
        GUIDE_WSG50_110.stl
        l3.stl
        sawyer_ft
        l5.stl
        l3.DAE
        l6.stl
        l0.DAE
        l2.DAE
        l3.stl
        l1.stl
        l0.stl
        l4.DAE
        l2.stl
        l1.DAE
        base.stl
        l4.stl
        WSG50_110.stl
        l2.stl
        sawyer_mp1
        sawyer_pv
        l5.stl
        l6.stl
        l3.stl
        l1.stl
        l0.stl
        l2.stl
        WSG-FMF.stl
        sawyer_mp3
        sawyer_xyz
        sawyer_wsg_base.xml
        shared_config.xml
        sawyer_grasp.xml
      - Fork
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_006.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
        Fork.wrl
      - Rook
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_006.stl
        Lamp.stl
        Rook.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Rook_GM.stl
      - Elephant
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
      - cartgripper_assets
        cartgripper_pusher.xml
        cartgripper_updown_2cam.xml
        __init__.py
        cartgripper_grasp.xml
        cartgripper_xz_grasp.xml
      - Knife
        Shape_IndexedFaceSet.stl
        Lamp.stl
        Camera.stl
        Knife.wrl
      - cupcake
        Shape_IndexedFaceSet.stl
        Lamp.stl
        Camera.stl
      - __init__.py
      - Bowl
        Shape_IndexedFaceSet_031.stl
        Shape_IndexedFaceSet_016.stl
        Shape_IndexedFaceSet_015.stl
        Shape_IndexedFaceSet_026.stl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_027.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_019.stl
        Shape_IndexedFaceSet_010.stl
        Bowl.wrl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_035.stl
        Shape_IndexedFaceSet_025.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_024.stl
        Shape_IndexedFaceSet_014.stl
        Shape_IndexedFaceSet_023.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_030.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Shape_IndexedFaceSet_032.stl
        Shape_IndexedFaceSet_033.stl
        Shape_IndexedFaceSet_022.stl
        Shape_IndexedFaceSet_034.stl
        Camera.stl
        Shape_IndexedFaceSet_029.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_028.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_020.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_012.stl
        Shape_IndexedFaceSet_021.stl
        Shape_IndexedFaceSet_018.stl
        Shape_IndexedFaceSet_017.stl
      - LotusBowl01
        Shape_IndexedFaceSet_031.stl
        Shape_IndexedFaceSet_016.stl
        Shape_IndexedFaceSet_015.stl
        Shape_IndexedFaceSet_026.stl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_027.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_019.stl
        LotusBowl01.wrl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_025.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_024.stl
        Shape_IndexedFaceSet_014.stl
        Shape_IndexedFaceSet_023.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_030.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Shape_IndexedFaceSet_032.stl
        Shape_IndexedFaceSet_033.stl
        Shape_IndexedFaceSet_022.stl
        Shape_IndexedFaceSet_034.stl
        Camera.stl
        Shape_IndexedFaceSet_029.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_028.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_020.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_012.stl
        Shape_IndexedFaceSet_021.stl
        Shape_IndexedFaceSet_018.stl
        Shape_IndexedFaceSet_017.stl
      - RuggedBowl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        RuggedBowl.wrl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_012.stl
        RuggedBowl.off
      - ElephantBowl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_004.stl
        ElephantBowl.wrl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        ElephantBowl.off
      - Queen
        Queen_GM.stl
        Shape_IndexedFaceSet.stl
        Queen.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
      - ServingBowl
        Shape_IndexedFaceSet_031.stl
        Shape_IndexedFaceSet_016.stl
        Shape_IndexedFaceSet_015.stl
        Shape_IndexedFaceSet_026.stl
        Shape_IndexedFaceSet_047.stl
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_027.stl
        Shape_IndexedFaceSet_013.stl
        Shape_IndexedFaceSet_019.stl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Shape_IndexedFaceSet_035.stl
        Shape_IndexedFaceSet_049.stl
        Shape_IndexedFaceSet_046.stl
        Shape_IndexedFaceSet_025.stl
        Shape_IndexedFaceSet_011.stl
        Shape_IndexedFaceSet_036.stl
        Shape_IndexedFaceSet_024.stl
        Shape_IndexedFaceSet_040.stl
        Shape_IndexedFaceSet_042.stl
        Shape_IndexedFaceSet_014.stl
        Shape_IndexedFaceSet_045.stl
        Shape_IndexedFaceSet_023.stl
        Shape_IndexedFaceSet_041.stl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_030.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Shape_IndexedFaceSet_032.stl
        Shape_IndexedFaceSet_033.stl
        Shape_IndexedFaceSet_022.stl
        Shape_IndexedFaceSet_034.stl
        Camera.stl
        Shape_IndexedFaceSet_029.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_028.stl
        ServingBowl.wrl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_020.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_037.stl
        Shape_IndexedFaceSet_044.stl
        Shape_IndexedFaceSet_007.stl
        Shape_IndexedFaceSet_039.stl
        Shape_IndexedFaceSet_048.stl
        Shape_IndexedFaceSet_012.stl
        Shape_IndexedFaceSet_021.stl
        Shape_IndexedFaceSet_038.stl
        ServingBowl.off
        Shape_IndexedFaceSet_043.stl
        Shape_IndexedFaceSet_018.stl
        Shape_IndexedFaceSet_017.stl
      - Pawn
        Pawn_GM.stl
        Shape_IndexedFaceSet.stl
        Pawn.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
      - Spoon
        Shape_IndexedFaceSet.stl
        Shape_IndexedFaceSet_010.stl
        Shape_IndexedFaceSet_004.stl
        Shape_IndexedFaceSet_005.stl
        Spoon.wrl
        Shape_IndexedFaceSet_006.stl
        Shape_IndexedFaceSet_008.stl
        Lamp.stl
        Camera.stl
        Shape_IndexedFaceSet_009.stl
        Shape_IndexedFaceSet_001.stl
        Shape_IndexedFaceSet_002.stl
        Shape_IndexedFaceSet_003.stl
        Shape_IndexedFaceSet_007.stl
    - util
      - interpolation.py
      - action_util.py
      - __init__.py
    - offline_env.py
    - __init__.py
- setup.py
- experiments
  - robonet
    - pixel_cost
      - hparams.py
      - conf.py
    - robotiq
      - fine_tune_start_all.py
      - fine_tune_start_sawyer.py
      - from_scratch.py
      - zero_shot.py
    - new_bin_inlay
      - sawyer_only.py
      - all_robots.py
    - inverse_model
      - sawyer_one_step.py
      - sawyer_two_step.py
      - multibot_one_step.py
      - franka_inverse_conf.py
    - view_generalization
      - single_view.py
      - all_views.py
    - franka
      - franka.py
    - baxter_fine_tune
      - baxter_fine_tune.py
      - sawyer_baxter_fine_tune.py
      - baxter_scratch.py
  - offline_exp
    - towel_classifier
      - hparams.py
      - conf.py
  - sim
    - cartgripper_2d_grasping
      - generate_tasks
        hparams.py
      - pixel_cost
        hparams.py
        conf.py
      - nce_experiments
        hparams.py
        conf.py
    - ensemble_grasping
      - hparams.py
      - generate_tasks.py
      - conf.py
  - sawyer
    - pixel_cost
      - hparams.py
      - conf.py
    - registration_experiments
      - hparams.py
      - gdnconf.py
      - conf.py
    - towel_classifier
      - hparams.py
      - conf.py
    - human_cem
      - hparams.py
      - conf.py
    - mixed_objects
      - hparams_deformable_objects.py
      - conf.py
      - hparams_hardobjects.py
- docker
  - vendor
    - Xdummy
    - 10_nvidia.json
  - Dockerfile
- README.md
- requirements.txt
- .gitignore

import numpy as np
import imp
from .cem_base_controller import CEMBaseController
from .visualizer.construct_html import save_gifs, save_html, save_img, fill_template
import matplotlib.pyplot as plt
from collections import OrderedDict
from visual_mpc.video_prediction.pred_util import get_context, rollout_predictions
import cv2


class GoalImController(CEMBaseController):
    """
    CEM controller that ranks sampled action sequences by how closely the
    final predicted frame of the first camera matches a goal image.

    The cost of an action sequence is the mean squared pixel error between
    the last frame predicted by the video-prediction model and the goal image
    loaded from the ``goal_image_path`` hyperparameter.
    """

    # Goal image used unless the 'goal_image_path' hyperparameter is overridden.
    _DEFAULT_GOAL_IMAGE_PATH = ('/home/sudeep/Documents/ext_data/robot_data/sawyer/goal_images/'
                                'vestri/train/collection/traj1/images0/im_2.jpg')

    def __init__(self, ag_params, policyparams, gpu_id, ngpu):
        """
        Build the video predictor described by ``conf.py`` and cache its
        configuration.

        :param ag_params: agent parameter dictionary; ``ag_params['current_dir']``
                          must contain a ``conf.py`` exposing ``configuration``
        :param policyparams: policy parameter dict
        :param gpu_id: gpu id
        :param ngpu: number of gpus to use
        """
        CEMBaseController.__init__(self, ag_params, policyparams)

        params = imp.load_source('params', ag_params['current_dir'] + '/conf.py')
        netconf = params.configuration
        self.predictor = netconf['setup_predictor'](ag_params, netconf, gpu_id, ngpu, self._logger)

        self._net_bsize = netconf['batch_size']
        self._net_seqlen = netconf['sequence_length']

        self._net_context = netconf['context_frames']
        # planning starts once enough context frames are available
        self._hp.start_planning = self._net_context

        self._n_desig = netconf.get('ndesig', None)
        self._img_height, self._img_width = netconf['orig_size']

        self._n_cam = netconf['ncam']

        self._desig_pix = None
        self._goal_pix = None
        self._images = None

        # (cache key, uint8 RGB image); filled lazily by _load_goal_image
        self._goal_im_cache = None

        if self._hp.predictor_propagation:
            self._rec_input_distrib = []  # record the input distributions

    def _default_hparams(self):
        """
        Extend the parent hyperparameters with the ones specific to this
        controller.

        :return: the parent's hparams object with the extra entries added
        """
        default_dict = {
            "verbose_img_height": 128,
            'predictor_propagation': False,
            'only_take_first_view': False,
            'state_append': None,
            'finalweight': 10.,
            # path of the image the final predicted frame is compared against
            'goal_image_path': self._DEFAULT_GOAL_IMAGE_PATH,
        }
        parent_params = super(GoalImController, self)._default_hparams()

        for name, value in default_dict.items():
            parent_params.add_hparam(name, value)
        return parent_params

    def reset(self):
        """Reset the parent controller and clear recorded input distributions."""
        super(GoalImController, self).reset()
        if self._hp.predictor_propagation:
            self._rec_input_distrib = []  # record the input distributions

    def _load_goal_image(self, height, width):
        """
        Load the goal image, resized to the prediction resolution.

        The result is cached so that the file is not re-read and re-resized on
        every CEM iteration.

        :param height: target image height in pixels
        :param width: target image width in pixels
        :return: uint8 RGB image of shape [height, width, 3]
        :raises IOError: if the goal image cannot be read
        """
        path = self._hp.goal_image_path
        key = (path, int(height), int(width))
        cached = getattr(self, '_goal_im_cache', None)
        if cached is not None and cached[0] == key:
            return cached[1]

        goalim = cv2.imread(path)
        if goalim is None:
            # cv2.imread reports a missing/unreadable file by returning None
            raise IOError('could not read goal image: {}'.format(path))

        # cv2.resize expects the target size as (width, height)
        goalim = cv2.resize(goalim, (int(width), int(height)), interpolation=cv2.INTER_AREA)
        goalim = cv2.cvtColor(goalim, cv2.COLOR_BGR2RGB)

        self._goal_im_cache = (key, goalim)
        return goalim

    def evaluate_rollouts(self, actions, cem_itr):
        """
        Score every sampled action sequence by the pixel distance between its
        final predicted frame (camera 0) and the goal image.

        :param actions: sampled action sequences handed to the predictor
        :param cem_itr: index of the current CEM iteration
        :return: 1-d array with one cost per action sequence (lower is better)
        """
        last_frames, last_states = get_context(self._net_context, self._t,
                                               self._state, self._images, self._hp)

        gen_images, _, _ = rollout_predictions(self.predictor, self._net_bsize, actions,
                                               last_frames, last_states)
        gen_images = np.concatenate(gen_images, 0)

        # gen_images is indexed as [sample, time, cam, row, col, channel]
        height, width = gen_images.shape[3:5]
        goalim = self._load_goal_image(height, width)

        # The predicted frames are rendered as `gen_images * 255` for the
        # visualizations, i.e. they are [0, 1] floats; bring the uint8 goal
        # image onto the same scale before comparing.
        goal_float = goalim.astype(np.float32) / 255.

        # Broadcasting over the sample axis handles any number of sequences.
        final_frames = gen_images[:, -1, 0]
        scores = ((final_frames - goal_float[None]) ** 2).mean((1, 2, 3))

        if self._verbose_condition(cem_itr):
            self._save_verbose(cem_itr, scores, gen_images, goalim)

        return scores

    def _save_verbose(self, cem_itr, scores, gen_images, goalim):
        """
        Write an HTML summary of the ten best-scoring rollouts.

        :param cem_itr: index of the current CEM iteration
        :param scores: cost per action sequence
        :param gen_images: predicted frames for every action sequence
        :param goalim: uint8 RGB goal image shown next to the predictions
        """
        verbose_folder = "planning_{}_itr_{}".format(self._t, cem_itr)
        content_dict = OrderedDict()
        visualize_indices = scores.argsort()[:10]
        n_shown = len(visualize_indices)

        # start images
        for c in range(self._n_cam):
            name = 'cam_{}_start'.format(c)
            save_path = save_img(self._verbose_worker, verbose_folder, name, self._images[-1, c])
            content_dict[name] = [save_path] * n_shown

        # goal image (the same image is shown in every camera row)
        for c in range(self._n_cam):
            name = 'cam_{}_goal'.format(c)
            save_path = save_img(self._verbose_worker, verbose_folder, name, goalim)
            content_dict[name] = [save_path] * n_shown

        # render predicted images
        for c in range(self._n_cam):
            verbose_images = [(gen_images[g_i, :, c] * 255).astype(np.uint8) for g_i in visualize_indices]
            row_name = 'cam_{}_pred_images'.format(c)
            content_dict[row_name] = save_gifs(self._verbose_worker, verbose_folder,
                                               row_name, verbose_images)

        # save scores
        content_dict['scores'] = scores[visualize_indices]
        html_page = fill_template(cem_itr, self._t, content_dict, img_height=self._hp.verbose_img_height)
        save_html(self._verbose_worker, "{}/plan.html".format(verbose_folder), html_page)

    def act(self, t=None, i_tr=None, desig_pix=None, goal_pix=None, images=None, state=None, verbose_worker=None):
        """
        Store the current observation and delegate action selection to the
        parent CEM controller.

        :param t: the current controller's time step
        :param i_tr: forwarded unchanged to the parent's ``act``
        :param desig_pix: unused by this controller; accepted for interface
                          compatibility
        :param goal_pix: unused by this controller; accepted for interface
                         compatibility
        :param images: images observed so far; used as prediction context and
                       for the verbose output
        :param state: forwarded unchanged to the parent's ``act``
        :param verbose_worker: worker handed to the save_* helpers when
                               writing verbose output
        :return: whatever the parent's ``act`` returns
        """
        self._images = images

        self._verbose_worker = verbose_worker

        return super(GoalImController, self).act(t, i_tr, state)