# Modified by Microsoft Corporation.
# Licensed under the MIT license.
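
"""PTRUNK: an LSTM encoder-decoder with a pointer ("copy") mechanism for
task-oriented dialogue (bAbI dialog and KVR), written in the pre-0.4 PyTorch
style (Variable, .data[0]) used throughout this repository."""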

import math
import random

import numpy as np
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch import optim
from torch.autograd import Variable
from tqdm import tqdm
from utils.config import *
from utils.masked_cross_entropy import *
from utils.measures import wer, moses_multi_bleu


class PTRUNK(nn.Module):
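    """Wrapper that builds (or loads) the encoder/decoder pair and handles
    training, greedy decoding, and evaluation. At each decoding step a sigmoid
    gate decides whether to copy a word from the input (pointer distribution
    over source positions) or to generate one from the output vocabulary."""
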
    def __init__(self, hidden_size, max_len, max_r, lang, path, task, lr, n_layers, dropout):
        super(PTRUNK, self).__init__()
        self.name = "PTRUNK"
        self.task = task
        self.input_size = lang.n_words
        self.output_size = lang.n_words
        self.hidden_size = hidden_size
        self.max_len = max_len  # max input length
        self.max_r = max_r  # max response length
        self.lang = lang
        self.lr = lr
        self.decoder_learning_ratio = 5.0
        self.n_layers = n_layers
        self.dropout = dropout
        if path:
            logging.info("MODEL {} LOADED".format(str(path)))
            if USE_CUDA:
                self.encoder = torch.load(str(path)+'/enc.th')
                self.decoder = torch.load(str(path)+'/dec.th')
            else:
                self.encoder = torch.load(str(path)+'/enc.th', map_location=lambda storage, loc: storage)
                self.decoder = torch.load(str(path)+'/dec.th', map_location=lambda storage, loc: storage)
                self.decoder.viz_arr = []
        else:
            self.encoder = EncoderRNN(lang.n_words, hidden_size, n_layers, dropout)
            self.decoder = PtrDecoderRNN(hidden_size, lang.n_words, n_layers, dropout)
        # Initialize optimizers and criterion
        self.encoder_optimizer = optim.Adam(self.encoder.parameters(), lr=lr)
        self.decoder_optimizer = optim.Adam(self.decoder.parameters(), lr=lr * self.decoder_learning_ratio)
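        # Gate supervision: MSE between the sigmoid gate and the binary copy labels
        # (nn.BCELoss() would be the more conventional choice for a sigmoid output)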
        self.criterion = nn.MSELoss()
        self.loss = 0
        self.loss_gate = 0
        self.loss_ptr = 0
        self.loss_vocab = 0
        self.print_every = 1
        # Move models to GPU
        if USE_CUDA:
            self.encoder.cuda()
            self.decoder.cuda()

    def print_loss(self):
        print_loss_avg = self.loss / self.print_every
        print_loss_gate = self.loss_gate / self.print_every
        print_loss_ptr = self.loss_ptr / self.print_every
        print_loss_vocab = self.loss_vocab / self.print_every
        self.print_every += 1
        return 'L:{:.2f}, VL:{:.2f}, GL:{:.2f}, PL:{:.2f}'.format(print_loss_avg, print_loss_vocab, print_loss_gate, print_loss_ptr)
    
    def save_model(self, dec_type):
        name_data = "KVR/" if self.task == '' else "BABI/"
        prefix = 'save/PTR_KB-' if USEKB else 'save/PTR_noKB-'
        directory = prefix+name_data+str(self.task)+'HDD'+str(self.hidden_size)+'DR'+str(self.dropout)+'L'+str(self.n_layers)+'lr'+str(self.lr)+str(dec_type)
        if not os.path.exists(directory):
            os.makedirs(directory)
        torch.save(self.encoder, directory+'/enc.th')
        torch.save(self.decoder, directory+'/dec.th')
        
    def train_batch(self, input_batches, input_lengths, target_batches,
                    target_lengths, target_index, target_gate, batch_size, clip,
                    teacher_forcing_ratio, reset):
        if reset:
            self.loss = 0
            self.loss_gate = 0
            self.loss_ptr = 0
            self.loss_vocab = 0
            self.print_every = 1
        # Zero gradients of both optimizers
        self.encoder_optimizer.zero_grad()
        self.decoder_optimizer.zero_grad()
        loss_Vocab, loss_Ptr, loss_Gate = 0, 0, 0
        # Run words through encoder
        encoder_outputs, encoder_hidden = self.encoder(input_batches, input_lengths)
      
        # Prepare input and output variables
        decoder_input = Variable(torch.LongTensor([SOS_token] * batch_size))
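        # Initialize the decoder state from the top n_layers of the encoder's final (h, c)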
        decoder_hidden = (encoder_hidden[0][:self.decoder.n_layers], encoder_hidden[1][:self.decoder.n_layers])
        
        max_target_length = max(target_lengths)
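        # Time-major output buffers: [max_target_length, batch, ...]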
        all_decoder_outputs_vocab = Variable(torch.zeros(max_target_length, batch_size, self.output_size))
        all_decoder_outputs_ptr = Variable(torch.zeros(max_target_length, batch_size, encoder_outputs.size(0)))
        all_decoder_outputs_gate = Variable(torch.zeros(max_target_length, batch_size))
        # Move new Variables to CUDA
        if USE_CUDA:
            all_decoder_outputs_vocab = all_decoder_outputs_vocab.cuda()
            all_decoder_outputs_ptr = all_decoder_outputs_ptr.cuda()
            all_decoder_outputs_gate = all_decoder_outputs_gate.cuda()
            decoder_input = decoder_input.cuda()

        # Choose whether to use teacher forcing (decided once per batch, not per time step)
        use_teacher_forcing = random.random() < teacher_forcing_ratio
        
        if use_teacher_forcing:
            # Run through decoder one time step at a time
            for t in range(max_target_length):
                decoder_ptr, decoder_vocab, gate, decoder_hidden = self.decoder(
                    decoder_input, decoder_hidden, encoder_outputs)

                all_decoder_outputs_vocab[t] = decoder_vocab
                all_decoder_outputs_ptr[t] = decoder_ptr
                all_decoder_outputs_gate[t] = gate
                decoder_input = target_batches[t]  # Next input is the current target
                if USE_CUDA: decoder_input = decoder_input.cuda()
                
        else:
            # No teacher forcing: feed back the model's own greedy prediction,
            # copying from the input when the gate fires and generating otherwise
            for t in range(max_target_length):
                decoder_ptr, decoder_vocab, gate, decoder_hidden = self.decoder(
                    decoder_input, decoder_hidden, encoder_outputs)
                all_decoder_outputs_vocab[t] = decoder_vocab
                all_decoder_outputs_ptr[t] = decoder_ptr
                all_decoder_outputs_gate[t] = gate
                topv, topvi = decoder_vocab.data.topk(1)
                topp, toppi = decoder_ptr.data.topk(1)
                ## get the corresponding word in the input
                top_ptr_i = torch.gather(input_batches, 0, toppi.view(1, -1))
                next_in = [top_ptr_i.squeeze()[i].data[0] if (gate.squeeze()[i].data[0] >= 0.5) else topvi.squeeze()[i] for i in range(batch_size)]
                decoder_input = Variable(torch.LongTensor(next_in))  # Chosen word is the next input
                if USE_CUDA: decoder_input = decoder_input.cuda()
                  
        # Loss calculation and backpropagation
        loss_Vocab = masked_cross_entropy(
            all_decoder_outputs_vocab.transpose(0, 1).contiguous(),  # -> batch x seq
            target_batches.transpose(0, 1).contiguous(),  # -> batch x seq
            target_lengths
        )
        loss_Ptr = masked_cross_entropy(
            all_decoder_outputs_ptr.transpose(0, 1).contiguous(),  # -> batch x seq
            target_index.transpose(0, 1).contiguous(),  # -> batch x seq
            target_lengths
        )
        loss_Gate = self.criterion(all_decoder_outputs_gate, target_gate.float())

        # Total objective: vocabulary CE + pointer CE + gate loss
        loss = loss_Vocab + loss_Ptr + loss_Gate
        loss.backward()
        
        # Clip gradient norms
        ec = torch.nn.utils.clip_grad_norm(self.encoder.parameters(), clip)
        dc = torch.nn.utils.clip_grad_norm(self.decoder.parameters(), clip)
        # Update parameters with optimizers
        self.encoder_optimizer.step()
        self.decoder_optimizer.step()
        self.loss += loss.data[0]
        self.loss_gate += loss_Gate.data[0]
        self.loss_ptr += loss_Ptr.data[0]
        self.loss_vocab += loss_Vocab.data[0]
        
        
    def evaluate_batch(self, batch_size, input_batches, input_lengths, target_batches, target_lengths, target_index, target_gate, src_plain):
        # Set to not-training mode to disable dropout
        self.encoder.train(False)
        self.decoder.train(False)  
        # Run words through encoder
        encoder_outputs, encoder_hidden = self.encoder(input_batches, input_lengths)
        # Prepare input and output variables
        decoder_input = Variable(torch.LongTensor([SOS_token] * batch_size))
        decoder_hidden = (encoder_hidden[0][:self.decoder.n_layers], encoder_hidden[1][:self.decoder.n_layers])

        decoded_words = []
        all_decoder_outputs_vocab = Variable(torch.zeros(self.max_r, batch_size, self.decoder.output_size))
        all_decoder_outputs_ptr = Variable(torch.zeros(self.max_r, batch_size, encoder_outputs.size(0)))
        all_decoder_outputs_gate = Variable(torch.zeros(self.max_r, batch_size))
        # Move new Variables to CUDA

        if USE_CUDA:
            all_decoder_outputs_vocab = all_decoder_outputs_vocab.cuda()
            all_decoder_outputs_ptr = all_decoder_outputs_ptr.cuda()
            all_decoder_outputs_gate = all_decoder_outputs_gate.cuda()
            decoder_input = decoder_input.cuda()
        p = [elm.split(' ') for elm in src_plain]
        # Run through decoder one time step at a time
        for t in range(self.max_r):
            decoder_ptr, decoder_vocab, gate, decoder_hidden = self.decoder(
                decoder_input, decoder_hidden, encoder_outputs)
            all_decoder_outputs_vocab[t] = decoder_vocab
            all_decoder_outputs_ptr[t] = decoder_ptr
            all_decoder_outputs_gate[t] = gate

            topv, topvi = decoder_vocab.data.topk(1)
            topp, toppi = decoder_ptr.data.topk(1)
            ## get the corresponding word in the input
            top_ptr_i = torch.gather(input_batches, 0, toppi.view(1, -1))
            next_in = [top_ptr_i.squeeze()[i].data[0] if (gate.squeeze()[i].data[0] >= 0.5) else topvi.squeeze()[i] for i in range(batch_size)]
            decoder_input = Variable(torch.LongTensor(next_in))  # Chosen word is the next input
            if USE_CUDA: decoder_input = decoder_input.cuda()

            temp = []
            for i in range(batch_size):
                # gate >= 0.5: copy the pointed-to source word; otherwise emit the vocabulary word
                if (gate.squeeze()[i].data[0] >= 0.5):
                    if (toppi.squeeze()[i] >= len(p[i])):
                        # pointer fell on padding beyond the source sentence
                        temp.append('<EOS>')
                    else:
                        temp.append(p[i][toppi.squeeze()[i]])
                else:
                    ind = topvi.squeeze()[i]
                    if ind == EOS_token:
                        temp.append('<EOS>')
                    else:
                        temp.append(self.lang.index2word[ind])
            decoded_words.append(temp)

        # Set back to training mode
        self.encoder.train(True)
        self.decoder.train(True)    

        return decoded_words


    def evaluate(self,dev,avg_best,BLEU=False):
        logging.info("STARTING EVALUATION")
        acc_avg = 0.0
        wer_avg = 0.0
        acc_G = 0.0
        acc_P = 0.0
        acc_V = 0.0
        ref = []
        hyp = []
        ref_s = ""
        hyp_s = ""
        pbar = tqdm(enumerate(dev), total=len(dev))
        for j, data_dev in pbar:
            words = self.evaluate_batch(len(data_dev[1]), data_dev[0], data_dev[1], data_dev[2], data_dev[3], data_dev[4], data_dev[5], data_dev[6])
            acc=0
            w = 0
            temp_gen = []
            for i, row in enumerate(np.transpose(words)):
                st = ''
                for e in row:
                    if e == '<EOS>':
                        break
                    else:
                        st += e + ' '
                temp_gen.append(st)
                correct = data_dev[7][i]

                if (correct.strip() == st.strip()):
                    acc += 1
                w += wer(correct.strip(), st.strip())
                ref.append(str(correct.strip()))
                hyp.append(str(st.strip()))
                ref_s += str(correct.strip()) + "\n"
                hyp_s += str(st.strip()) + "\n"

            acc_avg += acc/float(len(data_dev[1]))
            wer_avg += w/float(len(data_dev[1]))
            pbar.set_description("R:{:.4f},W:{:.4f}".format(acc_avg/float(len(dev)),wer_avg/float(len(dev))))

        if BLEU:
            bleu_score = moses_multi_bleu(np.array(hyp), np.array(ref), lowercase=True)
            logging.info("BLEU SCORE:" + str(bleu_score))

            if (bleu_score >= avg_best):
                self.save_model(str(self.name)+str(bleu_score))
                logging.info("MODEL SAVED")
            return bleu_score
        else:              
            acc_avg = acc_avg/float(len(dev))
            if (acc_avg >= avg_best):
                self.save_model(str(self.name)+str(acc_avg))
                logging.info("MODEL SAVED")
            return acc_avg


class EncoderRNN(nn.Module):
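    """Embedding + multi-layer LSTM encoder over time-major ([T, B]) input sequences."""
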
    def __init__(self, input_size, hidden_size, n_layers=1, dropout=0.1):
        super(EncoderRNN, self).__init__()      
        self.input_size = input_size
        self.hidden_size = hidden_size
        self.n_layers = n_layers
        self.dropout = dropout       
        self.embedding = nn.Embedding(input_size, hidden_size)
        self.embedding_dropout = nn.Dropout(dropout) 
        self.lstm = nn.LSTM(hidden_size, hidden_size, n_layers, dropout=self.dropout)
        if USE_CUDA:
            self.lstm = self.lstm.cuda() 
            self.embedding_dropout = self.embedding_dropout.cuda()
            self.embedding = self.embedding.cuda() 

    def get_state(self, input):
        """Get zero-initialized hidden and cell states for the LSTM."""
        batch_size = input.size(1)
        c0_encoder = Variable(torch.zeros(self.n_layers, batch_size, self.hidden_size))
        h0_encoder = Variable(torch.zeros(self.n_layers, batch_size, self.hidden_size))  # first dim would be n_layers * num_directions for a bidirectional LSTM
        if USE_CUDA:
            h0_encoder = h0_encoder.cuda()
            c0_encoder = c0_encoder.cuda()
        return (h0_encoder, c0_encoder)

    def forward(self, input_seqs, input_lengths, hidden=None):
        # Note: we run this all at once (over multiple batches of multiple sequences)
        embedded = self.embedding(input_seqs)
        embedded = self.embedding_dropout(embedded)
        if hidden is None:
            hidden = self.get_state(input_seqs)
        if input_lengths:
            embedded = nn.utils.rnn.pack_padded_sequence(embedded, input_lengths, batch_first=False)

        outputs, hidden = self.lstm(embedded, hidden)
        if input_lengths:
            outputs, _ = nn.utils.rnn.pad_packed_sequence(outputs, batch_first=False)

        return outputs, hidden

class PtrDecoderRNN(nn.Module):
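    """Single-step LSTM decoder with Bahdanau-style pointer attention.

    Given the previous decoder state s and encoder outputs h_1..h_T:
        energy_i = v^T tanh(W1 [s ; h_i])   -> pointer logits p_ptr over source positions
        context  = sum_i softmax(energy)_i h_i
        p_vocab  = U(LSTM([embed(y_prev) ; context]))
        gate     = sigmoid(W s')            -> copy (>= 0.5) vs. generate, with s' the updated state
    """
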
    def __init__(self, hidden_size, output_size, n_layers=1, dropout=0.1):
        super(PtrDecoderRNN, self).__init__()
        self.hidden_size = hidden_size
        self.output_size = output_size ### Vocab size
        self.n_layers = n_layers
        self.dropout = dropout
        self.embedding = nn.Embedding(output_size, hidden_size)
        self.embedding_dropout = nn.Dropout(dropout)
        self.lstm = nn.LSTM(2*hidden_size, hidden_size, n_layers, dropout=dropout)
        self.W1 = nn.Linear(2*hidden_size, hidden_size)
        self.v = nn.Parameter(torch.rand(hidden_size))
        stdv = 1. / math.sqrt(self.v.size(0))
        self.v.data.normal_(mean=0, std=stdv)
        self.concat = nn.Linear(hidden_size * 2, hidden_size)  # note: defined but never used in forward()
        self.U = nn.Linear(hidden_size, output_size)
        self.W = nn.Linear(hidden_size, 1)

        if USE_CUDA:
            self.embedding = self.embedding.cuda()
            self.embedding_dropout = self.embedding_dropout.cuda()
            self.lstm = self.lstm.cuda()
            self.W1 = self.W1.cuda() 
            self.v = self.v.cuda() 
            self.U = self.U.cuda() 
            self.W = self.W.cuda() 

    def forward(self, input_seq, last_hidden, encoder_outputs):
        # Note: we run this one step at a time
        # Get the embedding of the current input word (last output word)
        max_len = encoder_outputs.size(0)
        batch_size = input_seq.size(0)
        encoder_outputs = encoder_outputs.transpose(0, 1)

        word_embedded = self.embedding(input_seq)  # [B, H]
        word_embedded = self.embedding_dropout(word_embedded)

        ## ATTENTION CALCULATION
        s_t = last_hidden[0][-1].unsqueeze(0)
        H = s_t.repeat(max_len, 1, 1).transpose(0, 1)

        energy = F.tanh(self.W1(torch.cat([H, encoder_outputs], 2)))
        energy = energy.transpose(2, 1)
        v = self.v.repeat(encoder_outputs.data.shape[0], 1).unsqueeze(1)  # [B*1*H]
        p_ptr = torch.bmm(v, energy)  # [B*1*T] pointer logits over source positions

        a = F.softmax(p_ptr, dim=2)  # normalize over source positions (explicit dim)
        context = a.bmm(encoder_outputs)

        # Combine embedded input word and attended context, run through RNN
        rnn_input = torch.cat((word_embedded, context.squeeze(1)), 1).unsqueeze(0)
        output, hidden = self.lstm(rnn_input, last_hidden)

        p_vocab = self.U(output)

        gate = F.sigmoid(self.W(hidden[0][-1]))  # copy-vs-generate gate in [0, 1]

        return p_ptr, p_vocab, gate, hidden
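

if __name__ == '__main__':
    # Minimal smoke test for the encoder/decoder pair -- a sketch only; the real
    # training loop lives elsewhere in this repository. All sizes below are made
    # up for illustration, and batches are time-major as elsewhere in this file.
    _T, _B, _V, _H = 5, 2, 20, 8  # src length, batch size, vocab size, hidden size
    enc = EncoderRNN(_V, _H)
    dec = PtrDecoderRNN(_H, _V)
    seqs = Variable(torch.LongTensor(_T, _B).random_(0, _V))  # [T, B] word ids
    dec_in = Variable(torch.LongTensor([SOS_token] * _B))
    if USE_CUDA:
        seqs, dec_in = seqs.cuda(), dec_in.cuda()
    enc_out, enc_hid = enc(seqs, [_T, _T])
    p_ptr, p_vocab, gate, _ = dec(dec_in, (enc_hid[0][:1], enc_hid[1][:1]), enc_out)
    # Expected shapes: p_ptr [B, 1, T], p_vocab [1, B, V], gate [B, 1]
    print(p_ptr.size(), p_vocab.size(), gate.size())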