import tensorflow as tf
import numpy as np


class MaSIF_ppi_search:
    """
    The neural network model to classify a pair of surface patches as binders
    or non-binders.
    """

    def count_number_parameters(self):
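        """Print every trainable variable and the total number of parameters."""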
        total_parameters = 0
        for variable in tf.trainable_variables():
            # shape is an array of tf.Dimension
            shape = variable.get_shape()
            print(variable)
            variable_parameters = 1
            for dim in shape:
                variable_parameters *= dim.value
            print(variable_parameters)
            total_parameters += variable_parameters
        print("Total number parameters: %d" % total_parameters)

    def frobenius_norm(self, tensor):
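        """Return the Frobenius norm, i.e. the sqrt of the sum of squared entries."""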
        square_tensor = tf.square(tensor)
        tensor_sum = tf.reduce_sum(square_tensor)
        frobenius_norm = tf.sqrt(tensor_sum)
        return frobenius_norm

    def build_sparse_matrix_softmax(self, idx_non_zero_values, X, dense_shape_A):
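        """Build a SparseTensor from indices/values and apply a sparse softmax."""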
        # tf.SparseTensor (not tf.SparseTensorValue, which is only a feed value)
        # is required by the sparse ops below.
        A = tf.SparseTensor(idx_non_zero_values, tf.squeeze(X), dense_shape_A)
        A = tf.sparse_reorder(A)  # n_edges x n_edges
        A = tf.sparse_softmax(A)

        return A

    def compute_initial_coordinates(self):
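        """Return the initial (rho, theta) polar grid for the Gaussian kernels.

        rho takes n_rhos values in (0, max_rho]; theta takes n_thetas values
        in [0, 2*pi). The result has shape (n_rhos * n_thetas, 2), one grid
        point per row.
        """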
        range_rho = [0.0, self.max_rho]
        range_theta = [0, 2 * np.pi]

        grid_rho = np.linspace(range_rho[0], range_rho[1], num=self.n_rhos + 1)
        grid_rho = grid_rho[1:]
        grid_theta = np.linspace(range_theta[0], range_theta[1], num=self.n_thetas + 1)
        grid_theta = grid_theta[:-1]

        grid_rho_, grid_theta_ = np.meshgrid(grid_rho, grid_theta, sparse=False)
        # The transposes are needed to match the behaviour of the original MATLAB code.
        grid_rho_ = grid_rho_.T
        grid_theta_ = grid_theta_.T
        grid_rho_ = grid_rho_.flatten()
        grid_theta_ = grid_theta_.flatten()

        coords = np.concatenate((grid_rho_[None, :], grid_theta_[None, :]), axis=0)
        coords = coords.T  # every row contains the coordinates of a grid intersection
        print(coords.shape)
        return coords

    def inference(
        self,
        input_feat,
        rho_coords,
        theta_coords,
        mask,
        W_conv,
        b_conv,
        mu_rho,
        sigma_rho,
        mu_theta,
        sigma_theta,
        eps=1e-5,
        mean_gauss_activation=True,
    ):
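        """Apply one geodesic convolution layer to a single input feature.

        For each of the n_rotations angular offsets, the patch coordinates are
        soft-assigned to the learned Gaussian grid (mu/sigma in rho and theta),
        the feature is pooled over the patch vertices, and a linear layer
        (W_conv, b_conv) is applied. The maximum over rotations is taken,
        followed by a ReLU.
        """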
        n_samples = tf.shape(rho_coords)[0]
        n_vertices = tf.shape(rho_coords)[1]

        all_conv_feat = []
        for k in range(self.n_rotations):
            rho_coords_ = tf.reshape(rho_coords, [-1, 1])  # batch_size*n_vertices, 1
            thetas_coords_ = tf.reshape(theta_coords, [-1, 1])  # batch_size*n_vertices, 1

            thetas_coords_ += k * 2 * np.pi / self.n_rotations
            thetas_coords_ = tf.mod(thetas_coords_, 2 * np.pi)
            rho_coords_ = tf.exp(
                -tf.square(rho_coords_ - mu_rho) / (tf.square(sigma_rho) + eps)
            )
            thetas_coords_ = tf.exp(
                -tf.square(thetas_coords_ - mu_theta) / (tf.square(sigma_theta) + eps)
            )

            gauss_activations = tf.multiply(
                rho_coords_, thetas_coords_
            )  # batch_size*n_vertices, n_gauss
            gauss_activations = tf.reshape(
                gauss_activations, [n_samples, n_vertices, -1]
            )  # batch_size, n_vertices, n_gauss
            gauss_activations = tf.multiply(gauss_activations, mask)
            if mean_gauss_activation:  # compute mean weights for the different Gaussians
                gauss_activations /= (
                    tf.reduce_sum(gauss_activations, 1, keep_dims=True) + eps
                )  # batch_size, n_vertices, n_gauss

            gauss_activations = tf.expand_dims(
                gauss_activations, 2
            )  # batch_size, n_vertices, 1, n_gauss,
            input_feat_ = tf.expand_dims(
                input_feat, 3
            )  # batch_size, n_vertices, n_feat, 1

            gauss_desc = tf.multiply(
                gauss_activations, input_feat_
            )  # batch_size, n_vertices, n_feat, n_gauss,
            gauss_desc = tf.reduce_sum(gauss_desc, 1)  # batch_size, n_feat, n_gauss,
            gauss_desc = tf.reshape(
                gauss_desc, [n_samples, self.n_thetas * self.n_rhos]
            )  # batch_size, n_thetas*n_rhos

            conv_feat = tf.matmul(gauss_desc, W_conv) + b_conv  # batch_size, n_thetas*n_rhos
            all_conv_feat.append(conv_feat)
        all_conv_feat = tf.stack(all_conv_feat)
        conv_feat = tf.reduce_max(all_conv_feat, 0)
        conv_feat = tf.nn.relu(conv_feat)
        return conv_feat

    # Softmax cross entropy
    def compute_data_loss_cross_entropy(self, pos, neg):
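        """Softmax cross entropy between the positive and negative scores."""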
        epsilon = tf.constant(value=0.00001)
        prob = tf.nn.softmax([pos, neg])  # softmax probabilities, not logits
        self.softmax_debug = prob
        cross_entropy = -(tf.log(prob[1] + epsilon) - tf.log(prob[0] + epsilon))
        return cross_entropy

    # Data loss.
    # Negative-pair distances above neg_thresh are ignored.
    def compute_data_loss(self, pos_thresh=0.0, neg_thresh=10):
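        """Hinge-style loss over a batch of 4 * n_patches descriptors.

        The batch is ordered as [pos, binder, neg, neg_2]. Distances between
        (binder, pos) pairs are penalized above pos_thresh; distances between
        (neg, neg_2) pairs are penalized below neg_thresh. The loss is the
        sum of the means and variances of the hinged distances.
        """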
        self.global_desc_pos = tf.gather(self.global_desc, tf.range(0, self.n_patches))
        self.global_desc_binder = tf.gather(
            self.global_desc, tf.range(self.n_patches, 2 * self.n_patches)
        )
        self.global_desc_neg = tf.gather(
            self.global_desc, tf.range(2 * self.n_patches, 3 * self.n_patches)
        )
        self.global_desc_neg_2 = tf.gather(
            self.global_desc, tf.range(3 * self.n_patches, 4 * self.n_patches)
        )

        pos_distances = tf.reduce_sum(
            tf.square(self.global_desc_binder - self.global_desc_pos), 1
        )
        neg_distances = tf.reduce_sum(
            tf.square(self.global_desc_neg - self.global_desc_neg_2), 1
        )
        self.score = tf.concat([pos_distances, neg_distances], axis=0)
        pos_distances = tf.nn.relu(pos_distances - pos_thresh)
        neg_distances = tf.nn.relu(neg_thresh - neg_distances)

        # tf.nn.moments returns (mean, variance).
        pos_mean, pos_var = tf.nn.moments(pos_distances, [0])
        neg_mean, neg_var = tf.nn.moments(neg_distances, [0])
        data_loss = pos_var + neg_var + pos_mean + neg_mean

        return data_loss

    def __init__(
        self,
        max_rho,
        n_thetas=16,
        n_rhos=5,
        n_gamma=1.0,
        learning_rate=1e-3,
        n_rotations=16,
        idx_gpu="/device:GPU:0",
        feat_mask=[1.0, 1.0, 1.0, 1.0, 1.0],
    ):
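        """Build the TF1 graph (placeholders, learnable Gaussian grids, the
        convolutional descriptor layer, the loss, and the Adam optimizer)
        and start a session with all variables initialized."""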

        # Polar grid dimensions; the layer learns n_thetas * n_rhos Gaussians.
        self.max_rho = max_rho
        self.n_thetas = n_thetas
        self.n_rhos = n_rhos

        self.sigma_rho_init = (
            max_rho / 8
        )  # in MoNet was 0.005 with max radius=0.04 (i.e. 8 times smaller)
        self.sigma_theta_init = 1.0  # 0.25
        self.n_rotations = n_rotations
        self.n_feat = int(sum(feat_mask))

        with tf.Graph().as_default() as g:
            self.graph = g
            tf.set_random_seed(0)
            with tf.device(idx_gpu):

                initial_coords = self.compute_initial_coordinates()
                mu_rho_initial = np.expand_dims(initial_coords[:, 0], 0).astype(
                    "float32"
                )
                mu_theta_initial = np.expand_dims(initial_coords[:, 1], 0).astype(
                    "float32"
                )
                self.mu_rho = []
                self.mu_theta = []
                self.sigma_rho = []
                self.sigma_theta = []
                for i in range(self.n_feat):
                    self.mu_rho.append(
                        tf.Variable(mu_rho_initial, name="mu_rho_{}".format(i))
                    )  # 1, n_gauss
                    self.mu_theta.append(
                        tf.Variable(mu_theta_initial, name="mu_theta_{}".format(i))
                    )  # 1, n_gauss
                    self.sigma_rho.append(
                        tf.Variable(
                            np.ones_like(mu_rho_initial) * self.sigma_rho_init,
                            name="sigma_rho_{}".format(i),
                        )
                    )  # 1, n_gauss
                    self.sigma_theta.append(
                        tf.Variable(
                            (np.ones_like(mu_theta_initial) * self.sigma_theta_init),
                            name="sigma_theta_{}".format(i),
                        )
                    )  # 1, n_gauss

                self.keep_prob = tf.placeholder(tf.float32)
                # NOTE: features of the binder patch should be flipped before being fed to the network.
                self.rho_coords = tf.placeholder(
                    tf.float32, shape=[None, None, 1]
                )  # batch_size, n_vertices, 1
                self.theta_coords = tf.placeholder(
                    tf.float32, shape=[None, None, 1]
                )  # batch_size, n_vertices, 1
                self.input_feat = tf.placeholder(
                    tf.float32, shape=[None, None, self.n_feat]
                )  # batch_size, n_vertices, n_feat
                self.mask = tf.placeholder(
                    tf.float32, shape=[None, None, 1]
                )  # batch_size, n_vertices, 1

                self.global_desc = []

                # Initialize b_conv for each feature.
                b_conv = []
                for i in range(self.n_feat):
                    b_conv.append(
                        tf.Variable(
                            tf.zeros([self.n_thetas * self.n_rhos]),
                            name="b_conv_{}".format(i),
                        )
                    )
                # Run the inference layer per feature.
                for i in range(self.n_feat):
                    my_input_feat = tf.expand_dims(self.input_feat[:, :, i], 2)

                    W_conv = tf.get_variable(
                        "W_conv_{}".format(i),
                        shape=[
                            self.n_thetas * self.n_rhos,
                            self.n_thetas * self.n_rhos,
                        ],
                        initializer=tf.contrib.layers.xavier_initializer(),
                    )

                    desc = self.inference(
                        my_input_feat,
                        self.rho_coords,
                        self.theta_coords,
                        self.mask,
                        W_conv,
                        b_conv[i],
                        self.mu_rho[i],
                        self.sigma_rho[i],
                        self.mu_theta[i],
                        self.sigma_theta[i],
                    )  # batch_size, n_gauss*1

                    self.global_desc.append(desc)

                # Stack the per-feature descriptors: batch_size, n_feat, n_thetas*n_rhos.
                self.global_desc = tf.stack(self.global_desc, axis=1)
                self.global_desc = tf.reshape(
                    self.global_desc, [-1, self.n_thetas * self.n_rhos * self.n_feat]
                )

                # Refine global_desc with a FC layer.
                self.global_desc = tf.contrib.layers.fully_connected(
                    self.global_desc,
                    self.n_thetas * self.n_rhos,
                    activation_fn=tf.identity,
                )  # batch_size, n_thetas*n_rhos

                # compute data loss
                self.n_patches = tf.shape(self.global_desc)[0] // 4
                self.data_loss = self.compute_data_loss()

                # definition of the solver
                self.optimizer = tf.train.AdamOptimizer(
                    learning_rate=learning_rate
                ).minimize(self.data_loss)

                self.var_grad = tf.gradients(self.data_loss, tf.trainable_variables())
                # Report any trainable variable that receives no gradient.
                for k in range(len(self.var_grad)):
                    if self.var_grad[k] is None:
                        print(tf.trainable_variables()[k])
                self.norm_grad = self.frobenius_norm(
                    tf.concat(
                        [tf.reshape(g, [-1]) for g in self.var_grad if g is not None], 0
                    )
                )

                # Create a session for running Ops on the Graph.
                config = tf.ConfigProto(allow_soft_placement=True)
                config.gpu_options.allow_growth = True
                self.session = tf.Session(config=config)
                self.saver = tf.train.Saver()

                # Run the Op to initialize the variables.
                init = tf.global_variables_initializer()
                self.session.run(init)
                self.count_number_parameters()
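
# A minimal usage sketch (illustrative only; the variable names, shapes, and
# the max_rho value below are assumptions, not part of the original pipeline):
#
#   model = MaSIF_ppi_search(max_rho=12.0)
#   feed_dict = {
#       model.rho_coords: rho,      # (4 * n_patches, n_vertices, 1)
#       model.theta_coords: theta,  # (4 * n_patches, n_vertices, 1)
#       model.input_feat: feat,     # (4 * n_patches, n_vertices, n_feat)
#       model.mask: mask,           # (4 * n_patches, n_vertices, 1)
#       model.keep_prob: 1.0,
#   }
#   _, loss = model.session.run([model.optimizer, model.data_loss], feed_dict)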