Python source code of hmmer.py (ssbio/databases/hmmer.py)

ssbio-master
- LICENSE
- README.rst
- setup.py
- Binder.ipynb
- ssbio
  - viz
    - nglview.py
    - color.py
    - __init__.py
  - test
    - test_utils.py
    - test_protein_sequence_utils_fasta.py
    - test_protein_sequence_utils_alignment.py
    - test_protein_seqprop.py
    - test_protein_structure_utils_cleanpdb.py
    - test_files
      - structures
        1UPI.pdb
        1ecp.header.pdb
        1cbn.pdb
        1cbn_clean_tester.pdb
        3bwm.pdb
        DEOD_ECOLI_model1.pdb
        P9WG73
        P9WG73sim_2M
        comb8CA.dat
        rep1.tra6M.bz2
        rep1.tra3M.bz2
        out2M
        combo1.pdb
        out6M
        wdPPAS_P9WG73
        P9WG73sim_1A
        model1.pdb
        rep1.tra5M.bz2
        rep3.tra3A.bz2
        out10M
        rep3.tra7M.bz2
        in4M.dd
        in6M.dd
        rep4.tra3A.bz2
        rep8.tra1A.bz2
        rep7.tra4A.bz2
        rep6.tra4A.bz2
        comb.dat
        closc2.pdb
        rep8.tra2A.bz2
        P9WG73sim_1M
        rep4.tra1A.bz2
        seq.ss
        model2.pdb
        P9WG73.faa
        seq.txt
        out4A
        rep2.tra8M.bz2
        dist.dat
        rep2.tra2M.bz2
        P9WG73sim_9M
        rep8.tra3A.bz2
        rep1.tra1M.bz2
        rep3.tra4M.bz2
        rep2.tra7M.bz2
        in9M.dd
        out9M
        rep2.tra3M.bz2
        rep1.tra4M.bz2
        rep8.tra4A.bz2
        in3M.dd
        rep2.tra10M.bz2
        rep7.tra1A.bz2
        rep7.tra2A.bz2
        rep2.tra5M.bz2
        rep3.tra8M.bz2
        rep2.tra1A.bz2
        rep2.tra9M.bz2
        rep5.tra1A.bz2
        P9WG73sim_4M
        rep3.tra1M.bz2
        P9WG73sim_3M
        rep5.tra4A.bz2
        combo3.pdb
        wMUSTER_P9WG73
        out4M
        P9WG73sim_5M
        rep3.tra1A.bz2
        rep3.tra9M.bz2
        dPPAS_P9WG73
        rep1.tra4A.bz2
        P9WG73sim_3A
        psitmp.chk
        in7M.dd
        rep5.tra3A.bz2
        out3A
        out8M
        PPAS_P9WG73
        rep5.tra2A.bz2
        rep2.tra6M.bz2
        closc1.pdb
        pssm.txt
        combCA.dat
        rep3.tra6M.bz2
        in8M.dd
        rep1.tra2A.bz2
        seq.dat
        rep6.tra3A.bz2
        rep2.tra4A.bz2
        rep3.tra2A.bz2
        rep6.tra2A.bz2
        rep1.tra7M.bz2
        out1M
        rep3.tra5M.bz2
        wPPAS_P9WG73
        rst.dat
        in2M.dd
        P9WG73sim_10M
        exp.dat
        rep2.tra4M.bz2
        rep4.tra4A.bz2
        Env-PPAS_P9WG73
        rep7.tra3A.bz2
        seq.fasta
        rmsinp
        out2A
        mtx
        rep2.tra2A.bz2
        rep1.tra2M.bz2
        rep4.tra2A.bz2
        P9WG73sim_6M
        rep6.tra1A.bz2
        in3A.dd
        rep1.tra9M.bz2
        rep1.tra1A.bz2
        dPPAS2_P9WG73
        combo2.pdb
        MUSTER_P9WG73
        P9WG73sim_7M
        out3M
        ncaco.pdb
        closc3.pdb
        P9WG73sim_2A
        rep1.tra8M.bz2
        in5M.dd
        rep2.tra1M.bz2
        rep3.tra4A.bz2
        in2A.dd
        model3.pdb
        out1A
        fulinit.pdb
        P9WG73sim_8M
        P9WG73sim_4A
        in10M.dd
        in1A.dd
        rep1.tra3A.bz2
        cscore
        rep1.tra10M.bz2
        out5M
        in4A.dd
        in1M.dd
        tra.in
        lscore.txt
        out7M
        rep2.tra3A.bz2
        E04142.pdb
      - models
        Ec_core_flux1.xml
        mini.json
      - scratch
        test.ss8
        test.ss
        test.fasta
        test.acc20
        test.acc
      - sequences
        X5D299-1.faa
        P0ABP8.xml
        P08559.fasta
        TESTER.faa
        P0ABP8.gff
        eco-b4384.faa
        mtu-Rv0417.kegg
        eco-b4384.kegg
        P9WGE7.fasta
        P9WGE7_1gn3_A_align.txt
        P0ABP8.fasta
        P08559.xml
        P21964.xml
        P0ABP8.txt
        1gn3_A.faa
        P21964.fasta
        Rv0973c_Rv0973c_1126684.4.needle
        mtu-Rv0417.faa
    - test_core_genepro.py
    - test_protein_structure_utils_mutatepdb.py
    - test_databases_uniprot.py
    - test_protein_sequence_properties_scratch.py
    - test_pipeline_atlas.py
    - __init__.py
    - test_pipeline_gempro.py
    - test_databases_kegg.py
    - test_protein_sequence_properties_thermostability.py
    - test_protein_structure_properties_fatcat.py
    - test_core_protein.py
    - test_databases_pdb.py
    - test_databases_bigg.py
    - conftest.py
    - test_core_object.py
    - test_protein_structure_homology_itasserparse.py
  - protein
    - structure
      - utils
        foldx.py
        tleap.py
        cleanpdb.py
        dock.py
        structureio.py
        __init__.py
        README.md
        mutatepdb.py
      - properties
        residues.py
        freesasa.py
        opm.py
        fatcat.py
        stride.py
        quality.py
        __init__.py
        msms.py
        dssp.py
      - homology
        itasser
        itasserprep.py
        itasserprop.py
        __init__.py
        __init__.py
      - __init__.py
      - chainprop.py
      - structprop.py
    - sequence
      - utils
        alignment.py
        fasta.py
        blast.py
        __init__.py
        utils.py
      - properties
        cctop.py
        residues.py
        thermostability.py
        tmhmm.py
        kinetic_folding_rate.py
        __init__.py
        aggregation_propensity.py
        scratch.py
      - seqprop.py
      - __init__.py
    - __init__.py
  - io
    - validation.py
    - __init__.py
  - __init__.py
  - utils.py
  - complex
    - bioassembly.py
    - __init__.py
    - oligomer.py
  - biopython
    - bp_mmcif2dict.py
    - Bio
      - Struct
        protein_residues.py
        Hydrogenate.py
        Geometry.py
        cpv.py
        Protein.py
        WWW
        WHATIFXML.py
        __init__.py
        WHATIF.py
        __init__.py
        CG_Models.py
        bond_amber.py
    - bp_mmcifparser.py
    - __init__.py
  - core
    - complex.py
    - genepro.py
    - modelpro.py
    - object.py
    - __init__.py
    - protein.py
  - pipeline
    - gempro.py
    - atlas2.py
    - atlas.py
    - __init__.py
    - atlas3.py
  - databases
    - patric.py
    - hmmer.py
    - kegg.py
    - swissmodel.py
    - pdb_seq.py
    - ncbi.py
    - pdbflex.py
    - pisa.py
    - uniprot.py
    - __init__.py
    - bigg.py
    - metalpdb.py
    - pdb.py
- requirements.txt
- .gitignore
- docs
  - Makefile
  - make.bat
  - software.rst
  - protein.rst
  - tutorials.ipynb
  - gempro.rst
  - structure.rst
  - getting_started.rst
  - instructions
    - msms.rst
    - scratch.rst
    - emboss.rst
    - dssp.rst
    - freesasa.rst
    - dummies.rst
    - stride.rst
    - fatcat.rst
    - foldrate.rst
    - opm.rst
    - tmhmm.rst
    - amylpred.rst
    - itasser.rst
  - notebooks
    - Protein - Structure Mapping, Alignments, and Visualization.ipynb
    - SeqProp - Protein Sequence Properties.ipynb
    - FATCAT - Structure Similarity.ipynb
    - GEM-PRO - Calculating Protein Properties.ipynb
    - SWISS-MODEL - Downloading homology models.ipynb
    - Software Installation Tester.ipynb
    - I-TASSER and TMHMM Install Guide.ipynb
    - GEM-PRO - Genes & Sequences.ipynb
    - Complex - Testing (undergrads).ipynb
    - GEM-PRO - List of Gene IDs.ipynb
    - GEM-PRO - SBML Model.ipynb
    - PDBProp - Working With a Single PDB Structure.ipynb
  - sequence.rst
  - requirements.txt
  - index.rst
  - conf.py
  - _templates
    - layout.html
    - instructions.rst
  - _static
    - theme_overrides.css
  - assets
  - python_api.rst
- binder
  - postBuild
  - apt.txt
  - requirements.txt
- MANIFEST.in

import urllib.parse as urllib
import urllib.request as urllib2
from urllib.request import urlopen, Request
from urllib.error import URLError
import json

import os.path as op


def manual_get_pfam_annotations(seq, outpath, searchtype='phmmer', force_rerun=False):
    """Run a search on the EBI HMMER web tool and return its hits, caching the response on disk.

    If ``outpath`` already exists (and ``force_rerun`` is False) the cached response is
    loaded instead of contacting the server. Otherwise the sequence is POSTed to the
    HMMER search endpoint, the JSON output of the resulting job is downloaded, saved to
    ``outpath`` and parsed.

    Args:
        seq (str): Sequence to search with. It is submitted in FASTA form with the
            header ``>Seq`` prepended.
        outpath (str): Path of the cache file to read the response from / write it to.
        searchtype (str): ``'phmmer'`` (submitted with ``seqdb=pdb``) or ``'hmmscan'``
            (submitted with ``hmmdb=pfam``).
        force_rerun (bool): If True, ignore an existing file at ``outpath``, query the
            server again and overwrite the file.

    Returns:
        The value stored under ``['results']['hits']`` of the decoded JSON response.

    Raises:
        ValueError: If a request is needed and ``searchtype`` is not one of the
            supported search types.

    Todo:
        * Test against the live service.

    """
    if op.exists(outpath) and not force_rerun:
        with open(outpath, 'r') as f:
            cached = json.load(f)
        # The cache is written below as a JSON-encoded *string* holding the raw response
        # text, so it normally needs a second decode. A file that already contains the
        # plain JSON document is accepted as well.
        json_results = json.loads(cached) if isinstance(cached, str) else cached

    else:
        # Database parameter sent along with the sequence for each supported search type
        search_databases = {
            'phmmer': {'seqdb': 'pdb'},
            'hmmscan': {'hmmdb': 'pfam'},
        }
        if searchtype not in search_databases:
            raise ValueError("Unsupported searchtype {!r}; expected one of {}".format(
                searchtype, sorted(search_databases)))

        parameters = dict(search_databases[searchtype], seq='>Seq\n' + seq)
        enc_params = urllib.urlencode(parameters).encode('utf-8')
        request = urllib2.Request('http://www.ebi.ac.uk/Tools/hmmer/search/{}'.format(searchtype), enc_params)

        # Submitting the search redirects to the results page of the job; the final URL
        # is reused to request the same results as JSON.
        with urllib2.urlopen(request) as submit_response:
            results_url = str(submit_response.geturl() + '?output=json')

        with urlopen(results_url) as results_response:
            request_read = results_response.read().decode("utf-8")

        # Kept as a JSON-encoded string so previously written cache files and this one
        # share the same on-disk format.
        with open(outpath, 'w') as f:
            json.dump(request_read, f)

        json_results = json.loads(request_read)

    return json_results['results']['hits']