python source code of file

seqr-master
- .github
  - ISSUE_TEMPLATE
    - feature_request.md
    - bug_report.md
- install_dependencies.sh
- servctl
- seqr
  - apps.py
  - utils
    - redis_utils.py
    - redis_utils_2_3_tests.py
    - middleware.py
    - gene_utils.py
    - xpos_utils_2_3_tests.py
    - elasticsearch
      - es_gene_agg_search.py
      - es_search.py
      - constants.py
      - __init__.py
      - utils.py
      - es_utils_2_3_tests.py
    - file_utils.py
    - communication_utils.py
    - __init__.py
    - xpos_utils.py
  - views
    - utils
      - individual_utils.py
      - dataset_utils.py
      - orm_to_json_utils_2_3_tests.py
      - test_utils.py
      - pedigree_image_utils_tests.py
      - pedigree_info_utils_2_3_tests.py
      - export_utils_2_3_tests.py
      - file_utils.py
      - pedigree_info_utils.py
      - pedigree_image_utils.py
      - export_utils.py
      - variant_utils.py
      - json_to_orm_utils.py
      - __init__.py
      - permissions_utils.py
      - orm_to_json_utils.py
      - file_utils_2_3_tests.py
      - json_utils.py
    - apis
      - dataset_api.py
      - dashboard_api.py
      - staff_api.py
      - family_api.py
      - awesomebar_api_2_3_tests.py
      - auth_api.py
      - family_api_2_3_tests.py
      - locus_list_api.py
      - auth_api_2_3_tests.py
      - saved_variant_api_2_3_tests.py
      - dataset_api_2_3_tests.py
      - awesomebar_api.py
      - project_categories_api_2_3_tests.py
      - individual_api.py
      - locus_list_api_2_3_tests.py
      - igv_api.py
      - gene_api_2_3_tests.py
      - variant_search_api_2_3_tests.py
      - project_api_2_3_tests.py
      - gene_api.py
      - case_review_api_2_3_tests.py
      - igv_api_2_3_tests.py
      - analysis_group_api.py
      - users_api.py
      - __init__.py
      - case_review_api.py
      - variant_search_api.py
      - dashboard_api_tests.py
      - saved_variant_api.py
      - users_api_2_3_tests.py
      - project_api.py
      - analysis_group_api_2_3_tests.py
      - individual_api_2_3_tests.py
      - project_categories_api.py
      - staff_api_tests.py
    - react_app.py
    - __init__.py
    - react_app_2_3_tests.py
  - fixtures
    - users.json
    - 1kg_project.json
    - variant_searches.json
    - README.txt
    - variant_tag_types.json
    - new_variant_tag_types.json
    - reference_data.json
  - INSTALL.rst
  - models.py
  - urls.py
  - __init__.py
  - README.md
  - migrations
    - 0002_auto_20191203_1913.py
    - 0011_individual_proband_relationship.py
    - 0009_auto_20200402_2219.py
    - 0006_family_mme_notes.py
    - 0001_squashed_0067_remove_project_custom_reference_populations.py
    - 0010_auto_20200413_2159.py
    - 0007_auto_20200303_1842.py
    - 0005_locuslist_projects.py
    - __init__.py
    - 0003_auto_20191203_1130.py
    - 0004_auto_20200124_1912.py
    - 0012_auto_20200603_1924.py
    - 0008_auto_20200317_1716.py
  - admin.py
  - management
    - commands
      - lift_variant_to_hg38.py
      - check_bam_cram_paths.py
      - add_project_tag.py
      - transfer_families_to_different_project.py
      - resend_welcome_email.py
      - lift_project_to_hg38.py
      - run_settings_backup.py
      - run_postgres_database_backup.py
      - copy_project_tags.py
      - reset_cached_search_results.py
      - __init__.py
      - reload_saved_variant_json.py
    - __init__.py
    - tests
      - lift_project_to_hg38_2_3_tests.py
      - check_bam_cram_paths_2_3_tests.py
      - run_settings_backup_2_3_tests.py
      - reload_saved_variant_json_2_3_tests.py
      - transfer_families_to_different_project_2_3_tests.py
      - run_postgres_database_backup_2_3_tests.py
      - add_project_tag_2_3_tests.py
      - resend_welcome_email_2_3_tests.py
      - copy_project_tags_2_3_tests.py
      - __init__.py
      - lift_variant_to_hg38_2_3_tests.py
      - reset_cached_search_results_tests.py
- wsgi.py
- hail_elasticsearch_pipelines
- .gitmodules
- ui
  - .env
  - Makefile
  - pages
    - Project
      - fixtures.js
      - components
        PageHeader.jsx
        ProjectCollaborators.test.js
        edit-families-and-individuals
        BulkEditForm.jsx
        EditHpoTermsButton.jsx
        EditFamiliesForm.jsx
        EditIndividualsForm.jsx
        EditFamiliesAndIndividualsButton.jsx
        AnalysisGroups.jsx
        AnalysisGroupButtons.jsx
        CaseReview.test.js
        GeneLists.jsx
        CaseReview.jsx
        PageHeader.test.js
        SavedVariants.jsx
        ProjectCollaborators.jsx
        ProjectPageUI.test.js
        FamilyTable
        CaseReviewStatusDropdown.jsx
        EmptyTableRow.jsx
        header
        TableHeaderRow.test.js
        TableHeaderRow.jsx
        SortDirectionToggle.test.js
        SortDirectionToggle.jsx
        CaseReviewStatusDropdown.test.js
        IndividualRow.test.js
        FamilyTable.test.js
        IndividualRow.jsx
        FamilyTable.jsx
        EmptyTableRow.test.js
        AnalysisGroupButtons.test.js
        FamilyPage.test.js
        Matchmaker.test.js
        Matchmaker.jsx
        EditDatasetsButton.jsx
        FamilyPage.jsx
        VariantTags.jsx
        ProjectPageUI.jsx
        ProjectOverview.jsx
        EditDatasetButton.test.js
      - reducers.js
      - selectors.test.js
      - Project.jsx
      - selectors.js
      - constants.js
    - Public
      - MatchmakerInfo.jsx
      - LandingPage.jsx
      - MatchmakerDisclaimer.jsx
    - LocusLists.jsx
    - Login
      - components
        Login.jsx
        SetPassword.test.js
        ForgotPassword.test.js
        ForgotPassword.jsx
        SetPassword.jsx
        UserFormLayout.jsx
        Login.test.js
      - reducers.js
      - selectors.js
    - GeneInfoSearch.jsx
    - Staff
      - Staff.jsx
      - components
        SampleMetadata.jsx
        CustomSearch.jsx
        ElasticsearchStatus.jsx
        DiscoverySheet.jsx
        SeqrStats.jsx
        BaseReport.jsx
        SampleQc.jsx
        SuccessStory.jsx
        SavedVariants.jsx
        Users.jsx
        Matchmaker.jsx
        Anvil.jsx
        CreateUser.jsx
      - reducers.js
      - selectors.js
      - constants.js
    - Search
      - fixtures.js
      - components
        VariantSearchFormContent.jsx
        PageHeader.jsx
        VariantSearchFormContent.test.js
        SavedSearch.jsx
        VariantSearchForm.jsx
        VariantSearchForm.test.js
        SavedSearch.test.js
        PageHeader.test.js
        filters
        CustomInheritanceFilter.test.js
        LocusListSelector.test.js
        CustomInheritanceFilter.jsx
        ProjectFamiliesField.jsx
        LocusListSelector.jsx
        ProjectFamiliesField.test.js
        VariantSearchResults.jsx
        VariantSearchResults.test.js
      - reducers.js
      - selectors.test.js
      - selectors.js
      - VariantSearch.jsx
      - constants.js
    - Dashboard
      - fixtures.js
      - components
        CategoryIndicator.jsx
        ProjectEllipsisMenu.jsx
        EditProjectCategoriesModal.jsx
        FilterSelector.jsx
        ProjectEllipsisMenu.test.js
        CategoryIndicator.test.js
        EditProjectCategoriesModal.test.js
        ProjectsTable.test.js
        ProjectsTable.jsx
        FilterSelector.test.js
        CreateProjectButton.jsx
      - reducers.js
      - selectors.test.js
      - Dashboard.jsx
      - selectors.js
      - constants.js
  - .stylelintrc
  - dist
    - asset-manifest.json
    - hijack
      - hijack-styles.css
    - admin
      - img
        search.svg
        icon-no.svg
        tooltag-arrowright.svg
        gis
        move_vertex_on.svg
        move_vertex_off.svg
        icon-deletelink.svg
        icon-unknown.svg
        calendar-icons.svg
        LICENSE
        README.txt
        sorting-icons.svg
        selector-icons.svg
        icon-calendar.svg
        icon-changelink.svg
        icon-unknown-alt.svg
        icon-clock.svg
        icon-alert.svg
        icon-addlink.svg
        icon-yes.svg
        tooltag-add.svg
        inline-delete.svg
      - fonts
        README.txt
        Roboto-Light-webfont.woff
        Roboto-Bold-webfont.woff
        LICENSE.txt
        Roboto-Regular-webfont.woff
      - js
        popup_response.js
        prepopulate.min.js
        change_form.js
        SelectFilter2.js
        admin
        DateTimeShortcuts.js
        RelatedObjectLookups.js
        timeparse.js
        collapse.js
        core.js
        vendor
        xregexp
        xregexp.min.js
        xregexp.js
        LICENSE-XREGEXP.txt
        jquery
        jquery.min.js
        LICENSE-JQUERY.txt
        prepopulate.js
        prepopulate_init.js
        jquery.init.js
        inlines.min.js
        cancel.js
        inlines.js
        actions.min.js
        urlify.js
        collapse.min.js
        calendar.js
        actions.js
        SelectBox.js
      - css
        forms.css
        login.css
        widgets.css
        base.css
        fonts.css
        changelists.css
        rtl.css
        dashboard.css
    - guardian
      - img
        icon-no.svg
        icon-yes.svg
    - app.html
  - redux
    - rootReducer.js
    - utils
      - configureStore.js
      - reducerFactories.test.js
      - reducerFactories.js
      - modalReducer.js
    - selectors.test.js
    - selectors.js
  - .eslintrc
  - .settings
    - org.eclipse.wst.jsdt.ui.superType.container
    - org.eclipse.wst.jsdt.ui.superType.name
  - config
    - env.js
    - polyfills.js
    - webpackDevServer.config.js
    - paths.js
    - webpack.config.dev.js
    - README.md
    - webpack.config.dev.js~
    - jest
      - cssTransform.js
      - fileTransform.js
    - webpack.config.prod.js
  - semantic.json
  - create_jsx_test.py
  - package.json
  - scripts
    - test.js
    - README.md
    - build.js
    - start.js
  - shared
    - utils
      - sortUtils.test.js
      - stringUtils.js
      - stringUtils.test.js
      - httpRequestHelper.js
      - sortUtils.js
      - localStorage.js
      - constants.js
    - components
      - icons
        StaffOnlyIcon.test.js
        PedigreeIcon.jsx
        PedigreeIcon.test.js
        StaffOnlyIcon.jsx
      - page
        Footer.jsx
        PageHeader.jsx
        __snapshots__
        AwesomeBar.test.js.snap
        Errors.jsx
        AwesomeBar.test.js
        Header.jsx
        BreadCrumbs.test.js
        Header.test.js
        AwesomeBar.jsx
        README
        Footer.test.js
        BaseLayout.jsx
        BreadCrumbs.jsx
        BaseLayout.test.js
      - graph
        IGV.jsx
        HorizontalStackedBar.jsx
        README
        Gtex.jsx
        VariantTagTypeBar.jsx
        HorizontalStackedBar.test.js
      - LocusListLoader.jsx
      - DataLoader.jsx
      - Spacers.jsx
      - Spacers.test.js
      - QueryParamEditor.test.js
      - table
        LocusListTabels.test.js
        TableLoading.jsx
        DataTable.jsx
        DataTable.test.js
        LocusListTables.jsx
      - StyledComponents.jsx
      - form
        Inputs.test.js
        ButtonPanel.jsx
        MessagesPanel.jsx
        EditRecordsForm.jsx
        README
        Inputs.jsx
        XHRUploaderField.jsx
        ReduxFormWrapper.jsx
        RichTextEditor.jsx
      - modal
        README
        Modal.jsx
        Modal.test.js
      - QueryParamEditor.jsx
      - panel
        view-fields
        ListFieldView.test.js
        NullableBoolFieldView.test.js
        BaseFieldView.jsx
        TextFieldView.jsx
        TagFieldView.jsx
        README
        TagFieldView.test.js
        ListFieldView.jsx
        OptionFieldView.jsx
        TextFieldView.test.js
        OptionFieldView.test.js
        SingleFieldView.jsx
        NullableBoolFieldView.jsx
        MatchmakerPanel.jsx
        search
        FrequencyFilter.test.js
        FrequencyFilter.jsx
        VariantSearchResults.jsx
        VariantSearchFormPanels.jsx
        VariantSearchFormContainer.jsx
        ProjectsField.jsx
        VariantSearchResults.test.js
        GeneBreakdown.test.js
        GeneBreakdown.jsx
        constants.js
        fixtures.js
        sample.jsx
        RequestStatus.jsx
        README
        MatchmakerPanel.test.js
        genes
        LocusListDetail.jsx
        GeneDetail.test.js
        LocusListDetail.test.js
        GeneDetail.jsx
        HpoPanel.test.js
        variants
        Annotations.jsx
        Annotations.test.js
        Predictions.test.js
        Transcripts.jsx
        VariantIndividuals.test.js
        Variants.test.js
        VariantGene.test.js
        SavedVariants.test.js
        Pathogenicity.jsx
        Frequencies.jsx
        FamilyVariantReads.jsx
        FamilyVariantReads.test.js
        FamilyVariantTags.jsx
        SavedVariants.jsx
        Predictions.jsx
        VariantGene.jsx
        FamilyVariantTags.test.js
        Pathogenicity.test.js
        Variants.jsx
        Transcripts.test.js
        VariantIndividuals.jsx
        Frequencies.test.js
        RequestStatus.test.js
        family.test.js
        view-pedigree-image
        PedigreeImagePanel.test.js
        README
        PedigreeImagePanel.jsx
        HpoPanel.jsx
        family.jsx
      - buttons
        FamilyLink.jsx
        UpdateButton.test.js
        EditProjectButton.jsx
        ExportTableButton.test.js
        CreateVariantButton.jsx
        ShowGeneModal.test.js
        DeleteButton.test.js
        ShowReadsButton.test.js
        DispatchRequestButton.jsx
        DeleteButton.jsx
        LocusListButtons.jsx
        LocusListButtons.test.js
        ExportTableButton.jsx
        UpdateButton.jsx
        ShowReadsButton.jsx
        CreateVariantsButton.test.js
        ShowGeneModal.jsx
        DispatchRequestButton.test.js
        SearchResultsLink.jsx
      - PopupWithModal.jsx
    - global.css
  - app.html
  - .project
  - install_npm_packages.sh
  - app.jsx
- manage.py
- deploy
  - MIGRATE.md
  - LOCAL_INSTALL.md
  - READVIZ_SETUP.md
  - servctl_utils
    - other_command_utils.py
    - deploy_command_utils.py
    - shell_utils.py
    - __init__.py
  - docker
    - seqr
      - entrypoint.sh
      - bashrc
      - readiness_probe
      - gitconfig
      - config
        gunicorn_config.py
      - bin
        start_server.sh
        stop_server.sh
        restart_server.sh
      - Dockerfile
    - redis
      - bashrc
      - Dockerfile
      - redis.conf
    - elasticsearch
      - entrypoint.sh
      - elasticsearch.yml
      - Dockerfile
    - kibana
      - entrypoint.sh
      - kibana.yml
      - Dockerfile
    - postgres
      - bashrc
      - postgresql.conf
      - restore_database_backup.sh
      - Dockerfile
    - pipeline-runner
      - entrypoint.sh
      - bashrc
      - spark-defaults.conf
      - vep-GRCh37.json
      - gitconfig
      - Dockerfile
      - vep-GRCh38.json
  - __init__.py
  - kubernetes
    - gcloud-prod-es-settings.yaml
    - nginx
      - nginx.yaml
    - seqr
      - seqr.gcloud.yaml
    - redis
      - redis.gcloud.yaml
    - elasticsearch
      - ssd-storage-class.yaml
      - elasticsearch.gcloud.yaml
      - es-persistent-volume.yaml
    - kibana
      - kibana.gcloud.yaml
    - postgres
      - postgres.gcloud.yaml
    - gcloud-dev-settings.yaml
    - shared-settings.yaml
    - external-connectors
      - external-elasticsearch.yaml
    - pipeline-runner
      - pipeline-runner.gcloud.yaml
    - namespace.yaml
    - gcloud-prod-settings.yaml
  - secrets
    - gcloud
      - .gitignore
    - shared
      - gcloud
        service-account-key.json
        README.md
        boto
- requirements-dev.txt
- .travis.yml
- README.md
- settings.py
- requirements.txt
- settings
- matchmaker
  - apps.py
  - views
    - external_api_2_3_tests.py
    - external_api.py
    - __init__.py
    - matchmaker_api.py
    - matchmaker_api_2_3_tests.py
  - models.py
  - __init__.py
  - migrations
    - 0001_initial.py
    - __init__.py
  - matchmaker_utils.py
  - management
    - commands
      - __init__.py
    - __init__.py
- .gitignore
- LICENSE.txt
- collect_static.sh
- docker-compose.yml
- reference_data
  - apps.py
  - models.py
  - __init__.py
  - migrations
    - 0004_auto_20170626_1401.py
    - 0005_auto_20170627_0318.py
    - 0017_auto_20190909_2102.py
    - 0012_auto_20190321_1656.py
    - 0010_auto_20190319_1518.py
    - 0001_initial.py
    - 0008_geneexpression.py
    - 0016_dbnsfpgene_gene_names.py
    - 0006_auto_20170630_1754.py
    - 0002_auto_20170319_0332.py
    - 0009_auto_20180917_2015.py
    - 0013_auto_20190404_1953.py
    - 0003_clinvar.py
    - 0007_auto_20180809_2053.py
    - __init__.py
    - 0011_primateai.py
    - 0014_auto_20190510_2150.py
    - 0015_auto_20190625_1813.py
  - admin.py
  - management
    - commands
      - update_gene_constraint.py
      - utils
        gene_utils.py
        update_utils.py
        __init__.py
        download_utils_2_3_tests.py
        download_utils.py
      - update_all_reference_data.py
      - update_mgi.py
      - update_human_phenotype_ontology.py
      - __init__.py
      - run_reference_data_database_backup.py
      - update_primate_ai.py
      - update_omim.py
      - update_gencode.py
      - update_dbnsfp_gene.py
    - __init__.py
    - tests
      - run_reference_data_database_backup_2_3_tests.py
      - update_gene_constraint_2_3_tests.py
      - update_primate_ai_2_3_tests.py
      - update_all_reference_data_2_3_tests.py
      - update_gencode_2_3_tests.py
      - update_omim_2_3_tests.py
      - __init__.py
      - update_dbnsfp_gene_2_3_tests.py
      - update_hpo_2_3_tests.py
      - update_mgi_2_3_tests.py

from __future__ import unicode_literals
from builtins import str

from io import TextIOWrapper

import csv
import gzip
import hashlib
import json
import logging
import os
import tempfile
import openpyxl as xl

from django.contrib.auth.decorators import login_required
from django.views.decorators.csrf import csrf_exempt

from settings import API_LOGIN_REQUIRED_URL
from seqr.views.utils.json_utils import create_json_response

logger = logging.getLogger(__name__)


@login_required(login_url=API_LOGIN_REQUIRED_URL)
@csrf_exempt
def save_temp_file(request):
    """Parse and cache the file uploaded in the request.

    Responds with the id of the cached upload plus either the parsed records (when the
    `parsedData` query parameter is set) or a one-line summary. Any exception raised while
    saving the upload is reported as a 400 response carrying the error message.
    """
    try:
        file_id, uploaded_name, records = save_uploaded_file(request)
    except Exception as error:
        return create_json_response({'errors': [str(error)]}, status=400)

    payload = {'uploadedFileId': file_id}
    if not request.GET.get('parsedData'):
        summary = 'Parsed {num_rows} rows from {filename}'.format(num_rows=len(records), filename=uploaded_name)
        payload['info'] = [summary]
    else:
        payload['parsedData'] = records

    return create_json_response(payload)


def _trim_and_pad_rows(rows):
    """Drop trailing blank rows and give every remaining row the same number of columns.

    A row is blank when none of its values is truthy. Blank rows that sit between populated
    rows are kept (as rows of empty strings). Returns an empty list if every row is blank.
    """
    # index of the last populated cell in each row, or -1 for a blank row
    last_value_indices = []
    for row in rows:
        populated = [i for i, val in enumerate(row) if val]
        last_value_indices.append(populated[-1] if populated else -1)

    # trim trailing empty rows
    while last_value_indices and last_value_indices[-1] < 0:
        last_value_indices.pop()
    if not last_value_indices:
        return []

    # all rows should have same column count
    num_cols = max(last_value_indices) + 1
    padding = [''] * num_cols
    return [(list(row) + padding)[:num_cols] for row in rows[:len(last_value_indices)]]


def parse_file(filename, stream):
    """Parse the contents of `stream` according to the extension of `filename`.

    Args:
        filename: name of the file; only its extension is inspected.
        stream: text stream for .tsv/.fam/.ped/.csv/.json files, or a file-like object
            that openpyxl can load for .xls/.xlsx files.

    Returns:
        A list of rows (each a list of cell values) for tabular files, or the decoded
        JSON value for .json files.

    Raises:
        ValueError: if the extension is not supported, or if the first sheet of an Excel
            workbook contains no values.
    """
    if filename.endswith(('.tsv', '.fam', '.ped')):
        return [[s.strip().strip('"') for s in line.rstrip('\n').split('\t')] for line in stream]

    elif filename.endswith('.csv'):
        return list(csv.reader(stream))

    elif filename.endswith(('.xls', '.xlsx')):
        # NOTE(review): openpyxl documents support for the .xlsx family of formats -
        # confirm that legacy .xls uploads actually load
        wb = xl.load_workbook(stream, read_only=True)
        ws = wb[wb.sheetnames[0]]
        rows = [[_parse_excel_string_cell(cell) for cell in row] for row in ws.iter_rows()]
        # Blank rows in the middle of the sheet must not break the width computation
        rows = _trim_and_pad_rows(rows)
        if not rows:
            raise ValueError("No data found in file: {}".format(filename))

        return rows

    elif filename.endswith('.json'):
        return json.loads(stream.read())

    raise ValueError("Unexpected file type: {}".format(filename))


def _parse_excel_string_cell(cell):
    """Return the value of an Excel cell, rendering whole numbers as digit-only strings.

    Missing or otherwise falsy values become the empty string; numeric cells holding an
    integral value are formatted without a decimal part; anything else is returned as is.
    """
    value = cell.value
    if value is None:
        return ''
    if cell.data_type == 'n' and int(value) == value:
        return '{:.0f}'.format(value)
    return value or ''


def _compute_serialized_file_path(uploaded_file_id):
    """Compute local file path, and make sure the directory exists

    Args:
        uploaded_file_id: identifier embedded in the file name.

    Returns:
        Path of the gzipped json file for this upload inside the `temp_uploads`
        sub-directory of the system temp directory.

    Raises:
        OSError: if the upload directory does not exist and cannot be created.
    """

    upload_directory = os.path.join(tempfile.gettempdir(), 'temp_uploads')
    if not os.path.isdir(upload_directory):
        logger.info("Creating directory: " + upload_directory)
        try:
            os.makedirs(upload_directory)
        except OSError:
            # Another request may have created the directory between the check above and
            # the makedirs call - only fail if the directory is still missing
            if not os.path.isdir(upload_directory):
                raise

    return os.path.join(upload_directory, "temp_upload_{}.json.gz".format(uploaded_file_id))


def save_uploaded_file(request, process_records=None):
    """Parse the single file uploaded with `request` and cache the parsed records on disk.

    Args:
        request: request whose `FILES` mapping holds exactly one uploaded file.
        process_records: optional callable invoked as
            `process_records(json_records, filename=filename)`; its return value replaces
            the parsed records before they are hashed and saved.

    Returns:
        Tuple of (uploaded_file_id, filename, json_records), where uploaded_file_id is the
        md5 hex digest of the string form of the records and names the cached file.

    Raises:
        ValueError: if the request does not contain exactly one file, or if the file
            cannot be parsed (see `parse_file`).
    """

    if len(request.FILES) != 1:
        raise ValueError("Received %s files instead of 1" % len(request.FILES))

    # parse file
    stream = next(iter(request.FILES.values()))
    filename = stream._name

    if not filename.endswith(('.xls', '.xlsx')):
        # Excel workbooks are read as binary; everything else is decoded as text.
        # 'utf-8-sig' skips an optional leading byte-order mark, so it does not end up
        # in the first cell or break json parsing; files without one decode as plain utf-8
        stream = TextIOWrapper(stream.file, encoding='utf-8-sig')

    json_records = parse_file(filename, stream)
    if process_records:
        json_records = process_records(json_records, filename=filename)

    # save json to temporary file
    uploaded_file_id = hashlib.md5(str(json_records).encode('utf-8')).hexdigest()
    serialized_file_path = _compute_serialized_file_path(uploaded_file_id)
    with gzip.open(serialized_file_path, "wt") as f:
        json.dump(json_records, f)

    return uploaded_file_id, filename, json_records


def load_uploaded_file(upload_file_id):
    """Read back the records cached for the given upload id, then delete the cached file"""
    cached_path = _compute_serialized_file_path(upload_file_id)
    with gzip.open(cached_path, "rt") as gz_file:
        records = json.loads(gz_file.read())

    # the cached file is single-use: it is removed once it has been read successfully
    os.remove(cached_path)
    return records