Python source code of __init__.py

Project: listenbrainz-server (GitHub Link)

listenbrainz-server-master
- set_rate_limits.py
- .github
  - PULL_REQUEST_TEMPLATE.md
  - CONTRIBUTING.md
  - release-drafter.yml
  - CODE_OF_CONDUCT.md
- HACKING.md
- jest.config.js
- spark_manage.py
- listenbrainz_spark
  - config.py.sample
  - hdfs_connection.py
  - query_map.py
  - exceptions.py
  - path.py
  - testdata
    - user_listening_activity.json
    - user_listening_activity_all_time.json
    - user_top_releases.json
    - user_top_recordings.json
    - user_top_releases_empty.json
    - user_top_artists.json
  - schema.py
  - ftp
    - download.py
    - __init__.py
    - tests
      - test_init.py
      - __init__.py
      - test_download.py
  - hdfs
    - upload.py
    - __init__.py
    - tests
      - test_upload.py
      - test_init.py
      - __init__.py
  - constants.py
  - mlhd
    - setup
      - hdfs_upload.py
      - __init__.py
    - schema.py
    - __init__.py
    - README.md
    - scripts
      - artist_popularity.py
      - __init__.py
  - __init__.py
  - README.md
  - utils.py
  - tests
    - test_utils.py
    - __init__.py
  - stats
    - user
      - release.py
      - entity.py
      - listening_activity.py
      - artist.py
      - recording.py
      - __init__.py
      - utils.py
      - tests
        test_utils.py
        test_release.py
        test_artist.py
        test_listening_activity.py
        test_recording.py
        test_entity.py
    - __init__.py
    - tests
      - test_init.py
      - __init__.py
  - recommendations
    - recommend.py
    - create_dataframes.py
    - templates
      - candidate.html
      - index.html
      - model.html
    - train_models.py
    - __init__.py
    - README.md
    - utils.py
    - tests
      - test_candidate.py
      - test_models.py
      - test_recommend.py
      - __init__.py
      - test_dataframe.py
    - candidate_sets.py
  - request_consumer
    - request_consumer.py
    - jobs
      - import_dump.py
      - __init__.py
      - tests
        test_import_dump.py
        __init__.py
    - test_request_consumer.py
- pytest.msb.ini
- queries.md
- relations
  - config.py.sample
  - test.sh
  - README.md
  - utils.py
  - write_artist_relations.py
  - tests
    - test_artist_relations.py
  - create_artist_relations.py
  - requirements.txt
  - create_artist_credit_relations.py
  - get_relations.py
  - data_dump_files
    - README
    - README_data_dump_files.md
- admin
  - sql
    - create_indexes.sql
    - create_types.sql
    - create_db.sql
    - create_schema.sql
    - drop_tables.sql
    - create_tables.sql
    - create_extensions.sql
    - util
      - restart_spotify_imports.sql
    - drop_db.sql
    - create_primary_keys.sql
    - create_foreign_keys.sql
    - drop_schema.sql
    - create_test_db.sql
    - updates
      - 2019-02-26-add-follow-list.sql
      - 2018-05-09-add-on-delete-cascade-to-user-foreign-keys.sql
      - 2018-06-22-spotify-listen-importer.sql
      - 2020-05-20-change-lovehate-to-feedback.sql
      - 2018-06-13-add-musicbrainz-row-id-column.sql
      - 2017-06-05-add-last-login.sql
      - 2019-02-08-save-spotify-permissions.sql
      - 2019-07-09-add-recommendation-table.sql
      - 2020-05-16-rename-recommendation-table-col.sql
      - 2018-05-22-add-gdpr-user-columns.sql
      - 2017-06-23-add-latest-import.sql
      - 2017-07-03-alter-last-login.sql
      - 2020-05-20-truncate-user-stats-table.sql
      - 2017-08-03-make-stats-updated-not-null.sql
      - 2020-05-20-drop-recommendation-cf-recording-col.sql
      - 2019-01-04-add-user-login-id.sql
      - 2018-11-17-add-on-delete-cascade-to-spotify-fk.sql
      - 2019-02-13-change-login-id-type.sql
      - 2017-09-03-make-column-names-singular.sql
      - 2018-06-21-make-musicbrainz-row-id-not-null.sql
      - 2017-10-14-add-incremental-dump-table.sql
      - 2017-07-28-add-stats-tables.sql
      - 2017-10-15-remove-listen-tables.sql
      - 2020-05-20-change-recommendation-cf-recording-col-type.sql
      - 2020-06-17-add-listening-activity-col.sql
    - drop_test_db.sql
  - bigquery
    - listen-schema.json
  - config.sh.ctmpl
  - messybrainz
    - sql
      - create_indexes.sql
      - create_db.sql
      - create_functions.sql
      - drop_tables.sql
      - create_tables.sql
      - create_extensions.sql
      - drop_db.sql
      - create_primary_keys.sql
      - create_foreign_keys.sql
      - create_test_db.sql
      - updates
        2018-06-25-create-recording-release-join-table.sql
        2018-07-05-alter-recording-artist-join.sql
        2018-05-29-create-table-to-store-artist-mbids.sql
        2019-06-13-migrate-to-jsonb.sql
        2018-06-12-create-and-modify-indexes-and-constraints.sql
        2018-06-26-alter-table-artist-credit-redirect.sql
      - drop_test_db.sql
  - config.sh.sample
  - config
    - listenbrainz.ini.uwsgi
    - listenbrainz.nginx
  - rsync-dump-files.sh
  - functions.sh
  - create-dumps.sh
- bigquery-credentials.json.ctmpl
- develop.sh
- Dockerfile.nginx.prod
- test.sh
- LICENSE
- messybrainz
  - db
    - testing.py
    - data.py
    - exceptions.py
    - release.py
    - artist.py
    - recording.py
    - common.py
    - __init__.py
    - tests
      - test_release.py
      - test_artist.py
      - test_data.py
      - test_recording.py
      - __init__.py
  - webserver
    - testing.py
    - decorators.py
    - views
      - index.py
      - test
        test_index.py
        __init__.py
        test_api.py
      - api.py
      - __init__.py
    - test
      - test_utils.py
      - __init__.py
    - templates
      - macros.html
      - index
        home.html
      - base.html
      - errors
        base.html
        404.html
        503.html
        403.html
        400.html
        500.html
    - external
      - __init__.py
      - musicbrainz.py
    - flash.py
    - __init__.py
    - utils.py
    - errors.py
    - static
      - img
        musicbrainz.svg
        logo_big.svg
        acousticbrainz_logo.svg
        metabrainz.svg
        listenbrainz_logo.svg
      - fonts
        glyphicons-halflings-regular.woff
        glyphicons-halflings-regular.eot
        glyphicons-halflings-regular.woff2
        glyphicons-halflings-regular.ttf
        glyphicons-halflings-regular.svg
      - js
        lib
        less.min.js
      - css
        main.less
        theme
        links.less
        boostrap
        responsive-embed.less
        pagination.less
        labels.less
        normalize.less
        navbar.less
        wells.less
        glyphicons.less
        navs.less
        pager.less
        scaffolding.less
        close.less
        panels.less
        input-groups.less
        list-group.less
        media.less
        alerts.less
        forms.less
        button-groups.less
        jumbotron.less
        carousel.less
        responsive-utilities.less
        component-animations.less
        modals.less
        utilities.less
        breadcrumbs.less
        thumbnails.less
        theme.less
        badges.less
        type.less
        progress-bars.less
        tables.less
        code.less
        popovers.less
        dropdowns.less
        boostrap.less
        mixins.less
        grid.less
        tooltip.less
        mixins
        opacity.less
        nav-vertical-align.less
        pagination.less
        labels.less
        image.less
        vendor-prefixes.less
        border-radius.less
        text-emphasis.less
        hide-text.less
        panels.less
        tab-focus.less
        list-group.less
        responsive-visibility.less
        table-row.less
        alerts.less
        forms.less
        reset-filter.less
        gradients.less
        nav-divider.less
        reset-text.less
        text-overflow.less
        clearfix.less
        progress-bar.less
        center-block.less
        grid.less
        resize.less
        grid-framework.less
        size.less
        background-variant.less
        buttons.less
        variables.less
        print.less
        buttons.less
        theme.less
        variables.less
        navbars.less
        buttons.less
        .gitignore
  - testdata
    - data_for_creating_recording_cluster.json
    - recordings_for_clustering_using_fetched_artist_mbids.json
    - recordings_for_testing_artist_clusters.json
    - valid_recordings_with_recording_mbids.json
    - recordings_for_fetch_releases.json
    - recordings_for_release_clusters.json
  - default_config.py
  - test_config.py
  - __init__.py
  - README.md
  - custom_config.py.sample
- manage.py
- config.sh.sample
- requirements_development.txt
- .gitattributes
- run.sh
- webpack.config.js
- msb-develop.sh
- read.py
- babel.config.js
- msb_manage.py
- docker
  - create-cluster.py
  - nginx_custom
    - nginx.conf
    - Dockerfile
  - start-request-consumer-container.sh
  - push-master.sh
  - push-jobs-image.sh
  - push-request-consumer.sh
  - Dockerfile.test
  - stop-request-consumer-container.sh
  - readme.txt
  - push-worker.sh
  - messybrainz
    - push.sh
    - prod
      - uwsgi
        uwsgi.service
  - docker-compose.integration.yml
  - stop-master-service.sh
  - jenkins-test.sh
  - push.sh
  - tunnel
    - ssh_config
    - README.md
    - Dockerfile
    - build.sh
  - setup-worker-node.sh
  - docker-compose.test.yml
  - consul-template.conf
  - stats-crontab
  - apache-download.sh
  - common.yml
  - setup-master-node.sh
  - docker-compose.spark.yml
  - docker-compose.jenkins.yml
  - start-worker-service.sh
  - dump-crontab
  - rc.local
  - start-master-service.sh
  - prod
    - nginx
      - nginx.conf
    - uwsgi
      - uwsgi-api-compat.ini
      - uwsgi.ini
      - uwsgi.service
  - docker-compose.spark.test.yml
  - Dockerfile.webpack
  - beta
    - uwsgi
      - uwsgi.ini
      - uwsgi.service
  - stop-worker-service.sh
  - docker-compose.yml
- enzyme.config.ts
- data
  - __init__.py
  - model
    - user_release_stat.py
    - user_entity.py
    - user_artist_stat.py
    - __init__.py
    - user_listening_activity.py
    - user_recording_stat.py
- SCRIPTS.md
- .pep8speaks.yml
- .travis.yml
- README.md
- consul_config.py.ctmpl
- package.json
- requirements_spark.txt
- pytest.ini
- Dockerfile.spark
- requirements.txt
- pytest.spark.ini
- lint.sh
- Dockerfile
- .eslintrc.js
- tsconfig.json
- .gitignore
- docs
  - Makefile
  - favicon.ico
  - dev
    - api-usage.rst
    - develop-sh.rst
    - faqs.rst
    - clients.rst
    - images
    - api-compat.rst
    - feedback-json.rst
    - api_usage_examples
      - submit_listens.py
      - set_latest_import.py
      - get_listens.py
      - get_latest_import.py
    - api.rst
    - devel-env.rst
    - spark-devel-env.rst
    - spark-architecture.rst
    - json.rst
    - dump_examples
      - read_listens_dump.py
    - listenbrainz-dumps.rst
  - requirements.txt
  - index.rst
  - conf.py
  - .gitignore
- .dockerignore
- msb-test.sh
- mlhd_manage.py
- spark-submit.sh
- listenbrainz
  - follow_server
    - follow_server.py
    - __init__.py
    - dispatcher.py
  - config.py.sample
  - listenstore
    - influx_listenstore.py
    - redis_listenstore.py
    - __init__.py
    - tests
      - util.py
      - test_influxlistenstore.py
      - test_redislistenstore.py
      - __init__.py
    - listenstore.py
  - db
    - testing.py
    - exceptions.py
    - dump.py
    - licenses
      - COPYING-PublicDomain
      - README.md
    - dump_manager.py
    - feedback.py
    - lastfm_token.py
    - user.py
    - lastfm_user.py
    - stats.py
    - lastfm_session.py
    - __init__.py
    - tests
      - test_recommendations_cf_recording.py
      - test_lastfm_session.py
      - test_spotify.py
      - test_user.py
      - test_dump_manager.py
      - test_follow_list.py
      - test_dump.py
      - __init__.py
      - test_lastfm_token.py
      - test_feedback.py
      - test_lastfm_user.py
      - test_stats.py
    - model
      - feedback.py
      - __init__.py
    - recommendations_cf_recording.py
    - spotify.py
    - follow_list.py
  - webserver
    - testing.py
    - decorators.py
    - test_rabbitmq_connection.py
    - static_manager.py
    - views
      - index.py
      - api_tools.py
      - test
        test_user.py
        test_index.py
        test_status.py
        test_profile.py
        __init__.py
        test_follow.py
        test_login.py
      - feedback_api.py
      - api_compat.py
      - user.py
      - profile.py
      - player.py
      - api.py
      - stats_api.py
      - follow.py
      - recommendations_cf_recording_api.py
      - follow_api.py
      - __init__.py
      - login.py
      - api_compat_deprecated.py
      - status_api.py
    - redis_connection.py
    - admin
      - views.py
      - __init__.py
      - test_admin.py
    - rate_limiter.py
    - test
      - test_utils.py
      - __init__.py
      - test_api_errors.py
    - scheduler.py
    - templates
      - macros.html
      - index
        roadmap.html
        data.html
        gdpr.html
        api-docs.html
        lastfm-proxy.html
        contribute.html
        follow.html
        faq.html
        goals.html
        current-status.html
        recent.html
        index.html
        player.html
      - user
        auth.html
        profile.html
        import.html
        base.html
        spotify.html
        export.html
        resettoken.html
        charts.html
      - base-react.html
      - admin
        home.html
        master.html
      - base.html
      - profile
        delete_listens.html
        resetlatestimportts.html
        delete.html
        info.html
      - errors
        413.html
        401.html
        base.html
        404.html
        503.html
        403.html
        400.html
        500.html
      - navbar.html
      - emails
        data_dump_created_notification.txt
        cf_recording_recommendation_notification.txt
        user_stats_notification.txt
        cf_recording_model_upload_notification.txt
        spotify_import_error.txt
        dump_import_notification.txt
        artist_relation_import_notification.txt
        mapping_import_notification.txt
        cf_recording_dataframes_upload_notification.txt
        cf_candidate_sets_upload_notification.txt
      - login
        login.html
    - external
      - messybrainz.py
      - __init__.py
    - influx_connection.py
    - rabbitmq_connection.py
    - flash.py
    - __init__.py
    - utils.py
    - errors.py
    - postgres_connection.py
    - static
      - robots.txt
      - img
        navbar_logo.svg
        MetaBrainz_logo_no_text.svg
        musicbrainz.svg
        musicbrainz-16.svg
        logo_big.svg
        metabrainz.svg
        listenbrainz-logo.svg
      - fonts
        glyphicons-halflings-regular.woff
        glyphicons-halflings-regular.eot
        glyphicons-halflings-regular.woff2
        glyphicons-halflings-regular.ttf
        glyphicons-halflings-regular.svg
      - js
        src
        LastFMImporterModal.test.tsx
        LastFMImporter.tsx
        __snapshots__
        YoutubePlayer.test.tsx.snap
        LastFMImporter.test.tsx.snap
        LastFMImporterModal.test.tsx.snap
        RecentListens.test.tsx.snap
        SpotifyPlayer.test.tsx.snap
        Loader.test.tsx.snap
        BrainzPlayer.test.tsx.snap
        PlaybackControls.test.tsx.snap
        ErrorBoundary.test.tsx.snap
        SoundcloudPlayer.test.tsx.snap
        SoundcloudPlayer.test.tsx
        PlaybackControls.test.tsx
        Scrobble.ts
        Loader.test.tsx
        LastFMImporterModal.tsx
        RecentListens.tsx
        FollowUsers.tsx
        SpotifyPlayer.tsx
        ErrorBoundary.test.tsx
        BrainzPlayer.tsx
        ErrorBoundary.tsx
        index.jsx
        Importer.tsx
        APIError.ts
        RecentListens.test.tsx
        PlaybackControls.tsx
        SoundcloudPlayer.tsx
        Importer.test.ts
        YoutubePlayer.test.tsx
        LastFMImporter.test.tsx
        __mocks__
        recentListensProps.json
        userArtistsProcessData.json
        userReleasesProcessData.json
        getInfo.json
        userReleases.json
        getInfoNoPlayCount.json
        recentListensPropsTooManyListens.json
        userArtists.json
        recentListensPropsPlayingNow.json
        encodeScrobbleOutput.json
        userRecordings.json
        userRecordingsProcessData.json
        page.json
        recentListensPropsOneListen.json
        Loader.tsx
        types.d.ts
        SpotifyPlayer.test.tsx
        BrainzPlayer.test.tsx
        stats
        __snapshots__
        UserEntityChart.test.tsx.snap
        Bar.test.tsx
        UserEntityChart.tsx
        UserEntityChart.test.tsx
        Bar.tsx
        YoutubePlayer.tsx
        APIService.test.ts
        APIService.ts
        utils.tsx
        node_modules
        react-youtube
        index.d.ts
        info.js
        lib
        jquery.timeago.js
        bootstrap.min.js
        soundcloud-player-api.js
        jquery-2.1.0.min.js
        spotify-player-sdk-1.7.1.js
        less.min.js
      - .gitignore
      - css
        main.less
        listens-page.less
        theme
        links.less
        boostrap
        responsive-embed.less
        pagination.less
        labels.less
        normalize.less
        navbar.less
        wells.less
        glyphicons.less
        navs.less
        pager.less
        scaffolding.less
        close.less
        panels.less
        input-groups.less
        list-group.less
        media.less
        alerts.less
        forms.less
        button-groups.less
        jumbotron.less
        carousel.less
        responsive-utilities.less
        component-animations.less
        modals.less
        utilities.less
        breadcrumbs.less
        thumbnails.less
        theme.less
        badges.less
        type.less
        progress-bars.less
        tables.less
        code.less
        popovers.less
        dropdowns.less
        boostrap.less
        mixins.less
        grid.less
        tooltip.less
        mixins
        opacity.less
        nav-vertical-align.less
        pagination.less
        labels.less
        image.less
        vendor-prefixes.less
        border-radius.less
        text-emphasis.less
        hide-text.less
        panels.less
        tab-focus.less
        list-group.less
        responsive-visibility.less
        table-row.less
        alerts.less
        forms.less
        reset-filter.less
        gradients.less
        nav-divider.less
        reset-text.less
        text-overflow.less
        clearfix.less
        progress-bar.less
        center-block.less
        grid.less
        resize.less
        grid-framework.less
        size.less
        background-variant.less
        buttons.less
        variables.less
        print.less
        buttons.less
        theme.less
        variables.less
        navbars.less
        buttons.less
        highlight.css
        .gitignore
    - login
      - provider.py
      - __init__.py
  - spotify_updater
    - spotify_read_listens.py
    - __init__.py
    - tests
      - test_spotify_read_listens.py
      - data
        spotify_play_two_artists.json
        spotify_play_no_isrc.json
      - __init__.py
  - testdata
    - user_listening_activity_db.json
    - cf_recommendations_db_data_for_api_test_recording.json
    - user_export_test.json
    - invalid_artist_mbid.json
    - artist_name_list.json
    - user_top_releases_db_data_for_api_test_year.json
    - too_long_tag.json
    - same_timestamp_diff_track_valid_single.json
    - user_top_recordings_db.json
    - user_top_recordings_db_data_for_api_test.json
    - single_more_than_one_listen.json
    - user_top_releases_db.json
    - user_top_artists_db.json
    - user_top_recordings_db_data_for_api_test_year.json
    - user_top_artists_db_data_for_api_test_week.json
    - invalid_release_mbid.json
    - user_top_artists_db_data_for_api_test.json
    - playing_now_with_duration.json
    - same_timestamp_diff_track_valid_single_2.json
    - too_many_tags.json
    - too_large_listen.json
    - user_top_artists_db_data_for_api_test_month.json
    - playing_now_more_than_one_listen.json
    - invalid_recording_mbid.json
    - playing_now_with_ts.json
    - playing_now_with_duration_ms.json
    - valid_import.json
    - valid_playing_now.json
    - user_top_artists_db_data_for_api_test_year.json
    - user_top_artists_db_data_for_api_test_too_many.json
    - additional_info.json
    - same_timestamp_diff_track_valid_single_3.json
    - user_top_recordings_db_data_for_api_test_week.json
    - same_batch_duplicates.json
    - user_listening_activity_db_data_for_api_test_year.json
    - user_top_recordings_db_data_for_api_test_too_many.json
    - user_top_releases_db_data_for_api_test_too_many.json
    - user_listening_activity_db_data_for_api_test.json
    - user_listening_activity_db_data_for_api_test_month.json
    - user_listening_activity_db_data_for_api_test_week.json
    - playing_now_ts.json
    - user_top_releases_db_data_for_api_test_week.json
    - valid_single.json
    - user_top_releases_db_data_for_api_test.json
    - timestamp_in_ns.json
    - user_top_releases_db_data_for_api_test_month.json
    - influx_listenstore_test_listens.json
    - user_top_recordings_db_data_for_api_test_month.json
  - server.py
  - bigquery_writer
    - bigquery_writer.py
    - __init__.py
    - test_bigquery_writer.py
  - redis_keys.py
  - bigquery
    - user.py
    - __init__.py
  - api_compat.py
  - listen_replay
    - cli.py
    - __init__.py
    - utils.py
    - replay_user.py
  - listen_writer.py
  - spark
    - test_handlers.py
    - test_query_list.py
    - request_manage.py
    - __init__.py
    - spark_reader.py
    - request_queries.json
    - handlers.py
    - test_request_manage.py
  - listen.py
  - __init__.py
  - utils.py
  - domain
    - __init__.py
    - tests
      - test_spotify.py
      - __init__.py
    - spotify.py
  - tests
    - integration
      - test_influx_writer.py
      - test_api_compat.py
      - test_recommendations_cf_api.py
      - test_api_compat_deprecated.py
      - test_stats_api.py
      - test_feedback_api.py
      - test_profile_views.py
      - __init__.py
      - test_api.py
    - __init__.py
    - utils.py
    - unit
      - test_utils.py
      - test_listen.py
      - test_listen_writer.py
  - model
    - user.py
    - __init__.py
    - spotify.py
  - stats
    - exceptions.py
    - user.py
    - __init__.py
    - utils.py
    - tests
      - __init__.py
      - test_stats.py
    - sitewide.py
  - rtd_config.py
  - influx_writer
    - influx_writer.py
    - count_flusher.py
    - __init__.py

import googleapiclient
import logging
import os
import time

from flask import current_app
from googleapiclient import discovery
from googleapiclient.errors import HttpError
from listenbrainz import config
from oauth2client.client import GoogleCredentials

# Path of the BigQuery credentials file. It is read from the environment once,
# when this module is imported, and is None when the variable is not set.
APP_CREDENTIALS_FILE = os.getenv('GOOGLE_APPLICATION_CREDENTIALS')

# Seconds to sleep between two job status checks, and between retries when
# fetching the first page of results fails with an HttpError.
JOB_COMPLETION_CHECK_DELAY = 5

# Seconds to sleep before re-running a DML query that failed with a 400 error.
DML_STREAMING_ROWS_DELAY = 30


def create_bigquery_object():
    """ Initiates the connection to Google BigQuery. Returns a BigQuery object.

        The path of the credentials file is taken from APP_CREDENTIALS_FILE, which is
        read from the GOOGLE_APPLICATION_CREDENTIALS environment variable when this
        module is imported.

        Returns: the object built by discovery.build for the 'bigquery' 'v2' API

        Raises:
            NoCredentialsVariableException: if the environment variable was unset or empty
            NoCredentialsFileException: if the path it points to does not exist
    """

    if not APP_CREDENTIALS_FILE:
        # the message names the variable exactly as it is read from the environment,
        # so that whoever reads the log can copy it as is
        current_app.logger.error("The GOOGLE_APPLICATION_CREDENTIALS variable is undefined, cannot connect to BigQuery")
        raise NoCredentialsVariableException

    if not os.path.exists(APP_CREDENTIALS_FILE):
        current_app.logger.error("The BigQuery credentials file does not exist, cannot connect to BigQuery")
        raise NoCredentialsFileException

    credentials = GoogleCredentials.get_application_default()
    return discovery.build('bigquery', 'v2', credentials=credentials)


def get_parameters_dict(parameters):
    """ Builds the query parameter list in the layout that the BigQuery API expects.
        The layout is described here:
        https://developers.google.com/resources/api-libraries/documentation/bigquery/v2/python/latest/bigquery_v2.jobs.html#query

        Args: parameters: an iterable of dictionaries of the following form
                {
                    "name" (str): name of the parameter,
                    "type" (str): type of the parameter,
                    "value" (str): value of the parameter
                }

        Returns: A new list with one dictionary per parameter, in the same order, where
                 the type is nested under "parameterType" and the value under "parameterValue"
    """

    return [
        {
            "name": entry["name"],
            "parameterType": {"type": entry["type"]},
            "parameterValue": {"value": entry["value"]},
        }
        for entry in parameters
    ]


def wait_for_completion(projectId, jobId, bigquery=None, location=None):
    """ Make requests periodically until the passed job has been completed

        Args:
            projectId: ID of the project the job belongs to
            jobId: ID of the job to wait for
            bigquery: the bigquery connection object used to poll the job; when it is
                omitted a new one is created with create_bigquery_object()
            location: the location entry of the job reference, if it has one; it is
                forwarded to the API only when it is set

        Note: This blocks the caller. HttpErrors are logged and the request is retried
              after JOB_COMPLETION_CHECK_DELAY seconds, without any upper bound.
    """

    if bigquery is None:
        bigquery = create_bigquery_object()

    job_reference = {"projectId": projectId, "jobId": jobId}
    if location is not None:
        job_reference["location"] = location

    while True:
        try:
            job = bigquery.jobs().get(**job_reference).execute(num_retries=5)
        except HttpError as err:
            current_app.logger.error("HttpError while waiting for completion of job: {}".format(err), exc_info=True)
        else:
            if job["status"]["state"] == "DONE":
                return

        time.sleep(JOB_COMPLETION_CHECK_DELAY)


def format_results(data):
    """ The data returned by BigQuery contains a dict for the schema and a separate dict for
        the rows. This function formats the data into a form similar to the data returned
        by sqlalchemy i.e. one dictionary per row, keyed by column name

        Args:
            data: a dict with a 'schema' key (holding a 'fields' list of dicts that have a
                'name') and an optional 'rows' key (a list of dicts whose 'f' list holds
                one {'v': value} dict per column)

        Returns: a list of dicts, empty if there are no rows
    """

    rows = data.get('rows') or []
    if not rows:
        # nothing to format, so the schema is not needed either
        return []

    column_names = [field['name'] for field in data['schema']['fields']]
    return [
        {column_names[index]: cell['v'] for index, cell in enumerate(row['f'])}
        for row in rows
    ]


def _get_query_results_page(bigquery, job_reference, error_message, page_token=None):
    """ Fetch one page of results of a job, retrying after a delay for as long as the
        request fails with an HttpError. error_message is the prefix of the logged line.
    """

    request_args = dict(job_reference)
    if page_token is not None:
        request_args["pageToken"] = page_token

    while True:
        try:
            return bigquery.jobs().getQueryResults(**request_args).execute(num_retries=5)
        except HttpError as err:
            current_app.logger.error("{}: {}".format(error_message, err), exc_info=True)
            # sleep before trying again so that a failing endpoint is not hammered
            time.sleep(JOB_COMPLETION_CHECK_DELAY)


def run_query(bigquery, query, parameters=None, dml=False):
    """ Run provided query on Google BigQuery and return the formatted results

        Args:
            bigquery: the bigquery connection object
            query: the BigQuery standard SQL query (not legacy SQL)
            parameters: the parameters to be passed to the query
            dml: a flag which specifies whether the query is a DML (insert, update, delete) query
                or not

        Returns: a list with one dictionary per result row, keyed by column name (see
                 format_results), or None if dml is set

        Raises:
            HttpError: if submitting the query fails, except for 400 errors on DML queries
                which are retried after DML_STREAMING_ROWS_DELAY seconds

        Note: This is a synchronous action
    """

    # Run the query
    # NOTE(review): the default dataset is read from current_app.config while the project
    # of the request below comes from listenbrainz.config - confirm they always agree.
    query_body = {
        "kind": "bigquery#queryRequest",
        "parameterMode": "NAMED",
        # the request field is spelled in camelCase like every other key of the body
        "defaultDataset": {
            "projectId": current_app.config['BIGQUERY_PROJECT_ID'],
            "datasetId": current_app.config['BIGQUERY_DATASET_ID'],
        },
        "useLegacySql": False,
        "queryParameters": get_parameters_dict(parameters) if parameters else [],
        "query": query,
    }

    while True:
        try:
            response = bigquery.jobs().query(
                projectId=config.BIGQUERY_PROJECT_ID,
                body=query_body).execute(num_retries=5)
            break
        except HttpError as e:
            # BigQuery does not allow deletion of rows which may be
            # in the streaming buffer, so if an error is returned
            # because of that, sleep and try again.
            current_app.logger.error('HttpError while running query %s: %s', query, str(e), exc_info=True)
            if dml and '400' in str(e):
                time.sleep(DML_STREAMING_ROWS_DELAY)
            else:
                raise

    job_reference = response['jobReference']

    # Check response to see if query was completed before request timeout.
    # If it wasn't, wait until it has been completed. The flag is set on both
    # paths because it is read again below.
    have_results = bool(response['jobComplete'])
    if not have_results:
        wait_for_completion(bigquery=bigquery, **job_reference)

    # if this is a dml query then we don't need results.
    if dml:
        return

    if have_results:
        first_page = response
    else:
        first_page = _get_query_results_page(
            bigquery,
            job_reference,
            "HttpError when getting first page after completion of job",
        )

    # a page carries no 'rows' key when it has no rows, e.g. for an empty result
    data = {
        'schema': first_page['schema'],
        'rows': list(first_page.get('rows', [])),
    }

    # keep making requests until a page comes without a page token, which
    # means that we have all the results
    page_token = first_page.get('pageToken')
    while page_token:
        page = _get_query_results_page(
            bigquery,
            job_reference,
            "HttpError when getting query results",
            page_token=page_token,
        )
        data['rows'].extend(page.get('rows', []))
        page_token = page.get('pageToken')

    return format_results(data)


# Exceptions
class BigQueryException(Exception):
    """ Base class of the exceptions defined in this module. """


class NoCredentialsVariableException(BigQueryException):
    """ Raised by create_bigquery_object when APP_CREDENTIALS_FILE is unset or empty. """


class NoCredentialsFileException(BigQueryException):
    """ Raised by create_bigquery_object when the file at APP_CREDENTIALS_FILE does not exist. """