Python source code of utils

Project: freesound-datasets (GitHub Link)

freesound-datasets-master
- .env
- datasets
  - apps.py
  - fixtures
    - example_dog_cat_dataset.json
  - templates
    - datasets
      - download_script.py
      - taxonomy_node_info.html
      - refine_annotations.html
      - taxonomy_node.html
      - dataset_explore.html
      - dataset_releases_table.html
      - downloads.html
      - contribute_validate_annotations_category.html
      - contribute_validate_annotations_category_easy.html
      - dataset_taxonomy_choose_category_all.html
      - dataset.html
      - dataset_taxonomy_table_search.html
      - dataset_taxonomy_table_extended.html
      - sound_examples.html
      - contribute.html
      - dataset_taxonomy_table.html
      - ontology_tree.html
      - taxonomy_node_small_info.html
      - goal_progress_bar.html
      - contribute_validate_annotations_help.html
      - include_player_resources.html
      - taxonomy_node_mini_info.html
      - __init__.py
      - explore_taxonomy.html
      - player.html
      - contribute_validate_annotations.html
      - taxonomy_node_info_for_taxonomy_table.html
      - curate_sounds.html
      - download.html
      - dataset_taxonomy_choose_category.html
      - dataset_taxonomy_table_choose.html
  - freesound.py
  - templatetags
    - __init__.py
    - dataset_templatetags.py
    - general_templatetags.py
  - models.py
  - views.py
  - tasks.py
  - urls.py
  - forms.py
  - __init__.py
  - utils.py
  - migrations
    - 0024_annotation_ground_truth.py
    - 0014_auto_20170403_1541.py
    - 0053_auto_20181123_1420.py
    - 0028_profile_last_category_annotated.py
    - 0052_merge_20181106_1927.py
    - 0044_auto_20171116_1637.py
    - 0011_auto_20170322_1140.py
    - 0003_auto_20170314_1633.py
    - 0039_auto_20171020_1318.py
    - 0050_candidateannotation_priority_score.py
    - 0012_auto_20170322_1703.py
    - 0038_vote_from_test_page.py
    - 0051_auto_20180712_1733.py
    - 0002_remove_taxonomy_created.py
    - 0017_categorycomment_dataset.py
    - 0023_auto_20170623_1416.py
    - 0055_vote_from_expert.py
    - 0025_profile.py
    - 0048_taxonomynode_advanced_task.py
    - 0030_sound_deleted_in_freesound.py
    - 0018_auto_20170620_1305.py
    - 0026_vote_is_trustable.py
    - 0034_auto_20170919_1518.py
    - 0049_auto_20180220_1606.py
    - 0057_auto_20181205_1230.py
    - 0008_datasetrelease_processing_last_updated.py
    - 0032_auto_20170919_1233.py
    - 0029_taxonomynode_freesound_false_examples.py
    - 0046_vote_from_task.py
    - 0043_auto_20171116_1547.py
    - 0001_initial.py
    - 0059_taxonomynode_omitted_curation_task.py
    - 0004_auto_20170315_1150.py
    - 0050_auto_20180622_1604.py
    - 0005_auto_20170320_1615.py
    - 0019_auto_20170621_1528.py
    - 0058_auto_20181212_1231.py
    - 0052_auto_20180831_1652.py
    - 0035_taxonomynode_faq.py
    - 0015_vote_visited_sound.py
    - 0040_auto_20171020_1759.py
    - 0031_auto_20170919_1201.py
    - 0020_annotation_taxonomy_node.py
    - 0009_auto_20170322_1136.py
    - 0042_taxonomynode_propagate_to_parents.py
    - 0060_auto_20190219_1403.py
    - 0022_taxonomynode_priority_score.py
    - 0056_groundtruthannotation_from_candidate_annotations.py
    - 0007_auto_20170321_1741.py
    - 0010_auto_20170322_1139.py
    - __init__.py
    - 0037_taxonomynode_freesound_examples_verification.py
    - 0033_auto_20170919_1451.py
    - 0027_profile_countdown_trustable.py
    - 0041_auto_20171107_1609.py
    - 0054_merge_20181129_1304.py
    - 0045_auto_20171116_1744.py
    - 0016_categorycomment.py
    - 0021_remove_annotation_value.py
    - 0013_auto_20170324_2041.py
    - 0047_taxonomynode_beginner_task.py
    - 0036_auto_20171013_1837.py
    - 0006_datasetrelease.py
  - tests
    - test_models.py
    - __init__.py
    - test_views.py
  - admin.py
  - management
    - commands
      - refresh_sound_deleted_state.py
      - load_beginner_categories.py
      - load_freesound_false_examples.py
      - extract_votes.py
      - stem_dataset_sound_tags.py
      - clear_computing_keys.py
      - remove_non_leaf_annotations.py
      - update_taxonomy.py
      - propagate_ground_truth_annotations.py
      - load_sounds_for_dataset.py
      - generate_fake_data.py
      - transfer_user_votes.py
      - refresh_sound_extra_data.py
      - compute_priority_score_taxonomy_node.py
      - clear_store.py
      - compute_priority_score_candidate_annotations.py
      - create_taxonomy_node_instances.py
      - __init__.py
      - load_freesound_examples.py
      - load_taxonomy.py
    - __init__.py
- utils
  - async_tasks.py
  - redis_store.py
  - __init__.py
- LICENSE
- templates
  - discussion.html
  - base.html
  - faq.html
  - index.html
  - login.html
- manage.py
- uwsgi.ini
- example_sounds_dog_cat_dataset.json
- monitor
  - apps.py
  - templates
    - monitor
      - monitor_category.html
      - monitor_sound.html
      - mapping_category.html
      - monitor_user.html
      - monitor.html
  - models.py
  - views.py
  - tasks.py
  - urls.py
  - tests.py
  - __init__.py
  - migrations
    - __init__.py
  - admin.py
- .travis.yml
- README.md
- requirements.txt
- Dockerfile
- freesound_datasets
  - local_settings.example.py
  - freesound_auth_backend.py
  - wsgi.py
  - templatetags
    - __init__.py
  - views.py
  - urls.py
  - __init__.py
  - migrations
    - __init__.py
  - settings.py
  - celery.py
- .gitignore
- .dockerignore
- static
  - img
    - audioset_logo.svg
    - freesound_datasets_logo.afdesign
    - freesound_annotator_logo.afdesign
    - freesound_dataset_logo_a.svg
    - train_interface.gif
    - freesound_dataset_logo_b.afdesign
    - interface_sound.gif
    - audioset_logo_blue.svg
    - freesound_annotator_logo_for_white_bg.svg
    - freesound_dataset_logo_a.afdesign
    - mtg_upf_logo.svg
    - freesound_dataset_logo_b.svg
    - freesound_annotator_logo_for_black_bg.svg
    - freesound_datasets_logo.svg
    - freesound_annotator_logo.svg
    - funding_logos
    - freesound_logo.svg
  - bibtex
    - fonseca2017freesound.bib
  - semanticui
    - themes
      - default
        assets
        images
        fonts
        icons.woff
        icons.otf
        icons.woff2
        icons.eot
        icons.ttf
  - audio-annotator
    - fonts
      - roboto
        Roboto-Bold.eot
        Roboto-Regular.ttf
        Roboto-Medium.ttf
        Roboto-Bold.woff
        Roboto-Light.woff
        Roboto-Thin.woff
        Roboto-Light.ttf
        Roboto-Light.eot
        Roboto-Medium.woff2
        Roboto-Thin.eot
        Roboto-Thin.ttf
        Roboto-Medium.woff
        Roboto-Regular.woff2
        Roboto-Regular.woff
        Roboto-Bold.woff2
        Roboto-Regular.eot
        Roboto-Bold.ttf
        Roboto-Medium.eot
        Roboto-Thin.woff2
        Roboto-Light.woff2
    - js
      - src
        wavesurfer.js
        webaudio.js
        peakcache.js
        plugin
        cursor.js
        microphone.js
        elan.js
        regions.js
        mediasession.js
        minimap.js
        timeline.js
        spectrogram.js
        player.js
        util
        request-animation-frame.js
        extend.js
        style.js
        observer.js
        ajax.js
        frame.js
        max.js
        prevent-click.js
        min.js
        index.js
        get-id.js
        mediaelement.js
        html-init.js
        drawer.js
        wavesurfer.min.js
        drawer.multicanvas.js
      - lib
        jquery-2.2.3.min.js
        wavesurfer.spectrogram.min.js
        materialize.min.js
        wavesurfer.min.js
        wavesurfer.min.js.map
      - colormap
        gen_colormap.js
        gen_colormap.sh
        colormap.min.js
    - css
      - player.css
      - materialize.min.css
      - audio-annotator.css
  - js
    - jquery.min.js
    - d3.v3.min.js
    - main.js
    - dataTables.semanticui.min.js
    - jquery.dataTables.min.js
  - taxonomy-explorer
    - js
      - load-taxonomy.js
  - css
    - main.css
    - dataTables.semanticui.min.css
    - .Rhistory
    - exploreTaxonomy.css
    - popupUi.css
- docker-compose.yml

import os
from urllib.parse import urljoin
from django.conf import settings
from django.urls import reverse
from django.template.loader import render_to_string
import datasets.freesound as fs
from nltk import PorterStemmer


def generate_download_script(dataset):
    """Render the download-script template for ``dataset``.

    Two absolute URLs are built by joining ``settings.BASE_URL`` with the
    reversed ``get_access_token`` route and with the reversed
    ``dataset-sounds`` route (keyed by ``dataset.short_name``). They are
    handed, together with ``settings.FS_CLIENT_ID``, to the
    ``datasets/download_script.py`` template.

    Returns the output of ``render_to_string`` for that template.
    """
    base_url = settings.BASE_URL
    token_path = reverse('get_access_token')
    sounds_path = reverse('dataset-sounds', kwargs={"short_name": dataset.short_name})

    # NOTE(review): 'get_code_url' carries the Freesound client id, not a URL;
    # confirm against the template that this is what it expects.
    context = {
        'access_token_url': urljoin(base_url, token_path),
        'dataset_url': urljoin(base_url, sounds_path),
        'get_code_url': settings.FS_CLIENT_ID,
    }
    return render_to_string('datasets/download_script.py', context)


def chunks(l, n):
    """Lazily split ``l`` into consecutive slices of at most ``n`` items.

    ``l`` must support ``len()`` and slicing; every slice has the same type
    as ``l``. The final slice is shorter when ``len(l)`` is not a multiple
    of ``n``.
    """
    offsets = range(0, len(l), n)
    for start in offsets:
        stop = start + n
        yield l[start:stop]


def query_freesound_by_id(list_ids, fields="id,name", descriptors=""):
    """Query Freesound for the given sound ids, in batches of 50 ids.

    Args:
        list_ids: sequence of sound ids. It is split with ``chunks``, so it
            must support ``len()`` and slicing.
        fields: comma-separated list of fields requested for each sound.
            Defaults to ``"id,name"``.
        descriptors: forwarded unchanged to the search request.

    Returns:
        A list with the items obtained by iterating each batch's search
        result, in request order. Empty when ``list_ids`` is empty.
    """
    # One value drives both the number of ids per request and the requested
    # page size, presumably so every batch fits in a single result page.
    batch_size = 50

    client = fs.FreesoundClient()
    client.set_token(settings.FS_CLIENT_SECRET)

    results = []
    for sub_list_ids in chunks(list_ids, batch_size):
        filter_str = 'id:(' + ' OR '.join(str(i) for i in sub_list_ids) + ')'
        page_result = client.text_search(query="", fields=fields, page_size=batch_size,
                                         filter=filter_str, descriptors=descriptors)
        # Only the returned result object is iterated; no further pages are
        # requested here.
        results.extend(page_result)
    return results


def stem(word):
    """Return the stem of ``word`` as computed by NLTK's ``PorterStemmer``.

    A new stemmer instance is created on every call.
    """
    return PorterStemmer().stem(word)