Python source code of metric

Project: asteroid (GitHub Link)

asteroid-master
- .github
  - ISSUE_TEMPLATE
    - how-to-question.md
    - feature_request.md
    - documentation.md
    - bug_report.md
- egs
  - whamr
    - TasNet
      - utils
        prepare_python_env.sh
        parse_options.sh
      - eval.py
      - run.sh
      - model.py
      - train.py
      - README.md
      - local
        preprocess_whamr.py
        prepare_data.sh
        convert_sphere2wav.sh
        conf.yml
    - README.md
  - wsj0-mix
    - README.md
    - DeepClustering
      - utils
        prepare_python_env.sh
        parse_options.sh
      - eval.py
      - run.sh
      - model.py
      - train.py
      - README.md
      - local
        preprocess_wsj0mix.py
        convert_sphere2wav.sh
        conf.yml
      - requirements.txt
  - musdb18
    - README.md
    - OpenUnmix
      - test_dataloader.py
  - sms_wsj
    - CaCGMM
      - utils
        prepare_python_env.sh
        parse_options.sh
      - start_evaluation.py
      - run.sh
      - README.md
      - local
        prepare_data.sh
        conf.yml
    - README.md
  - fuss
    - baseline
      - utils
        prepare_python_env.sh
        parse_options.sh
      - run.sh
      - local
        get_dev_data.sh
        data_augmentation.sh
    - README.md
  - kinect-wsj
    - README.md
    - DeepClustering
      - utils
        prepare_python_env.sh
        parse_options.sh
      - eval.py
      - run.sh
      - model.py
      - train.py
      - README.md
      - local
        preprocess_kinect_wsj.py
        convert_sphere2wav.sh
        conf.yml
      - requirements.txt
  - README.md
  - dns_challenge
    - baseline
      - utils
        prepare_python_env.sh
        parse_options.sh
      - eval_on_synthetic.py
      - run.sh
      - model.py
      - train.py
      - local
        preprocess_dns.py
        download_data.sh
        install_git_lfs.sh
        conf.yml
        create_dns_dataset.sh
      - denoise.py
    - README.md
  - librimix
    - ConvTasNet
      - utils
        prepare_python_env.sh
        parse_options.sh
      - eval.py
      - run.sh
      - model.py
      - train.py
      - README.md
      - local
        prepare_data.sh
        create_local_metadata.py
        conf.yml
    - README.md
  - avspeech
    - looking-to-listen
      - utils
        parse_options.sh
      - eval.py
      - run.sh
      - model.py
      - train.py
      - local
        postprocess
        postprocess_audio.py
        __init__.py
        data_prep.yml
        loader
        remove_corrupt.py
        download.py
        generate_video_embedding.py
        constants
        __init__.py
        extract_audio.py
        remove_empty_audio.py
        __init__.py
        audio_mixer_generator.py
        frames.py
        __init__.py
        conf.yml
        requirements.txt
      - train
        config.py
        metric_utils.py
        __init__.py
        callbacks.py
        trainer.py
    - README.md
  - wham
    - TwoStep
      - utils
        prepare_python_env.sh
        parse_options.sh
      - eval.py
      - system.py
      - run.sh
      - model.py
      - train.py
      - README.md
      - local
        prepare_data.sh
        preprocess_wham.py
        convert_sphere2wav.sh
        conf.yml
    - DynamicMixing
      - utils
        get_training_stats.py
        prepare_python_env.sh
        parse_options.sh
      - eval.py
      - run.sh
      - model.py
      - train.py
      - README.md
      - local
        prepare_data.sh
        preprocess_wham.py
        resample_dataset.py
        augmented_wham.py
        convert_sphere2wav.sh
        conf.yml
      - requirements.txt
    - ConvTasNet
      - utils
        prepare_python_env.sh
        parse_options.sh
      - eval.py
      - run.sh
      - train.py
      - README.md
      - local
        prepare_data.sh
        preprocess_wham.py
        convert_sphere2wav.sh
        conf.yml
    - README.md
    - DPRNN
      - utils
        prepare_python_env.sh
        parse_options.sh
      - eval.py
      - run.sh
      - train.py
      - README.md
      - local
        prepare_data.sh
        preprocess_wham.py
        convert_sphere2wav.sh
        conf.yml
    - FilterbankDesign
      - model.py
      - train.py
      - local
        conf.yml
- .coveragerc
- model_cards
  - README.md
  - by_username
    - Cosentino
      - ConvTasNet_LibriMix_sepclean.md
      - ConvTasNet_LibriMix_sepnoisy.md
    - mpariente
      - DPRNNTasNet(ks=16)_WHAM_sepclean.md
      - ConvTasNet_WHAM_sepclean.md
      - DPRNNTasNet_WHAM_sepclean.md
- codecov.yml
- LICENSE
- CONTRIBUTING.md
- CHANGELOG.md
- notebooks
  - 02_Filterbank.ipynb
  - README.md
  - 01_AsteroidGettingStarted.ipynb
  - 03_PITLossWrapper.ipynb
- setup.py
- .travis.yml
- README.md
- tests
  - utils
    - utils_test.py
    - hub_utils_test.py
    - torch_utils_test.py
  - filterbanks
    - transforms_test.py
    - stft_test.py
    - filterbanks_test.py
  - metrics_test.py
  - models
    - publish_test.py
    - models_test.py
  - losses
    - loss_functions_test.py
    - pit_wrapper_test.py
  - engine
    - system_test.py
    - optimizers_test.py
  - README.md
  - masknn
    - activations_test.py
    - convolutional_test.py
    - norms_test.py
    - consistency_test.py
    - recurrent_test.py
- requirements.txt
- pylintrc
- .gitignore
- docs
  - Makefile
  - source
    - writing_a_new_loss.rst
    - why_use_asteroid.rst
    - losses.rst
    - running_a_recipe.rst
    - masknn.rst
    - index.rst
    - conf.py
    - supported_datasets.rst
    - _templates
      - theme_variables.jinja
    - _static
      - images
        asteroid_logo.svg
    - writing_a_new_filterbank.rst
    - filterbanks.rst
  - make.bat
  - README.md
  - requirements.txt
- hubconf.py
- MANIFEST.in
- asteroid
  - utils
    - deprecation_utils.py
    - parser_utils.py
    - generic_utils.py
    - hub_utils.py
    - torch_utils.py
    - __init__.py
  - filterbanks
    - stft_fb.py
    - griffin_lim.py
    - multiphase_gammatone_fb.py
    - param_sinc_fb.py
    - enc_dec.py
    - free_fb.py
    - analytic_free_fb.py
    - __init__.py
    - transforms.py
  - metrics.py
  - models
    - conv_tasnet.py
    - zenodo.py
    - publisher.py
    - __init__.py
    - README.md
    - dprnn_tasnet.py
    - base_models.py
  - losses
    - bark_matrix_8k.mat
    - bark_matrix_16k.mat
    - pmsqe.py
    - mse.py
    - __init__.py
    - cluster.py
    - multi_scale_spectral.py
    - stoi.py
    - sdr.py
    - pit_wrapper.py
  - engine
    - optimizers.py
    - system.py
    - __init__.py
  - data
    - dns_dataset.py
    - kinect_wsj.py
    - wham_dataset.py
    - musdb18_dataset.py
    - wsj0_mix.py
    - whamr_dataset.py
    - avspeech_dataset.py
    - librimix_dataset.py
    - __init__.py
  - __init__.py
  - scripts
    - asteroid_cli.py
    - __init__.py
  - masknn
    - convolutional.py
    - consistency.py
    - norms.py
    - activations.py
    - blocks.py
    - recurrent.py
    - __init__.py

import sys
import torch
import mir_eval
import numpy as np
from asteroid.data.avspeech_dataset import AVSpeechDataset


def snr(pred_signal: torch.Tensor, true_signal: torch.Tensor) -> torch.FloatTensor:
    """
        Compute the Signal-to-Noise Ratio (in dB) between two signals.

        The residual ``true_signal - pred_signal`` is treated as the noise;
        both powers are summed over every element of the tensors.

        Args:
            pred_signal (torch.Tensor): predicted signal spectrogram.
            true_signal (torch.Tensor): original signal spectrogram.

        Returns:
            Scalar tensor holding ``10 * log10(signal_power / noise_power)``.

    """
    signal_energy = true_signal.pow(2).sum()
    noise_energy = (true_signal - pred_signal).pow(2).sum()

    return 10 * torch.log10(signal_energy / noise_energy)

def sdr(pred_signal: torch.Tensor, true_signal: torch.Tensor) -> torch.FloatTensor:
    """
        Compute the Signal-to-Distortion Ratio between two sets of signals.

        Each source along the first axis is converted with
        ``AVSpeechDataset.decode`` and the decoded signals are scored with
        ``mir_eval.separation.bss_eval_sources``.

        Args:
            pred_signal (torch.Tensor): predicted signal spectrogram, one
                source per index of the first dimension.
            true_signal (torch.Tensor): original signal spectrogram, indexed
                the same way.

        Returns:
            The first of the four values produced by ``bss_eval_sources``.
            NOTE(review): mir_eval presumably returns a NumPy array here, not
            the annotated ``torch.FloatTensor`` - confirm against callers.

    """
    num_src = pred_signal.shape[0]
    buffer_shape = (num_src, 48_000)

    # One row per source; every decoded signal must fit a 48 000-sample row.
    estimated_wavs = np.zeros(buffer_shape)
    reference_wavs = np.zeros(buffer_shape)

    for src in range(num_src):
        estimated_wavs[src] = AVSpeechDataset.decode(pred_signal[src, ...]).numpy()
        reference_wavs[src] = AVSpeechDataset.decode(true_signal[src, ...]).numpy()

    # The true-signal waveforms are passed first, then the predictions.
    # Only the first of the four returned values is used.
    distortion, _sir, _sar, _perm = mir_eval.separation.bss_eval_sources(
        reference_wavs, estimated_wavs
    )

    return distortion