Lightning-AI · Borda · Jun 22, 2021 · Jun 13, 2021 · Jun 13, 2021 · Jun 13, 2021
@@ -17,7 +17,7 @@ jobs:
  pytorch-version: [1.3, 1.4, 1.5, 1.6, 1.7, 1.8, 1.9]
 
  # Timeout: https://stackoverflow.com/a/59076067/4521646
- timeout-minutes: 35
+ timeout-minutes: 55
  steps:
  - uses: actions/checkout@v2
 
@@ -54,9 +54,11 @@ jobs:
 
  - name: Update Environment
  run: |
+ sudo apt install -y libsndfile1  # -y: the CI shell has no TTY to answer apt's confirmation prompt
  conda info
  conda install mkl pytorch=${{ matrix.pytorch-version }} cpuonly
  conda install cpuonly $(python ./requirements/adjust-versions.py conda)
+ conda install -c conda-forge ffmpeg
  conda list
  pip --version
  python ./requirements/adjust-versions.py requirements.txt

@@ -26,7 +26,7 @@ jobs:
  requires: 'minimal'
 
  # Timeout: https://stackoverflow.com/a/59076067/4521646
- timeout-minutes: 35
+ timeout-minutes: 55
 
  steps:
  - uses: actions/checkout@v2
@@ -43,7 +43,15 @@ jobs:
  - name: Setup macOS
  if: runner.os == 'macOS'
  run: |
- brew install libomp # https://github.com/pytorch/pytorch/issues/20030
+ brew install gcc libomp ffmpeg # https://github.com/pytorch/pytorch/issues/20030
+ - name: Setup Linux
+ if: runner.os == 'Linux'
+ run: |
+ sudo apt install -y ffmpeg
+ - name: Setup Windows
+ if: runner.os == 'Windows'  # same spelling style as the 'macOS' / 'Linux' conditions of the sibling steps
+ run: |
+ choco install ffmpeg
 
  - name: Set min. dependencies
  if: matrix.requires == 'minimal'
@@ -70,7 +78,6 @@ jobs:
 
  - name: Install dependencies
  run: |
- python --version
  pip --version
  pip install --requirement requirements.txt --upgrade --find-links https://download.pytorch.org/whl/cpu/torch_stable.html
  python ./requirements/adjust-versions.py requirements.txt

@@ -52,7 +52,7 @@ jobs:
  pip list
  - name: mypy
  run: |
- mypy
+ mypy --show-error-codes
 
 # format-check-yapf:
 # runs-on: ubuntu-20.04

@@ -36,6 +36,12 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 - Added `is_differentiable` property to `ConfusionMatrix`, `F1`, `FBeta`, `Hamming`, `Hinge`, `IOU`, `MatthewsCorrcoef`, `Precision`, `Recall`, `PrecisionRecallCurve`, `ROC`, `StatScores` ([#253](https://github.com/PyTorchLightning/metrics/pull/253))
 
 
+- Added audio metrics: SNR, SI_SDR, SI_SNR ([#292](https://github.com/PyTorchLightning/metrics/pull/292))
+
+
+- Added Inception Score metric to image module ([#299](https://github.com/PyTorchLightning/metrics/pull/299))
+
+
 ### Changed
 
 - Forward cache is now reset when `reset` method is called ([#260](https://github.com/PyTorchLightning/metrics/pull/260))

@@ -19,14 +19,14 @@ pr:
 jobs:
  - job: pytest
  # how long to run the job before automatically cancelling
- timeoutInMinutes: 25
+ timeoutInMinutes: 45
  # how much time to give 'run always even if cancelled tasks' before stopping them
  cancelTimeoutInMinutes: 2
 
  pool: gridai-spot-pool
 
  container:
- image: "pytorch/pytorch:1.7.1-cuda11.0-cudnn8-runtime"
+ image: "pytorch/pytorch:1.8.1-cuda11.1-cudnn8-runtime"
  options: "--runtime=nvidia -e NVIDIA_VISIBLE_DEVICES=all"
 
  workspace:
@@ -44,11 +44,14 @@ jobs:
  displayName: 'Image info & NVIDIA'
 
  - bash: |
- #sudo apt-get install -y cmake
+ sudo apt-get update
+ sudo apt install -y cmake ffmpeg git libsndfile1
  # python -m pip install "pip==20.1"
  pip install --requirement ./requirements/devel.txt --upgrade-strategy only-if-needed
  pip uninstall -y torchmetrics
  pip list
+ env:
+ DEBIAN_FRONTEND: noninteractive
  displayName: 'Install dependencies'
 
  - bash: |

@@ -5,6 +5,31 @@
 Functional metrics
 ##################
 
+*************
+Audio Metrics
+*************
+
+si_sdr [func]
+~~~~~~~~~~~~~
+
+.. autofunction:: torchmetrics.functional.si_sdr
+ :noindex:
+
+
+si_snr [func]
+~~~~~~~~~~~~~
+
+.. autofunction:: torchmetrics.functional.si_snr
+ :noindex:
+
+
+snr [func]
+~~~~~~~~~~
+
+.. autofunction:: torchmetrics.functional.snr
+ :noindex:
+
+
 **********************
 Classification Metrics
 **********************

@@ -18,6 +18,46 @@ your own metric type might be too burdensome.
 .. autoclass:: torchmetrics.AverageMeter
  :noindex:
 
+*************
+Audio Metrics
+*************
+
+About Audio Metrics
+~~~~~~~~~~~~~~~~~~~
+
+For the purposes of audio metrics, inputs (predictions, targets) must have the same size.
+ If the inputs are 1D tensors, the output will be a scalar. If the inputs are multi-dimensional with shape ``[..., time]``, the metric will be computed over the ``time`` dimension.
+
+.. doctest::
+
+ >>> import torch
+ >>> from torchmetrics import SNR
+ >>> target = torch.tensor([3.0, -0.5, 2.0, 7.0])
+ >>> preds = torch.tensor([2.5, 0.0, 2.0, 8.0])
+ >>> snr = SNR()
+ >>> snr_val = snr(preds, target)
+ >>> snr_val
+ tensor(16.1805)
+
+SI_SDR
+~~~~~~
+
+.. autoclass:: torchmetrics.SI_SDR
+ :noindex:
+
+SI_SNR
+~~~~~~
+
+.. autoclass:: torchmetrics.SI_SNR
+ :noindex:
+
+SNR
+~~~
+
+.. autoclass:: torchmetrics.SNR
+ :noindex:
+
+
 **********************
 Classification Metrics
 **********************
@@ -257,9 +297,17 @@ Image Quality Metrics
 Image quality metrics can be used to assess the quality of synthetically generated images from machine
 learning algorithms such as `Generative Adversarial Networks (GANs) <https://en.wikipedia.org/wiki/Generative_adversarial_network>`_.
 
+FID
+~~~
+
 .. autoclass:: torchmetrics.FID
  :noindex:
 
+IS
+~~
+
+.. autoclass:: torchmetrics.IS
+ :noindex:
 
 ******************
 Regression Metrics

@@ -19,3 +19,8 @@ nltk>=3.6
 
 # add extra requirements
 -r image.txt
+
+# audio
+pypesq
+mir_eval>=0.6
+https://github.com/aliutkus/speechmetrics/archive/refs/heads/master.zip
@@ -0,0 +1,131 @@
+# Copyright The PyTorch Lightning team.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from collections import namedtuple
+from functools import partial
+
+import pytest
+import speechmetrics
+import torch
+from torch import Tensor
+
+from tests.helpers import seed_all
+from tests.helpers.testers import BATCH_SIZE, NUM_BATCHES, MetricTester
+from torchmetrics.audio import SI_SDR
+from torchmetrics.functional import si_sdr
+from torchmetrics.utilities.imports import _TORCH_GREATER_EQUAL_1_6
+
+seed_all(42)
+
+Time = 100
+
+Input = namedtuple('Input', ["preds", "target"])
+
+inputs = Input(
+ preds=torch.rand(NUM_BATCHES, BATCH_SIZE, 1, Time),
+ target=torch.rand(NUM_BATCHES, BATCH_SIZE, 1, Time),
+)
+
+speechmetrics_sisdr = speechmetrics.load('sisdr')
+
+
+def speechmetrics_si_sdr(preds: Tensor, target: Tensor, zero_mean: bool):
+ # shape: preds [BATCH_SIZE, 1, Time] , target [BATCH_SIZE, 1, Time]
+ # or shape: preds [NUM_BATCHES*BATCH_SIZE, 1, Time] , target [NUM_BATCHES*BATCH_SIZE, 1, Time]
+ if zero_mean:
+ preds = preds - preds.mean(dim=2, keepdim=True)
+ target = target - target.mean(dim=2, keepdim=True)
+ target = target.detach().cpu().numpy()
+ preds = preds.detach().cpu().numpy()
+ mss = []
+ for i in range(preds.shape[0]):
+ ms = []
+ for j in range(preds.shape[1]):
+ metric = speechmetrics_sisdr(preds[i, j], target[i, j], rate=16000)
+ ms.append(metric['sisdr'][0])
+ mss.append(ms)
+ return torch.tensor(mss)
+
+
+def average_metric(preds, target, metric_func):
+ # shape: preds [BATCH_SIZE, 1, Time] , target [BATCH_SIZE, 1, Time]
+ # or shape: preds [NUM_BATCHES*BATCH_SIZE, 1, Time] , target [NUM_BATCHES*BATCH_SIZE, 1, Time]
+ return metric_func(preds, target).mean()
+
+
+speechmetrics_si_sdr_zero_mean = partial(speechmetrics_si_sdr, zero_mean=True)
+speechmetrics_si_sdr_no_zero_mean = partial(speechmetrics_si_sdr, zero_mean=False)
+
+
+@pytest.mark.parametrize(
+ "preds, target, sk_metric, zero_mean",
+ [
+ (inputs.preds, inputs.target, speechmetrics_si_sdr_zero_mean, True),
+ (inputs.preds, inputs.target, speechmetrics_si_sdr_no_zero_mean, False),
+ ],
+)
+class TestSISDR(MetricTester):
+ atol = 1e-2
+
+ @pytest.mark.parametrize("ddp", [True, False])
+ @pytest.mark.parametrize("dist_sync_on_step", [True, False])
+ def test_si_sdr(self, preds, target, sk_metric, zero_mean, ddp, dist_sync_on_step):
+ self.run_class_metric_test(
+ ddp,
+ preds,
+ target,
+ SI_SDR,
+ sk_metric=partial(average_metric, metric_func=sk_metric),
+ dist_sync_on_step=dist_sync_on_step,
+ metric_args=dict(zero_mean=zero_mean),
+ )
+
+ def test_si_sdr_functional(self, preds, target, sk_metric, zero_mean):
+ self.run_functional_metric_test(
+ preds,
+ target,
+ si_sdr,
+ sk_metric,
+ metric_args=dict(zero_mean=zero_mean),
+ )
+
+ def test_si_sdr_differentiability(self, preds, target, sk_metric, zero_mean):
+ self.run_differentiability_test(
+ preds=preds,
+ target=target,
+ metric_module=SI_SDR,
+ metric_functional=si_sdr,
+ metric_args={'zero_mean': zero_mean}
+ )
+
+ @pytest.mark.skipif(
+ not _TORCH_GREATER_EQUAL_1_6, reason='half support of core operations on not support before pytorch v1.6'
+ )
+ def test_si_sdr_half_cpu(self, preds, target, sk_metric, zero_mean):
+ pytest.xfail("SI-SDR metric does not support cpu + half precision")
+
+ @pytest.mark.skipif(not torch.cuda.is_available(), reason='test requires cuda')
+ def test_si_sdr_half_gpu(self, preds, target, sk_metric, zero_mean):
+ self.run_precision_test_gpu(
+ preds=preds,
+ target=target,
+ metric_module=SI_SDR,
+ metric_functional=si_sdr,
+ metric_args={'zero_mean': zero_mean}
+ )
+
+
+def test_error_on_different_shape(metric_class=SI_SDR):
+ metric = metric_class()
+ with pytest.raises(RuntimeError, match='Predictions and targets are expected to have the same shape'):
+ metric(torch.randn(100, ), torch.randn(50, ))