diff --git a/src/ttsds/__about__.py b/src/ttsds/__about__.py
index bc1e75b..40ebfb7 100644
--- a/src/ttsds/__about__.py
+++ b/src/ttsds/__about__.py
@@ -1,4 +1,4 @@
 # SPDX-FileCopyrightText: 2024-present Christoph Minixhofer
 #
 # SPDX-License-Identifier: MIT
-__version__ = "0.0.3"
+__version__ = "0.0.4"
diff --git a/src/ttsds/__init__.py b/src/ttsds/__init__.py
index 3c67e9f..f489a0a 100644
--- a/src/ttsds/__init__.py
+++ b/src/ttsds/__init__.py
@@ -45,7 +45,11 @@
     "wada_snr": WadaSNRBenchmark,
 }
 
-with importlib.resources.path("ttsds", "data") as data_path:
+# files() returns a Traversable, which is not a context manager (pathlib.Path
+# lost that protocol in Python 3.13); as_file() supplies one and yields a
+# concrete filesystem path for the package directory.
+with importlib.resources.as_file(importlib.resources.files("ttsds")) as data_path:
+    data_path = data_path / "data"
     # if they don't exist, download from github
     for noise_name in [
         "esc50",
diff --git a/src/ttsds/benchmarks/speaker/dvector.py b/src/ttsds/benchmarks/speaker/dvector.py
index 343b97e..ec4860f 100644
--- a/src/ttsds/benchmarks/speaker/dvector.py
+++ b/src/ttsds/benchmarks/speaker/dvector.py
@@ -9,12 +9,10 @@
 from tqdm import tqdm
 import numpy as np
 
-with importlib.resources.path("ttsds", "data") as dp:
-    dvector_pt = dp / "dvector" / "dvector.pt"
-
-# wav_tensor, sample_rate = torchaudio.load("example.wav")
-# mel_tensor = wav2mel(wav_tensor, sample_rate)  # shape: (frames, mel_dim)
-# emb_tensor = dvector.embed_utterance(mel_tensor)  # shape: (emb_dim)
+# files() returns a Traversable, not a context manager, so join the path
+# directly rather than wrapping it in a `with` block.
+dp = importlib.resources.files("ttsds")
+dvector_pt = dp / "data" / "dvector" / "dvector.pt"
 
 from ttsds.benchmarks.benchmark import Benchmark, BenchmarkCategory, BenchmarkDimension
 from ttsds.util.dataset import Dataset