diff --git a/dataset_analysis/AnalyzeDataset.ipynb b/dataset_analysis/AnalyzeDataset.ipynb index 784784ef..1b04a746 100644 --- a/dataset_analysis/AnalyzeDataset.ipynb +++ b/dataset_analysis/AnalyzeDataset.ipynb @@ -753,7 +753,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.6.5" + "version": "3.7.2" } }, "nbformat": 4, diff --git a/setup.py b/setup.py index 0308dffb..d55e0c59 100644 --- a/setup.py +++ b/setup.py @@ -83,6 +83,7 @@ setup( # "lws", "tqdm", "phonemizer", + "soundfile", ], dependency_links=[ 'http://github.com/bootphon/phonemizer/tarball/master#egg=phonemizer' diff --git a/utils/audio.py b/utils/audio.py index 08dda0a8..83b929cb 100644 --- a/utils/audio.py +++ b/utils/audio.py @@ -1,5 +1,6 @@ import os import librosa +import soundfile as sf import pickle import copy import numpy as np @@ -230,7 +231,7 @@ class AudioProcessor(object): # return np.sign(signal) * magnitude def load_wav(self, filename, encode=False): - x, sr = librosa.load(filename, sr=self.sample_rate) + x, sr = sf.read(filename) if self.do_trim_silence: x = self.trim_silence(x) # sr, x = io.wavfile.read(filename)