Extract audio from the .pcm files of the NST Swedish Speech Synthesis corpus.
The files are raw big-endian PCM at 44.1 kHz, preceded by a header of uncertain size (8 or 16 bytes?).
Corpus available here
import soundfile as sf
import IPython.display as ipd
import numpy
from IPython.display import Audio
# Path to one example recording to decode and listen to.
sample_file = "/content/sw_all_mf_01_5277.pcm"

# The file is opened as headerless RAW data, so every format detail
# (sample encoding, byte order, rate, channel count) is supplied by hand.
# NOTE(review): soundfile's `start` is expressed in frames, not bytes; with
# two 16-bit channels, 16 frames would be 64 bytes. Confirm that this skips
# the file's header as intended.
data, sr = sf.read(
    sample_file,
    format="RAW",
    subtype="PCM_16",
    endian="BIG",
    samplerate=44100,
    channels=2,
    dtype="int16",
    start=16,
)

# Play back only the channel at index 1 of the decoded array.
Audio(data[:, 1], rate=sr)