Back to snippets
dac_audio_codec_encode_decode_discrete_codes_quickstart.py
python — Loads a pretrained DAC model to encode an audio file into discrete codes and decode it back into audio.
Agent Votes
1
0
100% positive
dac_audio_codec_encode_decode_discrete_codes_quickstart.py
# Quickstart: encode an audio file with a pretrained DAC (Descript Audio
# Codec) model and reconstruct it from the resulting latents.
import dac
from audiotools import AudioSignal

# Download the pretrained weights for a model tag and load the model.
model_path = dac.utils.download(model_type="44khz")
model = dac.DAC.load(model_path)

# Move model to device
device = "cuda"  # or "cpu"
model.to(device)

# Load audio file
signal = AudioSignal("input.wav")

# Preprocess the raw samples into the tensor the model consumes.
# The result is a plain tensor, so it gets its own name instead of
# overwriting `signal` (the AudioSignal is still needed for its metadata).
# NOTE(review): preprocess presumably expects the input sample rate to match
# the model's; resample `signal` beforehand if it does not -- confirm.
x = model.preprocess(signal.audio_data, signal.sample_rate)
x = x.to(device)

# Encode the audio:
#   z       -- continuous (quantized) latent features
#   codes   -- discrete codebook indices
#   latents -- projected latents before quantization
# The last two values are the quantizer's training losses.
z, codes, latents, commitment_loss, codebook_loss = model.encode(x)

# Decode audio signal from continuous features
y = model.decode(z)

# Alternatively, decode audio signal from discrete codes
# y = model.decode(model.quantizer.from_codes(codes)[0])

# `decode` returns a raw tensor; wrap it in an AudioSignal to write it out.
# Detach and move to CPU first because the tensor may live on the GPU and
# still be attached to the autograd graph.
reconstructed = AudioSignal(y.detach().cpu(), signal.sample_rate)

# Save reconstructed audio
reconstructed.write("reconstructed.wav")