-
-
Notifications
You must be signed in to change notification settings - Fork 23
/
librosa_example.py
42 lines (37 loc) · 1.31 KB
/
librosa_example.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
import torch
import librosa
import numpy as np
import matplotlib.pyplot as plt
from librosa import display, feature
from torchnmf.nmf import NMFD
if __name__ == '__main__':
y, sr = librosa.load(librosa.util.example_audio_file())
y = torch.from_numpy(y)
windowsize = 2048
S = torch.stft(y, windowsize, window=torch.hann_window(windowsize)).pow(2).sum(2).sqrt()
S = torch.FloatTensor(S).unsqueeze(0)
R = 3
T = 400
F = S.shape[0] - 1
net = NMFD(S.shape, T=T, rank=R).cuda()
net.fit(S.cuda(), verbose=True)
V = net()
W, H = net.W.detach().cpu().numpy(), net.H.squeeze().detach().cpu().numpy()
V = V.squeeze().detach().cpu().numpy()
if len(W.shape) < 3:
W = W.reshape(*W.shape, 1)
plt.figure(figsize=(10, 8))
for i in range(R):
plt.subplot(3, R, i + 1)
display.specshow(librosa.amplitude_to_db(W[:, i], ref=np.max), y_axis='log')
plt.title('Template ' + str(i + 1))
plt.subplot(3, 1, 2)
display.specshow(librosa.amplitude_to_db(H, ref=np.max), x_axis='time')
plt.colorbar()
plt.title('Activations')
plt.subplot(3, 1, 3)
display.specshow(librosa.amplitude_to_db(V, ref=np.max), y_axis='log', x_axis='time')
plt.colorbar(format='%+2.0f dB')
plt.title('Reconstructed spectrogram')
plt.tight_layout()
plt.show()