-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathbert_visualization.py
More file actions
89 lines (81 loc) · 2.66 KB
/
Copy pathbert_visualization.py
File metadata and controls
89 lines (81 loc) · 2.66 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
import os
import random
import time
import matplotlib.pyplot as plt
import muspy
import numpy as np
import seaborn as sns
import torch
import torch.nn.functional as F
from torch.utils import data
from torch.utils.data.dataloader import DataLoader
from torch.utils.data.dataset import Dataset
from bert import PianoBERT
from config import BERTCONFIG
from preprocess import MidiDataset
from utils import emb_to_index
if __name__ == "__main__":
vis_attn = True
gen_midi = True
config = BERTCONFIG()
device = torch.device("cpu")
model = PianoBERT(
embedding_dim=config.EMBEDDING_DIM,
seq_length=config.SEQ_LENGTH,
num_heads=config.NUM_HEADS,
num_layers=config.NUM_LAYERS,
).to(device)
model.load_state_dict(
torch.load("checkpoints/checkpoints_07_CE_loss/model_epoch-2000.pt")[
"model_state_dict"
]
)
dataset = MidiDataset(seq_len=512, mask_prob=0.15)
loader = DataLoader(dataset, shuffle=True, batch_size=1, drop_last=True)
X, Y, mask = next(iter(loader))
# Forward pass
outputs = model(X)
indices = []
for output in outputs:
index = torch.argmax(output, dim=-1)
indices.append(index)
indices = torch.stack(indices, dim=-1).squeeze().numpy()
# Attention Visualization
if vis_attn:
target_layer = 12
x = model.note_embed(X)
for ii in range(target_layer):
x, attn = model.layers[ii](x)
attn = F.normalize(attn)
# print(attn.shape)
attn = attn.detach().numpy()[0]
fig, ax = plt.subplots(2, 4)
for ii in range(8):
sns.heatmap(attn[ii], ax=ax[ii // 4, ii % 4], square=True, cmap="YlGnBu")
ax[ii // 4, ii % 4].set_title(f"Head {ii+1}")
plt.show()
# Generate music
if gen_midi:
midi = muspy.Music(tempos=[muspy.Tempo(0, 60)], resolution=1000)
midi.tracks.append(muspy.Track())
current_time = 0
for i, output in enumerate(indices):
octave = output[0]
pitch = output[1]
s_duration = output[2] * 20
m_duration = output[3] * 200
l_duration = output[4] * 2000
velocity = output[5] * 8 + 4
s_shift = output[6] * 20
l_shift = output[7] * 400
note = muspy.Note(
current_time,
20 + octave * 12 + pitch,
s_duration + m_duration + l_duration,
velocity,
)
if i < 1000:
print(note)
midi.tracks[0].append(note)
current_time += s_shift + l_shift
midi.write_midi(f"Generated-{time.time():2.2f}.mid")