forked from teddykoker/pedalnet
-
Notifications
You must be signed in to change notification settings - Fork 9
/
plot_wav.py
134 lines (113 loc) · 5.13 KB
/
plot_wav.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
import matplotlib.pyplot as plt
import numpy as np
#import wave
from scipy.io import wavfile
import sys
from scipy import signal
import argparse
import struct
def error_to_signal(y, y_pred, use_filter=1):
    """
    Error to signal ratio with pre-emphasis filter:
    https://www.mdpi.com/2076-3417/10/3/766/htm

    Computes sum((y - y_pred)^2) / (sum(y^2) + 1e-10).

    Args:
        y: Array-like reference signal.
        y_pred: Array-like predicted signal, same shape as ``y``.
        use_filter: When equal to 1, both signals are passed through
            ``pre_emphasis_filter`` before the ratio is computed.

    Returns:
        The error to signal ratio as a NumPy float.
    """
    # Convert to float64 first: integer sample arrays would otherwise wrap
    # around silently when subtracted or squared.
    y = np.asarray(y, dtype=np.float64)
    y_pred = np.asarray(y_pred, dtype=np.float64)
    if use_filter == 1:
        y, y_pred = pre_emphasis_filter(y), pre_emphasis_filter(y_pred)
    error_energy = np.sum(np.square(y - y_pred))
    signal_energy = np.sum(np.square(y))
    # The small constant is added once, only to keep the division defined
    # for an all-zero reference signal.
    return error_energy / (signal_energy + 1e-10)
def pre_emphasis_filter(x, coeff=0.95):
    """
    Apply a first-order pre-emphasis filter along the first axis.

    Computes y[0] = x[0] and y[n] = x[n] - coeff * x[n - 1] for n >= 1, so
    the output has the same length as the input.

    Args:
        x: Array-like of samples. It is converted to float64 so integer
            input cannot overflow.
        coeff: Weight of the previous sample that is subtracted from each
            sample.

    Returns:
        A float64 NumPy array with the same shape as ``x``.
    """
    x = np.asarray(x, dtype=np.float64)
    # The first sample has no predecessor and is passed through unchanged.
    return np.concatenate([x[:1], x[1:] - coeff * x[:-1]])
def read_wave(wav_file):
    """
    Load a wav file with scipy's wavfile reader.

    Returns the pair (samples, sample_rate), i.e. the audio data first and
    the frame rate second.
    """
    sample_rate, samples = wavfile.read(wav_file)
    return samples, sample_rate
def analyze_pred_vs_actual(args):
    """
    Generate plots to analyze the predicted signal vs the actual signal.

    Args:
        args: Object providing these attributes:
            output_wav : path of the actual signal wav file
            pred_wav   : path of the predicted signal wav file
            input_wav  : path of the pre-effect signal wav file
            model_name : prefix used for the generated .png file names
            show_plots : 1 to show the plots, otherwise only the .png
                         files are written

    What it does:
        1. Plots the input, actual and predicted signals.
        2. Calculates and prints the error to signal ratio (with and
           without the pre-emphasis filter) using error_to_signal.
        3. Plots abs(pred_signal - actual_signal) over time.
        4. Plots the spectrogram of (pred_signal - actual_signal) to show
           which frequencies carry the error.

    Files written (current working directory):
        <model_name>_signal_comparison_e2s_<e2s>.png
        <model_name>_Detail_signal_comparison_e2s_<e2s>.png
        <model_name>_diff_spectrogram.png
    """
    output_wav = args.output_wav
    pred_wav = args.pred_wav
    input_wav = args.input_wav
    model_name = args.model_name
    show_plots = args.show_plots

    input_sig, input_fs = read_wave(input_wav)
    actual_raw, actual_fs = read_wave(output_wav)
    pred_raw, pred_fs = read_wave(pred_wav)

    # All arithmetic is done in float64 so that integer sample data cannot
    # wrap around when the two signals are subtracted.
    # assumes mono (1-D) sample arrays — TODO confirm against test.py output
    actual = np.asarray(actual_raw, dtype=np.float64)
    pred = np.asarray(pred_raw, dtype=np.float64)

    input_time = np.linspace(0, len(input_sig) / input_fs, num=len(input_sig))
    actual_time = np.linspace(0, len(actual) / actual_fs, num=len(actual))
    pred_time = np.linspace(0, len(pred) / pred_fs, num=len(pred))

    fig, (ax_input, ax_compare, ax_error) = plt.subplots(
        3, sharex=True, figsize=(13, 8)
    )

    # Actual vs predicted signal
    ax_compare.plot(actual_time, actual, label=output_wav, color='red')
    ax_compare.plot(pred_time, pred, label=pred_wav, color='green')
    ax_compare.legend(loc='upper right')
    ax_compare.set_xlabel("Time (s)")
    ax_compare.set_ylabel("Amplitude")
    ax_compare.set_title("Wav File Comparison")
    ax_compare.grid(True)

    # Error to signal ratio, with and without the pre-emphasis filter
    e2s = error_to_signal(actual, pred)
    e2s_no_filter = error_to_signal(actual, pred, use_filter=0)
    print("Error to signal (with pre-emphasis filter): ", e2s)
    print("Error to signal (no pre-emphasis filter): ", e2s_no_filter)
    e2s_label = str(round(e2s, 4))
    fig.suptitle('Predicted vs Actual Signal (error to signal: ' + e2s_label + ')')

    # Absolute difference over time
    signal_diff = pred - actual
    ax_error.plot(pred_time, np.abs(signal_diff), label="signal diff", color='blue')
    ax_error.set_xlabel("Time (s)")
    ax_error.set_ylabel("Amplitude")
    ax_error.set_title("abs(pred_signal-actual_signal)")
    ax_error.grid(True)

    # Original (pre-effect) input signal
    ax_input.plot(input_time, input_sig, label=input_wav, color='purple')
    ax_input.legend(loc='upper right')
    ax_input.set_xlabel("Time (s)")
    ax_input.set_ylabel("Amplitude")
    ax_input.set_title("Original Input")
    ax_input.grid(True)

    # Save the full-length comparison
    plt.savefig(model_name + '_signal_comparison_e2s_' + e2s_label + '.png',
                bbox_inches='tight')

    # Zoomed-in view of 0.01 seconds centered on the maximum of the actual
    # signal. The peak index is looked up in that signal's own time axis so
    # it stays valid even if the input file has a different length or rate.
    # NOTE(review): plt.axis targets pyplot's current axes (presumably the
    # last subplot); the x-range reaches the others via sharex — confirm.
    peak_time = actual_time[np.argmax(actual)]
    y_low, y_high = pred.min(), pred.max()
    plt.axis([peak_time - .005, peak_time + 0.005, y_low, y_high])
    plt.savefig(model_name + '_Detail_signal_comparison_e2s_' + e2s_label + '.png',
                bbox_inches='tight')

    # Reset the axis to the full time range
    plt.axis([0, input_time[-1], y_low, y_high])

    # Spectrogram of the difference, using the sample rate read from the
    # wav file rather than a fixed value.
    plt.figure(figsize=(12, 8))
    print("Creating spectrogram data..")
    frequencies, times, spectrogram = signal.spectrogram(signal_diff, actual_fs)
    plt.pcolormesh(times, frequencies, 10*np.log10(spectrogram))
    plt.colorbar()
    plt.title("Diff Spectrogram")
    plt.ylabel('Frequency [Hz]')
    plt.xlabel('Time [sec]')
    plt.savefig(model_name + '_diff_spectrogram.png', bbox_inches='tight')

    # show_plots may arrive as a string (e.g. "1") when it comes straight
    # from the command line, so compare its integer value.
    try:
        should_show = int(show_plots) == 1
    except (TypeError, ValueError):
        should_show = False
    if should_show:
        plt.show()
if __name__ == "__main__":
    # Command-line entry point: collect the wav file paths and plot options,
    # then run the analysis.
    parser = argparse.ArgumentParser(
        description="Plot and compare a predicted wav signal against the actual one."
    )
    parser.add_argument("--output_wav", default="y_test.wav",
                        help="wav file with the actual signal")
    parser.add_argument("--pred_wav", default="y_pred.wav",
                        help="wav file with the predicted signal")
    parser.add_argument("--input_wav", default="x_test.wav",
                        help="wav file with the pre-effect input signal")
    parser.add_argument("--model_name", default='plot',
                        help="prefix for the generated .png file names")
    # type=int is required: without it a value given on the command line is
    # a string and never compares equal to the integer 1.
    parser.add_argument("--show_plots", type=int, default=1,
                        help="1 to show the plots, 0 to only write the .png files")
    args = parser.parse_args()
    analyze_pred_vs_actual(args)