... | ... | @@ -37,9 +37,86 @@ The scales are very different. However, the spectrograms are normalized before b |
|
|
|
|
|
ok.
|
|
|
|
|
|
|
|
|
### case 1
|
|
|
|
|
|

|
|
|
|
|
|

|
|
|
|
|
|
|
|
|

|
|
|
|
|
|
|
|
|
### case 2
|
|
|
|
|
|

|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# code
|
|
|
```
|
|
|
try_index = 954 # 2841 # 5519 # 2841
|
|
|
#a = map_stft(y_tns[try_index: try_index + 1].float()) # extracted
|
|
|
a = map_stft(y_tns_ds[try_index: try_index + 1].float()) # downsampled
|
|
|
b = (a[:, :, :, 0] ** 2 + a[:, :, :, 1] ** 2) ** 0.5
|
|
|
d = b[0].numpy()
|
|
|
time_resolution_step = np.linspace(0, chopped_duration, d.shape[-1], endpoint=False)
|
|
|
freq_resolution_step = np.linspace(0, target_sample_rate / 2, d.shape[0], endpoint=False)
|
|
|
print('Time resolution in the image: {:.4f} sec'.format(time_resolution_step[1] - time_resolution_step[0]))
|
|
|
print('Frequency resolution in the image: {:.4f} Hz'.format(freq_resolution_step[1] - freq_resolution_step[0]))
|
|
|
|
|
|
im = plt.imshow(d, origin='lower', cmap='OrRd', aspect='auto', vmax=np.percentile(d, 99.))
|
|
|
cbar = plt.colorbar(im)
|
|
|
plt.title("strian, max = {}".format(np.amax(d)))
|
|
|
plt.xticks(np.linspace(0, d.shape[-1], 5), np.linspace(0, chopped_duration, 5, endpoint=True))
|
|
|
plt.yticks(np.linspace(0, d.shape[0], 5), np.linspace(0, target_sample_rate / 2, 5, endpoint=True))
|
|
|
plt.savefig('test.png')
|
|
|
plt.close()
|
|
|
print(d.shape)
|
|
|
|
|
|
|
|
|
#a = map_stft(y_tns[try_index: try_index + 1].float()) # extracted
|
|
|
a = map_stft(X3_tns[try_index: try_index + 1].float()) # downsampled
|
|
|
b = (a[:, :, :, 0] ** 2 + a[:, :, :, 1] ** 2) ** 0.5
|
|
|
d = b[0].numpy()
|
|
|
time_resolution_step = np.linspace(0, chopped_duration, d.shape[-1], endpoint=False)
|
|
|
freq_resolution_step = np.linspace(0, target_sample_rate / 2, d.shape[0], endpoint=False)
|
|
|
print('Time resolution in the image: {:.4f} sec'.format(time_resolution_step[1] - time_resolution_step[0]))
|
|
|
print('Frequency resolution in the image: {:.4f} Hz'.format(freq_resolution_step[1] - freq_resolution_step[0]))
|
|
|
|
|
|
im = plt.imshow(d, origin='lower', cmap='OrRd', aspect='auto', vmax=np.percentile(d, 99.))
|
|
|
cbar = plt.colorbar(im)
|
|
|
plt.title("X3, max = {}".format(np.amax(d)))
|
|
|
plt.xticks(np.linspace(0, d.shape[-1], 5), np.linspace(0, chopped_duration, 5, endpoint=True))
|
|
|
plt.yticks(np.linspace(0, d.shape[0], 5), np.linspace(0, target_sample_rate / 2, 5, endpoint=True))
|
|
|
plt.savefig('test.png')
|
|
|
plt.close()
|
|
|
print(d.shape)
|
|
|
|
|
|
|
|
|
plt.plot(d.flatten())
|
|
|
plt.axhline(np.percentile(d, 99), c='black', ls='--')
|
|
|
plt.xlabel('pixels')
|
|
|
plt.savefig('test.png')
|
|
|
plt.close()
|
|
|
|
|
|
#f, t, Zxx = signal.stft(y_chopped[try_index: try_index + 1], fs=target_sample_rate, nperseg=None) # extraced
|
|
|
f, t, Zxx = signal.stft(y_ds_chopped[try_index: try_index + 1], fs=target_sample_rate, nperseg=None) # downsampled
|
|
|
d = np.abs(Zxx[0])
|
|
|
im = plt.imshow(np.abs(d), origin='lower', cmap='OrRd', aspect='auto', vmax=np.percentile(np.abs(d), 99.))
|
|
|
cbar = plt.colorbar(im)
|
|
|
plt.title("strian, max = {}".format(np.amax(np.abs(d))))
|
|
|
plt.xticks(np.linspace(0, d.shape[-1], 5), np.linspace(0, chopped_duration, 5, endpoint=True))
|
|
|
plt.yticks(np.linspace(0, d.shape[0], 5), np.linspace(0, target_sample_rate / 2, 5, endpoint=True))
|
|
|
plt.savefig('test.png')
|
|
|
plt.close()
|
|
|
print(d.shape)
|
|
|
|
|
|
plt.plot(d.flatten())
|
|
|
plt.axhline(np.percentile(d, 99), c='black', ls='--')
|
|
|
plt.xlabel('pixels')
|
|
|
plt.savefig('test.png')
|
|
|
plt.close()
|
|
|
``` |
|
|
\ No newline at end of file |