forked from felixkreuk/HideAndSpeak
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathadd_noise.py
96 lines (81 loc) · 3.51 KB
/
add_noise.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
from os.path import join
import os
import numpy as np
import soundfile as sf
import random
from boltons import fileutils
import argparse
### ADD DIFFERENT TYPES OF NOISE ON TENSOR ###
def generate_gaussian_noise(tensor, noise_norm, mean=0.0, stddev=1.0):
return tensor + noise_norm * tensor.data.new(tensor.size()).normal_(mean, stddev)
def generate_speckle_noise(tensor, noise_norm, mean=0.0, stddev=1.0):
return tensor * (1 + noise_norm * tensor.data.new(tensor.size()).normal_(mean, stddev))
def generate_salt_and_pepper_noise(tensor, prob=0.05):
mx, mn = tensor.max(), tensor.min()
rnd = tensor.data.new(tensor.size()).uniform_(0, 1)
tensor[rnd < prob/2] = mx
tensor[rnd > 1 - prob/2] = mn
return tensor
def generate_salt_noise(tensor, prob=0.05):
mx, mn = tensor.max(), tensor.min()
rnd = tensor.data.new(tensor.size()).uniform_(0, 1)
tensor[rnd < prob] = mx
return tensor
def generate_pepper_noise(tensor, prob=0.05):
mx, mn = tensor.max(), tensor.min()
rnd = tensor.data.new(tensor.size()).uniform_(0, 1)
tensor[rnd > 1 - prob] = mn
return tensor
def add_noise(tensor, noise_type, noise_norm=0.01):
if noise_type == 'gaussian':
return generate_gaussian_noise(tensor, noise_norm)
elif noise_type == 'salt':
return generate_salt_noise(tensor, noise_norm)
elif noise_type == 'pepper':
return generate_pepper_noise(tensor, noise_norm)
elif noise_type == 'snp':
return generate_salt_and_pepper_noise(tensor, noise_norm)
elif noise_type == 'speckle':
return generate_speckle_noise(tensor, noise_norm)
else:
raise Exception(f"Noise type '{noise_type}' not implemented!")
### ADD WAV AS BACKGROUND NOISE ###
def inject_noise_sample(data_path, noise_path, noise_level):
data, sr = sf.read(data_path)
noise, sr = sf.read(noise_path)
noise_len = len(noise)
data_len = len(data)
if noise_len > data_len:
diff = noise_len-data_len
noise_start = random.randint(0, diff - 1)
noise_end = noise_start + data_len
noise = noise[noise_start:noise_end]
noise_len = len(noise)
data_len = len(data)
start = int(np.random.rand() * (data_len - noise_len))
end = int(start + noise_len)
noise_energy = np.sqrt(noise.dot(noise) / noise.size)
data_energy = np.sqrt(data.dot(data) / data.size)
data[start:end] += noise_level * noise* data_energy / noise_energy
return data, sr
def inject_noise_sample_write(data_path, noise_path, target_path, noise_level):
data, sr = inject_noise_sample(data_path, noise_path, noise_level)
sf.write(target_path, data, sr)
def inject_noise_folder(wav_folder, noise_levels, n_items):
if type(noise_levels) == float:
noise_levels = [noise_levels]
trg_dir = join(wav_folder, 'out')
os.makedirs(trg_dir, exist_ok=True)
wavs = list(fileutils.iter_find_files(wav_folder, "*.wav"))
for noise_level in noise_levels:
for i in range(n_items):
w1, w2 = random.sample(wavs, 2)
inject_noise_sample(w1, w2, join(trg_dir, f"{i}_{noise_level}_noise.wav"), noise_level)
if __name__ == '__main__':
parser = argparse.ArgumentParser(description='')
parser.add_argument('--wav_folder', type=str, help='')
parser.add_argument('--noise_levels', type=str, help='')
parser.add_argument('--n_items', type=int, help='')
args = parser.parse_args()
args.noise_levels = list(map(float, args.noise_levels.split(',')))
inject_noise_folder(args.wav_folder, args.noise_levels, args.n_items)