-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathsample_data.py
109 lines (81 loc) · 3.94 KB
/
sample_data.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
import itertools
import numpy as np
from keras.preprocessing.sequence import pad_sequences
def phase_to_sin_cos(Y):
    """Reparametrize sinusoid parameters from phase form to sin/cos form.

    Each row of `Y` is ``(w, A, phi, b)``; each row of the result is
    ``(p, A_cos, A_sin, b)`` with ``p = 1 / w``, ``A_cos = A * sin(phi)`` and
    ``A_sin = A * cos(phi)``.  These are the coefficients of the expansion
    ``A * sin(x + phi) = A_cos * cos(x) + A_sin * sin(x)``.

    Estimating these parameters seems to be easier in practice.
    """
    freq, amplitude, phase, offset = Y.T
    period = freq ** -1
    cos_coeff = amplitude * np.sin(phase)
    sin_coeff = amplitude * np.cos(phase)
    return np.column_stack((period, cos_coeff, sin_coeff, offset))
def _random_times(N, even=True, t_max=4 * np.pi, n_min=None, n_max=None, t_shape=2, t_scale=0.05):
    """Generate sampling times for `N` time series.

    Parameters
    ----------
    N : int
        Number of series.
    even : bool
        If true, every series shares one evenly spaced grid of `n_max` points
        on ``[0, t_max]``.  Otherwise each series gets its own irregular times
        built from cumulative Pareto-distributed lags.
    t_max : float
        Right end of the even grid.  Not used when `even` is false.
    n_min, n_max : int or None
        Bounds on the number of points per series.  If only one is given the
        other defaults to the same value.
    t_shape, t_scale : float
        Shape passed to ``np.random.pareto`` and multiplier applied to the
        resulting lags (uneven sampling only).

    Returns
    -------
    numpy.ndarray of shape ``(N, n_max)`` when `even` is true; otherwise a
    list of `N` 1-D arrays, each starting at 0 and holding between `n_min`
    and `n_max` non-decreasing times.

    Raises
    ------
    ValueError
        If both `n_min` and `n_max` are None.
    """
    if n_min is None and n_max is None:
        raise ValueError("Either n_min or n_max is required.")
    if n_min is None:
        n_min = n_max
    elif n_max is None:
        n_max = n_min

    if even:
        return np.tile(np.linspace(0., t_max, n_max), (N, 1))

    times = []
    for _ in range(N):
        n_points = np.random.randint(n_min, n_max + 1)
        # A series of n_points samples has n_points - 1 gaps; drawing n_points
        # lags and prepending 0 would yield one sample too many (up to
        # n_max + 1), so draw one lag fewer.
        lags = t_scale * np.random.pareto(t_shape, size=max(n_points - 1, 0))
        times.append(np.r_[0, np.cumsum(lags)])
    return times
def _periodic_params(N, A_min, A_max, w_min, w_max):
    """Draw random parameters for `N` periodic signals.

    Returns a tuple ``(w, A, phi, b)`` of length-`N` arrays:

    * ``w``   -- frequency; the period ``1 / w`` is sampled uniformly on
      ``[1 / w_max, 1 / w_min)`` and then inverted.
    * ``A``   -- amplitude, uniform on ``[A_min, A_max)``.
    * ``phi`` -- phase, uniform on ``[0, 2*pi)``.
    * ``b``   -- offset, normal with unit scale.
    """
    period = np.random.uniform(1. / w_max, 1. / w_min, size=N)
    freq = 1. / period
    amplitude = np.random.uniform(A_min, A_max, size=N)
    unit_phase = np.random.random(size=N)
    phase = 2 * np.pi * unit_phase
    offset = np.random.normal(scale=1, size=N)
    return freq, amplitude, phase, offset
def _sinusoid(w, A, phi, b):
    """Return a function ``t -> A * sin(2*pi*w*t + phi) + b``."""
    def wave(t):
        angle = 2 * np.pi * w * t + phi
        return A * np.sin(angle) + b
    return wave
def _square(w, A, phi, b):
    """Return a square wave: the sign of the matching sinusoid, scaled by `A`.

    The returned function maps ``t`` to ``A * sign(sin(2*pi*w*t + phi)) + b``,
    so it equals ``b`` exactly where the underlying sine is zero.
    """
    def wave(t):
        carrier = np.sin(2 * np.pi * w * t + phi)
        return A * np.sign(carrier) + b
    return wave
def _sawtooth(w, A, phi, b):
    """Return a sawtooth wave of frequency `w` taking values in ``[b - A, b + A)``.

    `phi` is accepted so the signature matches the other wave builders, but
    it is not used: the wave always passes through ``b`` at ``t = 0``.
    """
    def wave(t):
        cycles = w * t
        # Distance from the nearest whole cycle, in [-0.5, 0.5).
        frac = cycles - np.floor(0.5 + cycles)
        return 2 * A * frac + b
    return wave
def _triangular(w, A, phi, b):
    """Return a triangle wave of frequency `w` taking values in ``[b - A, b + A]``.

    `phi` is accepted so the signature matches the other wave builders, but
    it is not used: the wave is always at its minimum ``b - A`` at ``t = 0``.
    """
    def wave(t):
        cycles = w * t
        # Absolute distance from the nearest whole cycle, in [0, 0.5].
        dist = np.abs(cycles - np.floor(0.5 + cycles))
        return 4 * A * dist - A + b
    return wave
def periodic(N, n_min, n_max, t_max=4 * np.pi, even=True, A_min=0.5, A_max=2.0,
             noise_sigma=0., w_min=0.1, w_max=1., t_shape=2, t_scale=0.05,
             kind='sinusoid'):
    """Generate `N` noisy periodic time series with random parameters.

    Sampling times come from ``_random_times`` and the wave parameters from
    ``_periodic_params``.  `kind` selects the waveform: ``'sinusoid'``,
    ``'square'``, ``'triangular'``, ``'sawtooth'``, or ``'mixed'`` to cycle
    through all four in shuffled order.

    Returns
    -------
    X : array
        Copy of `X_raw` with Gaussian noise of scale ``noise_sigma + 1e-9``
        added to channel 1 (the values).
    Y : array
        One row ``(freq, amplitude, phase, offset)`` per series.
    X_raw : array
        Noise-free ``(time, value)`` sequences passed through
        ``pad_sequences`` with ``maxlen=n_max``, NaN fill and post-padding.
    labels : array of str
        Waveform name used for each series.
    """
    times = _random_times(N, even, t_max, n_min, n_max, t_shape, t_scale)
    w, A, phi, b = _periodic_params(N, A_min, A_max, w_min, w_max)

    generators = {'sinusoid': _sinusoid, 'square': _square,
                  'triangular': _triangular, 'sawtooth': _sawtooth}
    if kind != 'mixed':
        labels = np.repeat(kind, N)
    else:
        cycled_names = itertools.islice(itertools.cycle(generators.keys()), N)
        labels = np.array(list(cycled_names))
        np.random.shuffle(labels)

    series = []
    for i in range(N):
        signal = generators[labels[i]](w[i], A[i], phi[i], b[i])
        series.append(np.c_[times[i], signal(times[i])])

    X_raw = pad_sequences(series, maxlen=n_max, value=np.nan, dtype='float', padding='post')
    X = X_raw.copy()
    # The tiny constant keeps the noise scale strictly positive when
    # noise_sigma is 0.
    noise = np.random.normal(scale=noise_sigma + 1e-9, size=(N, n_max))
    X[:, :, 1] = X_raw[:, :, 1] + noise
    Y = np.c_[w, A, phi, b]
    return X, Y, X_raw, labels
def synthetic_control(N, n_min, n_max, t_max=None, even=True, sigma=2.):
    """Generate `N` random series, each drawn from one of six patterns.

    The patterns, indexed by the returned class label, are:
    0 noise around 30, 1 noise plus a sinusoid, 2 noise plus an upward
    linear trend, 3 noise plus a downward linear trend, 4 noise plus an
    upward step, 5 noise plus a downward step.  The noise is
    ``sigma * Uniform(-3, 3)``.

    Parameters
    ----------
    N : int
        Number of series.
    n_min, n_max : int
        Bounds on the number of samples per series.
    t_max : float or None
        Largest time of the even grid; defaults to ``float(n_max)``.
    even : bool
        Request evenly spaced samples.  Only honoured when
        ``n_min == n_max``; otherwise irregular times are generated.
    sigma : float
        Noise multiplier.

    Returns
    -------
    X : array
        Shape ``(N, n_max, 1)`` holding values only when sampling is even
        and ``n_min == n_max``.  Otherwise ``(time, value)`` sequences passed
        through ``pad_sequences`` with ``maxlen=n_max``, zero fill and
        post-padding.
    y : array of int, shape ``(N,)``
        Pattern index in ``0..5`` for each series.
    """
    if t_max is None:
        t_max = float(n_max)

    def base(t):
        return 30. + sigma * np.random.uniform(-3, 3, size=len(t))

    patterns = [base,
                lambda t: base(t) + (np.random.uniform(10, 15) *
                                     np.sin(2 * np.pi * t / np.random.uniform(10, 15))),
                lambda t: base(t) + np.random.uniform(0.2, 0.5) * t,
                lambda t: base(t) - np.random.uniform(0.2, 0.5) * t,
                lambda t: base(t) + ((t >= np.random.uniform(t_max / 3., 2. * t_max / 3.)) *
                                     np.random.uniform(7.5, 20)),
                lambda t: base(t) - ((t >= np.random.uniform(t_max / 3., 2. * t_max / 3.)) *
                                     np.random.uniform(7.5, 20))]
    y = np.random.randint(6, size=N)
    if even and n_min == n_max:
        t = np.linspace(0., t_max, n_max)
        X = np.asarray([patterns[y[i]](t) for i in range(N)]).reshape((-1, n_max, 1))
    else:
        # This branch previously called `random_uneven_times`, which is not
        # defined in this module; use the module's `_random_times` helper in
        # uneven mode instead.
        # NOTE(review): the helper's uneven mode does not use t_max, so the
        # lag scale is set to t_max / n_max (the mean of np.random.pareto with
        # shape 2 is 1) to keep the average spacing comparable to the even
        # grid -- confirm this matches the intended sampling.
        t = _random_times(N, even=False, t_max=t_max, n_min=n_min, n_max=n_max,
                          t_scale=t_max / max(n_max, 1))
        X = pad_sequences([np.c_[t[i], patterns[y[i]](t[i])] for i in range(N)], maxlen=n_max,
                          value=0., dtype='float', padding='post')
    return X, y