forked from neuropsychology/NeuroKit
-
Notifications
You must be signed in to change notification settings - Fork 0
/
entropy_increment.py
122 lines (97 loc) · 5.05 KB
/
entropy_increment.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
import numpy as np
import pandas as pd
from .utils_complexity_embedding import complexity_embedding
from .entropy_shannon import entropy_shannon
def entropy_increment(signal, dimension=2, q=4, **kwargs):
    """**Increment Entropy (IncrEn) and its Multiscale variant (MSIncrEn)**

    Increment Entropy (IncrEn) quantifies the magnitudes of the variations between adjacent
    elements into ranks based on a precision factor *q* and the standard deviation of the time
    series. IncrEn is conceptually similar to :func:`permutation entropy <entropy_permutation>` in
    that it also uses the concepts of symbolic dynamics.

    In the IncrEn calculation, two letters are used to describe the relationship between adjacent
    elements in a time series. One letter represents the volatility direction, and the other
    represents the magnitude of the variation between the adjacent elements.

    The time series is reconstructed into vectors of *m* elements. Each element of each vector
    represents the increment between two neighbouring elements in the original time series.
    Each increment element is mapped to a word consisting of two letters (one letter represents
    the volatility direction, and the other represents the magnitude of the variation between
    the adjacent elements), and then, each vector is described as a symbolic (discrete) pattern.
    The :func:`Shannon entropy <entropy_shannon>` of the probabilities of independent patterns is
    then computed.

    Parameters
    ----------
    signal : Union[list, np.array, pd.Series]
        The signal (i.e., a time series) in the form of a vector of values.
    dimension : int
        Embedding Dimension (*m*, sometimes referred to as *d* or *order*). See
        :func:`complexity_dimension` to estimate the optimal value for this parameter. The result
        is normalized by ``dimension - 1``, so values below 2 do not yield a meaningful entropy.
    q : float
        The quantifying resolution *q* represents the precision of *IncrEn*, with larger values
        indicating a higher precision, causing IncrEn to be more sensitive to subtle fluctuations.
        The IncrEn value increases with increasing *q*, until reaching a plateau. This property can
        be useful to selecting an optimal *q* value.
    **kwargs : optional
        Other keyword arguments, such as the logarithmic ``base`` to use for
        :func:`entropy_shannon`. They are forwarded to both the time-delay embedding and the
        Shannon entropy computation.

    Returns
    --------
    incren : float
        The Increment Entropy of the signal.
    info : dict
        A dictionary containing the parameters used to compute the entropy (``Dimension`` and
        ``q``).

    Raises
    ------
    ValueError
        If ``signal`` is a NumPy array or a pandas DataFrame with more than one dimension.

    See Also
    --------
    entropy_shannon, entropy_multiscale

    Examples
    ----------
    .. ipython:: python

      import neurokit2 as nk

      # Simulate a Signal
      signal = nk.signal_simulate(duration=2, sampling_rate=200, frequency=[5, 6], noise=0.5)

      # IncrEn
      incren, _ = nk.entropy_increment(signal, dimension=3, q=2)
      incren

      # Multiscale IncrEn (MSIncrEn)
      @savefig p_entropy_increment1.png scale=100%
      msincren, _ = nk.entropy_multiscale(signal, method="MSIncrEn", show=True)
      @suppress
      plt.close()

    References
    -----------
    * Liu, X., Jiang, A., Xu, N., & Xue, J. (2016). Increment entropy as a measure of complexity
      for time series. Entropy, 18(1), 22.
    * Liu, X., Jiang, A., Xu, N., & Xue, J. (2016). Correction on Liu, X.; Jiang, A.; Xu, N.; Xue,
      J. Increment Entropy as a Measure of Complexity for Time Series. Entropy 2016, 18, 22.
      Entropy, 18(4), 133.
    * Liu, X., Wang, X., Zhou, X., & Jiang, A. (2018). Appropriate use of the increment entropy for
      electrophysiological time series. Computers in Biology and Medicine, 95, 13-23.

    """
    # Sanity checks
    if isinstance(signal, (np.ndarray, pd.DataFrame)) and signal.ndim > 1:
        raise ValueError(
            "Multidimensional inputs (e.g., matrices or multichannel data) are not supported yet."
        )

    # Store parameters
    info = {"Dimension": dimension, "q": q}

    # Time-embedding of the consecutive differences ("increment series")
    embedded = complexity_embedding(np.diff(signal), dimension=dimension, **kwargs)

    # The sign indicates the direction of the volatility between the corresponding neighbouring
    # elements in the original time series; it takes values of 1, 0, or -1, indicating a rise, no
    # change, or a decline
    sign = np.sign(embedded)

    # The size describes the magnitude of the variation between these adjacent elements, expressed
    # in units of the (sample) standard deviation of each embedded vector and capped at q.
    # The (N, 1) standard deviation broadcasts across the columns of the embedded matrix.
    spread = np.std(embedded, axis=1, ddof=1, keepdims=True)
    is_flat = spread[:, 0] == 0
    # Vectors with zero standard deviation would divide by zero; silence the resulting warnings
    # because those rows are explicitly overwritten with 0 just below.
    with np.errstate(divide="ignore", invalid="ignore"):
        size = np.minimum(q, np.floor(np.abs(embedded) * q / spread))
    size[is_flat, :] = 0

    # Each element in each vector is mapped to a word consisting of the sign and the size
    words = sign * size

    # Get probabilities of occurrence of each distinct pattern (row) in a single pass
    _, counts = np.unique(words, axis=0, return_counts=True)
    freq = counts / np.sum(counts)

    # Compute entropy
    incren, _ = entropy_shannon(freq=freq, **kwargs)

    # Normalize
    incren = incren / (dimension - 1)

    return incren, info