learning-to-learn/complexity.py at main · TimeDelta/learning-to-learn · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
import math

import numpy as np
from astropy.stats import bayesian_blocks
from pyentrp import entropy
from scipy.stats import kurtosis, skew
from sklearn.neighbors import NearestNeighbors

# TODO: numpy, sklearn imports together causing:
#   /usr/local/lib/python3.8/site-packages/threadpoolctl.py:1214: RuntimeWarning:
#   Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
#   the same time. Both libraries are known to be incompatible and this
#   can cause random crashes or deadlocks on Linux when loaded in the
#   same Python program.
#   Using threadpoolctl may cause crashes or deadlocks. For more
#   information and possible workarounds, please see
#       https://github.com/joblib/threadpoolctl/blob/master/multiple_openmp.md


SERIES_STATS = [
    # lambda to map a set of sample time series into single value
    # aggregated per series then per state then per feature
    lambda samples: np.mean(np.median(np.ptp(samples, axis=0), axis=0)),
    lambda samples: np.mean(np.median(np.percentile(samples, 75, axis=0) - np.percentile(samples, 25, axis=0), axis=0)),
    lambda samples: np.mean(np.median(np.mean(samples, axis=0), axis=0)),
    lambda samples: np.mean(np.median(np.std(samples, axis=0), axis=0)),
    lambda samples: np.mean(np.median([skew(series) for series in samples], axis=0)),
    lambda samples: np.mean(np.median([kurtosis(series) for series in samples], axis=0)),
    lambda samples: np.median(
        [
            np.median(
                NearestNeighbors(n_neighbors=2)
                .fit(samples[:, :, i])
                .kneighbors(samples[:, :, i], return_distance=True)[0][:, 1]
            )
            for i in range(samples.shape[2])
        ]
    ),
    lambda samples: np.median(hurst_exponent(samples)),
    lambda samples: np.median(lempel_ziv_complexity_continuous(samples, quantize_signal_bayesian_block_feature_bins)),
    lambda samples: np.median(optimized_multiscale_permutation_entropy(samples)),
    lambda samples: np.median(differential_entropy(samples, quantize_signal_bayesian_block_feature_bins)),
]


def differential_entropy(data, quantizer):
    discrete_signals = quantizer(data)
    entropies = []
    for discrete_signal in discrete_signals:
        hist, _ = np.histogram(discrete_signal, density=True)
        nonzero = hist > 0
        entropies.append(-np.sum(hist[nonzero] * np.log(hist[nonzero])) / np.log(len(np.unique(discrete_signal))))
    return entropies


def lempel_ziv_complexity_continuous(data, quantizer):
    symbol_seqs = quantizer(data)
    complexities = []
    for symbol_seq in symbol_seqs:
        phrase_start = 0
        complexity = 0
        while phrase_start < len(symbol_seq):
            phrase_length = 1
            while True:
                # so that a substring of target phrase length sits entirely before phrase_start
                max_prefix_start = phrase_start - phrase_length + 1

                if max_prefix_start > 0:
                    # all substrings of phrase_length in the prefix [0 : phrase_start]
                    previous_substrings = {tuple(symbol_seq[k : k + phrase_length]) for k in range(max_prefix_start)}
                else:
                    previous_substrings = set()

                end_of_candidate = phrase_start + phrase_length

                # does it still perfectly match something in the prefix?
                if (
                    end_of_candidate <= len(symbol_seq)
                    and tuple(symbol_seq[phrase_start:end_of_candidate]) in previous_substrings
                ):
                    phrase_length += 1
                    continue
                else:
                    break
            complexity += 1
            phrase_start += phrase_length
        alphabet_size = len(np.unique(symbol_seq))
        max_complexity = len(symbol_seq) / np.emath.logn(alphabet_size, len(symbol_seq))
        complexities.append(complexity / max_complexity)
    return complexities


def _hurst_exponent_1d(data):
    """
    slope of log-log regression
    """
    RS = []
    # use logspace for mixed local / ranged correlation structure
    window_sizes = np.unique(np.floor(np.logspace(1, int(np.log10(data.shape[0] // 2)), num=20)).astype(int))
    window_sizes = window_sizes[window_sizes > 0]
    for window in window_sizes:
        n_segments = len(data) // window
        RS_vals = []
        for i in range(n_segments):
            segment = data[i * window : (i + 1) * window]
            mean_seg = np.mean(segment)
            Y = segment - mean_seg
            cumulative_Y = np.cumsum(Y)
            R = np.max(cumulative_Y) - np.min(cumulative_Y)
            S = np.std(segment)
            if S != 0:
                RS_vals.append(R / S)
        if RS_vals:
            RS.append(np.mean(RS_vals))
    if len(RS) == 0:
        raise ValueError("No valid RS values computed; check window sizes and data.")
    logs = np.log(window_sizes[: len(RS)])
    log_RS = np.log(RS)
    mask = np.isfinite(logs) & np.isfinite(log_RS)
    logs, log_RS = logs[mask], log_RS[mask]
    cov = np.cov(logs, log_RS, bias=True)
    slope = cov[0, 1] / cov[0, 0]
    return slope


def hurst_exponent(data):
    if data.ndim == 1:
        return _hurst_exponent_1d(data)
    # compute separately for each feature (column)
    n_features = data.shape[-1]
    hurst_vals = []
    for f_i in range(n_features):
        col = data[..., f_i]
        hurst_vals.append(_hurst_exponent_1d(col))
    return hurst_vals


def optimized_multiscale_permutation_entropy(data) -> float:
    """
    Compute the mean Multiscale Permutation Entropy (MPE) over:
      - orders m = 2 and 3 (averaged)
      - delays swept from min_delay to max_delay (averaged)
      - scale fixed to 3
    """
    scale = 3

    def single_feature(feature_series):
        mpe_vals = []
        for order in [2, 3]:  # Orders to average over (maintains N ≫ m! guideline)
            for delay in delays:
                mpe = entropy.multiscale_permutation_entropy(feature_series, order, delay, scale) / np.log2(
                    math.factorial(order)
                )
                mpe_vals.append(mpe.mean())
        return float(np.mean(mpe_vals))

    entropies = []
    for time_series in data:
        delays = list(range(1, time_series.shape[0] // 20))
        if time_series.ndim == 1:
            return single_feature(time_series)
        per_feature = []
        for f_i in range(time_series[0].shape[0]):
            per_feature.append(single_feature(time_series[:, f_i]))
        entropies.append(np.mean(per_feature))
    return entropies


def quantize_signal_bayesian_block_feature_bins(data):
    def quantize_features(data):
        n_features = data.shape[-1]
        quantized_features = []
        bases = []

        # quantize each feature and record its number of bins
        for i in range(n_features):
            edges = bayesian_blocks(data[:, i])
            quantized_features.append(np.digitize(data[:, i], edges) - 1)
            bases.append(len(edges))

        quantized_features = np.stack(quantized_features, axis=1)
        bases = np.array(bases, dtype=int)

        # compute mixed‑radix weights: product of previous bases
        # weights[0] = 1, weights[i] = prod(bases[:i])
        weights = np.cumprod(np.concatenate(([1], bases[:-1])))
        composite_symbols = np.sum(quantized_features * weights, axis=1)
        return composite_symbols.tolist()

    if data.ndim == 1:
        edges = bayesian_blocks(data)
        quantized = np.digitize(data, edges) - 1
        return quantized.tolist()
    elif data.ndim == 2:
        return quantize_features(data)
    elif data.ndim == 3:
        discrete = []
        for sample in data:
            discrete.append(quantize_features(sample))
        return discrete
    else:
        raise ValueError("Data must be 1D, 2D or 3D.")