OSEkit/src/osekit/public_api/analysis.py at 9e96213c250ba1bd27b73c583b4eb803eb3f6254 · Project-OSmOSE/OSEkit · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
from __future__ import annotations

from enum import Flag, auto
from typing import TYPE_CHECKING, Literal

from scipy.signal import ShortTimeFFT

from osekit.utils.audio_utils import Normalization

if TYPE_CHECKING:
    from pandas import Timedelta, Timestamp

    from osekit.core_api.frequency_scale import Scale


class AnalysisType(Flag):
    """Enum of flags that should be use to specify the type of analysis to run.

    AUDIO:
        Will add an AudioDataset to the datasets and write the reshaped audio files
        to disk.
        The new AudioDataset will be linked to the reshaped audio files rather than to
        the original files.
    MATRIX:
        Will write the npz SpectroFiles to disk and link the SpectroDataset to
        these files.
    SPECTROGRAM:
        Will export the spectrogram png images.
    WELCH:
        Will write the npz welches to disk.

    Multiple flags can be enabled thanks to the logical or | operator:
    AnalysisType.AUDIO | AnalysisType.SPECTROGRAM will export both audio files and
    spectrogram images.

    >>> # Exporting both the reshaped audio and the spectrograms
    >>> # (without the npz matrices):
    >>> export = AnalysisType.AUDIO | AnalysisType.SPECTROGRAM
    >>> AnalysisType.AUDIO in export
    True
    >>> AnalysisType.SPECTROGRAM in export
    True
    >>> AnalysisType.MATRIX in export
    False

    """

    AUDIO = auto()
    MATRIX = auto()
    SPECTROGRAM = auto()
    WELCH = auto()


class Analysis:
    """Class that contains all parameter of an analysis.

    Analysis instances are passed to the public API dataset, which runs the analysis.
    The Analysis object contains all info on the analysis to be done: the type(s) of
    core_api dataset(s) that will be created and added to the Dataset.datasets property and
    which output files will be written to disk (reshaped audio files, npz spectra
    matrices, png spectrograms...) depend on the analysis_type parameter.
    The Analysis instance also contains the technical parameters of the analyses (begin/end times,
    sft, sample rate...).
    """

    def __init__(
        self,
        analysis_type: AnalysisType,
        begin: Timestamp | None = None,
        end: Timestamp | None = None,
        data_duration: Timedelta | None = None,
        mode: Literal["files", "timedelta_total", "timedelta_file"] = "timedelta_total",
        overlap: float = 0.0,
        sample_rate: float | None = None,
        normalization: Normalization = Normalization.RAW,
        name: str | None = None,
        subtype: str | None = None,
        fft: ShortTimeFFT | None = None,
        v_lim: tuple[float, float] | None = None,
        colormap: str | None = None,
        scale: Scale | None = None,
        nb_ltas_time_bins: int | None = None,
        zoom_levels: list[int] | None = None,
        zoom_ffts: list[ShortTimeFFT] | None = None,
    ) -> None:
        """Initialize an Analysis object.

        Parameters
        ----------
        analysis_type: AnalysisType
            The type of analysis to run.
            See AnalysisType docstring for more info.
        begin: Timestamp | None
            The begin of the analysis dataset.
            Defaulted to the begin of the original dataset.
        end: Timestamp | None
            The end of the analysis dataset.
            Defaulted to the end of the original dataset.
        data_duration: Timedelta | None
            Duration of the data within the analysis dataset.
            If provided, audio data will be evenly distributed between begin and end.
            Else, one data object will cover the whole time period.
        mode: Literal["files", "timedelta_total", "timedelta_file"]
            Mode of creation of the dataset data from the original files.
            "files": one data will be created for each file.
            "timedelta_total": data objects of duration equal to data_duration will
            be created from the begin timestamp to the end timestamp.
            "timedelta_file": data objects of duration equal to data_duration will
            be created from the beginning of the first file that the begin timestamp is into, until it would resume
            in a data beginning between two files. Then, the next data object will be created from the
            beginning of the next original file and so on.
        overlap: float
            Overlap percentage between consecutive data.
        sample_rate: float | None
            Sample rate of the new analysis data.
            Audio data will be resampled if provided, else the sample rate
            will be set to the one of the original dataset.
        normalization: Normalization
            The type of normalization to apply to the audio data.
        name: str | None
            Name of the analysis dataset.
            Defaulted as the begin timestamp of the analysis dataset.
            If both audio and spectro analyses are selected, the audio
            analysis dataset name will be suffixed with "_audio".
        subtype: str | None
            Subtype of the written audio files as provided by the soundfile module.
            Defaulted as the default 16-bit PCM for WAV audio files.
            This parameter has no effect if Analysis.AUDIO is not in analysis.
        fft: ShortTimeFFT | None
            FFT to use for computing the spectra.
            This parameter is mandatory if either Analysis.MATRIX
            or Analysis.SPECTROGRAM is in analysis.
            This parameter has no effect if neither Analysis.MATRIX
            nor Analysis.SPECTROGRAM is in the analysis.
        v_lim: tuple[float, float] | None
            Limits (in dB) of the colormap used for plotting the spectrogram.
            Has no effect if Analysis.SPECTROGRAM is not in analysis.
        colormap: str | None
            Colormap to use for plotting the spectrogram.
            Has no effect if Analysis.SPECTROGRAM is not in analysis.
        scale: osekit.core_api.frequecy_scale.Scale
            Custom frequency scale to use for plotting the spectrogram.
            Has no effect if Analysis.SPECTROGRAM is not in analysis.
        nb_ltas_time_bins: int | None
            If None, the spectrogram will be computed regularly.
            If specified, the spectrogram will be computed as LTAS, with the value
            representing the maximum number of averaged time bins.
        zoom_levels: list[int] | None
            If specified, additional analyses datasets will be created at the requested
            zoom levels.
            e.g. with a data_duration of 10s and zoom_levels = [2,4], 3 SpectroDatasets
            will be created, with data_duration = 5s and 2.5s.
            This will only affect spectral exports, and if AnalysisType.AUDIO is
            included in the analysis, zoomed SpectroDatasets will be linked to the
            x1 zoom SpectroData.
        zoom_ffts: list[ShortTimeFFT | None]
            FFT to use for computing the zoomed spectra.
            By default, SpectroDatasets with a zoomed factor z will use the
            same FFT as the z=1 SpectroDataset, but with a hop that is
            divided by z.

        """
        self.analysis_type = analysis_type
        self.begin = begin
        self.end = end
        self.data_duration = data_duration
        self.mode = mode
        self.overlap = overlap
        self.sample_rate = sample_rate
        self.name = name
        self.normalization = normalization
        self.subtype = subtype
        self.v_lim = v_lim
        self.colormap = colormap
        self.scale = scale
        self.nb_ltas_time_bins = nb_ltas_time_bins

        if self.is_spectro and fft is None:
            msg = "FFT parameter should be given if spectra outputs are selected."
            raise ValueError(msg)

        self.fft = fft
        self.zoom_levels = list({1, *zoom_levels}) if zoom_levels else None
        self.zoom_ffts = zoom_ffts

    @property
    def is_spectro(self) -> bool:
        """Return True if the analysis contains spectral computations, False otherwise."""
        return any(
            flag in self.analysis_type
            for flag in (
                AnalysisType.MATRIX,
                AnalysisType.SPECTROGRAM,
                AnalysisType.WELCH,
            )
        )