Source code for meganorm.src.featureExtraction

import numpy as np
import os
import sys
import tqdm
import json
import pickle
import argparse
import logging
import pyrasa
import fooof as f
import pandas as pd
from typing import Union
from typing import Dict, List
from abc import ABC, abstractmethod
from pyrasa.irasa_mne import irasa_epochs

# from layouts import load_specific_layout
from meganorm.layouts.layouts import load_specific_layout

logger = logging.getLogger(__name__)



[docs]
def abs_canonical_power(
    psd: np.ndarray, freqs: np.ndarray, fmin: Union[int, float], fmax: Union[int, float]
) -> float:
    """
    Calculates absolute canonical power of a frequency band from a power spectrum density (PSD).

    Parameters
    ----------
    psd : np.ndarray
        Power spectral density values (in linear scale).
    freqs : np.ndarray
        A 1D array of frequency values that were used to compute the PSD.
    fmin : Union[int, float]
        Lower bound of the frequency band
    fmax : Union[int, float]
        Upper bound of the frequency band.

    Returns
    -------
    float
        Log-transformed absolute power in the specified frequency band.

    Notes
    -------
    'psd' can be both original PSD or periodic PSD.
    """

    band_indices = np.logical_and(freqs >= fmin, freqs <= fmax)
    band_power = np.trapezoid(psd[band_indices], freqs[band_indices])

    return np.log10(band_power)




[docs]
def rel_canonical_power(
    psd: np.ndarray, freqs: np.ndarray, fmin: Union[int, float], fmax: Union[int, float]
) -> float:
    """
    Calculates relative canonical power of a frequency band from a power spectrum density.

    Parameters
    ----------
    psd : np.ndarray
        Power spectral density values (in linear scale).
    freqs : np.ndarray
        A 1D array of frequency values that were used to compute the PSD.
    fmin : Union[int, float]
        Lower bound of the frequency band.
    fmax : Union[int, float]
        Upper bound of the frequency band.

    Returns
    -------
    float
        Relative power in the specified frequency band. Returns np.nan if total power is zero.

    Notes
    -------
    'psd' can be both original PSD or periodic PSD.
    """

    band_indices = np.logical_and(freqs >= fmin, freqs <= fmax)
    band_power = np.trapezoid(psd[band_indices], freqs[band_indices])
    total_power = np.trapezoid(psd, freqs)

    if total_power == 0:
        return np.nan

    return band_power / total_power




[docs]
def abs_individual_power(psd, freqs, band_peaks, individualized_band_ranges, band_name):
    """Calculates absolute power in an individualized frequency band centered around the dominant peak.

    Parameters
    ----------
    psd : np.ndarray
        Power spectral density values (in linear scale).
    freqs : np.ndarray
        A 1D array of frequency values that were used to compute the PSD.
    band_peaks : list
        List of peak tuples (frequency, power, width).
    individualized_band_ranges : dict
        Dictionary mapping band names to (lower_offset, upper_offset) in Hz.
    band_name : str
         Name of the frequency band to compute power for.

    Returns
    -------
    float
        Log-transformed absolute power in the individualized frequency band. Returns np.nan if no peaks are found.

    Notes
    -------
    'psd' can be both original PSD or periodic PSD.
    """

    if not band_peaks or band_name not in individualized_band_ranges:
        return np.nan

    # Find the dominant peak
    dominant_peak = max(band_peaks, key=lambda x: x[1])
    peak_freq = dominant_peak[0]
    lower_offset, upper_offset = individualized_band_ranges[band_name]

    # Define the frequency range around the peak and find matching indices
    peak_range_indices = np.logical_and(
        freqs >= peak_freq + lower_offset, freqs <= peak_freq + upper_offset
    )

    band_power = np.trapezoid(psd[peak_range_indices], freqs[peak_range_indices])
    return np.log10(band_power)




[docs]
def rel_individual_power(psd, freqs, band_peaks, individualized_band_ranges, band_name):
    """
    Calculates relative power in an individualized frequency band centered around the dominant peak.

    Parameters
    ----------
    psd : np.ndarray
        Power spectral density values (in linear scale).
    freqs : list
        List of peak tuples (frequency, power, width)
    band_peaks : list
        List of peak tuples (frequency, power, width)
    individualized_band_ranges : dict
        Dictionary mapping band names to (lower_offset, upper_offset) in Hz.
    band_name : str
        Name of the frequency band to compute power for.

    Returns
    -------
    float
        Relative power in the individualized frequency band. Returns np.nan if total power is zero or input is invalid.

    Notes
    -------
    'psd' can be both original PSD or periodic PSD.
    """

    if not band_peaks or band_name not in individualized_band_ranges:
        return np.nan

    # Find the dominant peak
    dominant_peak = max(band_peaks, key=lambda x: x[1])
    peak_freq = dominant_peak[0]
    lower_offset, upper_offset = individualized_band_ranges[band_name]

    # Define the range around the peak frequency
    peak_range_indices = np.logical_and(
        freqs >= peak_freq + lower_offset, freqs <= peak_freq + upper_offset
    )

    band_power = np.trapezoid(psd[peak_range_indices], freqs[peak_range_indices])
    total_power = np.trapezoid(psd, freqs)

    if total_power == 0:
        return np.nan

    return band_power / total_power




[docs]
def summarizeFeatures(df, device, which_layout, which_sensor):
    """
    Summarizes a feature DataFrame by averaging channels based on a specified sensor layout.

    Since sensor positions may differ across datasets recorded with different MEG hardware systems,
    this function enables consistent feature extraction by averaging signals across the whole brain
    or predefined brain regions (e.g., lobes).

    Rows that are entirely NaN are discarded first. With ``which_layout == "all"`` every
    column is averaged into a single output column named "all". Otherwise a layout is
    loaded through ``load_specific_layout`` and one output column is produced per parcel
    by averaging that parcel's channels.

    Example layout for regional parcellation:
        "FIF_MEG_LOBE": {
            "MAG_frontal_left": ["MEG0121", "MEG0341", "MEG0311", "MEG0321", ...],
            "MAG_frontal_right": ["MEG1411", "MEG1221", "MEG1211", "MEG1231", ...]
        }

    Example layout for whole-brain averaging:
        "FIF_MAG_ALL": {
            "MAG_ALL": ["MEG0121", "MEG0341", "MEG0311", ...]
        }

    The layout key (e.g., 'FIF_MEG_LOBE') is constructed from the upper-cased
    `device`, the first enabled modality in `which_sensor`, and `which_layout`.

    Parameters
    ----------
    df : pd.DataFrame
        A DataFrame where each column represents a channel and each row a sample
        (subject, epoch or feature). It is not modified by this function.
    device : str
        The recording file type (e.g., 'FIF', 'DS'). Used to locate the correct layout.
    which_layout : str
        Layout type to use: 'all' for global averaging or 'lobe' for region-based averaging.
    which_sensor : dict
        Dictionary indicating which sensor modalities to include (e.g., {'meg': True, 'eeg': False}).

    Returns
    -------
    pd.DataFrame
        A new DataFrame where columns represent averaged parcels and rows represent samples.
        All-NaN input rows are absent from the result.

    Raises
    ------
    IndexError
        If a parcel layout is requested but no modality is enabled in `which_sensor`.
    KeyError
        If a channel listed in the layout is not a column of `df`.
    """
    # Filter into a new frame: dropping rows in place would silently modify
    # the DataFrame owned by the caller.
    df = df.dropna(axis=0, how="all")
    summarized_df = pd.DataFrame(index=df.index)

    if which_layout == "all":
        summarized_df[which_layout] = df.mean(axis=1)
        return summarized_df

    # TODO: If both meg and eeg is True, this won't work!
    # Only the first enabled modality is used to build the layout key.
    modality = [
        s_type for s_type, if_calculate in which_sensor.items() if if_calculate
    ][0]

    layout_name = device.upper() + "_" + modality.upper() + "_" + which_layout.upper()
    layout = load_specific_layout(device.upper(), layout_name)

    for parcel_name, channels_list in layout.items():
        summarized_df[parcel_name] = df[list(channels_list)].mean(axis=1)

    return summarized_df




[docs]
def band_power_ratio(psd, freqs, fmin_num, fmax_num, fmin_den, fmax_den):
    """
    Calculates the log ratio of power between two frequency bands.

    Parameters
    ----------
    psd : np.ndarray
        Power spectral density values (linear scale).
    freqs : np.ndarray
        Frequency values corresponding to the PSD.
    fmin_num, fmax_num : float
        Frequency bounds for the numerator band.
    fmin_den, fmax_den : float
        Frequency bounds for the denominator band.

    Returns
    -------
    float
        log10(power_numerator / power_denominator), or np.nan if denominator is zero.
    """
    idx_num = np.logical_and(freqs >= fmin_num, freqs <= fmax_num)
    idx_den = np.logical_and(freqs >= fmin_den, freqs <= fmax_den)

    power_num = np.trapezoid(psd[idx_num], freqs[idx_num])
    power_den = np.trapezoid(psd[idx_den], freqs[idx_den])

    if power_den == 0:
        return np.nan

    return np.log10(power_num / power_den)




[docs]
def compute_hemispheric_asymmetry(
    final_df: pd.DataFrame, base_features: List[str] = None
) -> pd.DataFrame:
    """
    Appends left-minus-right hemisphere difference columns to a feature table.

    Columns are first restricted to those whose name starts with one of the
    base features. Within that subset, every column containing '_lh_' is
    paired with the column obtained by substituting '_rh_'; when the partner
    exists, the element-wise difference (left - right) is stored as a new
    column. Left columns without a partner are skipped with a warning.

    Parameters
    ----------
    final_df : pd.DataFrame
        Flattened feature DataFrame with columns named in the format
        '{feature}__{band}__{channel}'.
    base_features : List[str], optional
        List of feature name prefixes to compute asymmetry for.
        Defaults to ["Adjusted_Canonical_Absolute_Power", "OriginalPSD_Canonical_Absolute_Power"].

    Returns
    -------
    pd.DataFrame
        The input columns followed by the asymmetry columns. A new column's
        name is the left column's name with '_lh_' replaced by '_lh_vs_rh_'
        and the base feature replaced by 'Hemispheric_Asymmetry__{base_feat}'.
        When no pair is found, `final_df` itself is returned.
    """
    prefixes = base_features
    if prefixes is None:
        prefixes = [
            "Adjusted_Canonical_Absolute_Power",
            "OriginalPSD_Canonical_Absolute_Power",
        ]

    differences = {}

    for prefix in prefixes:
        matching = final_df.loc[:, final_df.columns.str.startswith(prefix)]
        left_columns = [name for name in matching.columns if "_lh_" in name]

        for left_name in left_columns:
            right_name = left_name.replace("_lh_", "_rh_")
            if right_name not in matching.columns:
                logger.warning(f"No matching rh column found for {left_name}, skipping.")
                continue

            out_name = left_name.replace("_lh_", "_lh_vs_rh_").replace(
                prefix, f"Hemispheric_Asymmetry__{prefix}"
            )
            left_values = matching[left_name].astype(float).values
            right_values = matching[right_name].astype(float).values
            differences[out_name] = left_values - right_values

    if not differences:
        return final_df

    asymmetry_df = pd.DataFrame(differences, index=final_df.index)
    return pd.concat([final_df, asymmetry_df], axis=1)




[docs]
def create_feature_container(
    feature_categories, freq_bands, channel_names, BAND_RATIOS=None
):
    """
    Creates an empty DataFrame to store features for each channel, with row labels derived
    from the enabled feature categories and the frequency bands.

    Row labels are built as follows:

    - "Offset", "Exponent", "Exponent_2": a single row ``"{feature}__"``.
    - "Adjusted_Band_Ratio", "OriginalPSD_Band_Ratio": one row
      ``"{feature}__{num}_over_{den}"`` per entry of `BAND_RATIOS` whose two
      bands are both present in `freq_bands`. No rows are created when
      `BAND_RATIOS` is None or empty.
    - "Hemispheric_Asymmetry_index": no rows (it is not a per-channel feature).
    - Any other feature: one row ``"{feature}__{band}"`` per band, except that
      features whose name contains "Relative" get no "Broadband" row.

    Parameters
    ----------
    feature_categories : dict
        Dictionary with feature names as keys and booleans indicating
        whether the feature should be calculated.
    freq_bands : dict
        Dictionary of frequency bands (e.g., {'Theta': (4, 8), 'Alpha': (8, 12)}).
    channel_names : list
        List of channel names (e.g., ['ch1', 'ch2', 'ch3']).
    BAND_RATIOS : iterable, optional
        Ratio specifications, each exposing `numerator` and `denominator`
        attributes holding band names. Defaults to None (no ratio rows).

    Returns
    -------
    pd.DataFrame
        A DataFrame with feature names as rows and channels as columns.
    """
    # Features that do not need frequency band appended
    no_freq = {"Offset", "Exponent", "Exponent_2"}

    # Features that use ratio naming (num_over_den) instead of band names
    ratio_features = {"Adjusted_Band_Ratio", "OriginalPSD_Band_Ratio"}

    # Features computed outside the per-channel container
    skip_features = {"Hemispheric_Asymmetry_index"}

    feature_names = []

    for feature, if_calculate in feature_categories.items():
        if not if_calculate or feature in skip_features:
            continue

        if feature in ratio_features:
            # Ratio features always take this branch, so that a missing or
            # empty BAND_RATIOS yields no rows rather than falling through
            # to the per-band naming below.
            for ratio in BAND_RATIOS or ():
                num_band, den_band = ratio.numerator, ratio.denominator
                if num_band in freq_bands and den_band in freq_bands:
                    feature_names.append(f"{feature}__{num_band}_over_{den_band}")

        elif feature in no_freq:
            feature_names.append(f"{feature}__")  # trailing __ kept for backward compat

        else:
            for band_name in freq_bands:
                if "Relative" in feature and band_name == "Broadband":
                    continue
                feature_names.append(f"{feature}__{band_name}")

    return pd.DataFrame(columns=channel_names, index=feature_names)




[docs]
def add_feature(feature_container, feature_arr, feature_name, channel_name, band_name):
    """
    Store one feature value in the container cell for a given channel and band.

    The row label is ``feature_name + "__" + band_name`` (an empty band name
    therefore gives a label ending in "__") and the column label is the
    channel name. The container is modified in place and also returned.

    Parameters
    ----------
    feature_container : pd.DataFrame
        DataFrame used to store features, where rows represent feature names and columns represent channels.
    feature_arr : np.ndarray
        The feature value to store in the cell.
    feature_name : str
        Name of the feature (e.g., 'Peak_Center').
    channel_name : str
        Name of the channel (e.g., 'MEG0121') to which the feature value should be assigned.
    band_name : str
        Frequency band to append to the feature name (e.g., 'Alpha').

    Returns
    -------
    pd.DataFrame
        The same DataFrame object, with the cell updated.
    """
    row_label = "__".join((feature_name, band_name))
    feature_container.at[row_label, channel_name] = feature_arr
    return feature_container




[docs]
def feature_extract(
    subject_id: str,
    spectral_models,
    psds: np.ndarray,
    feature_categories: Dict[str, bool],
    freqs: np.ndarray,
    freq_bands: Dict[str, tuple],
    channel_names: List[str],
    individualized_band_ranges: Dict[str, tuple],
    device: str,
    which_layout: str,
    which_sensor: Dict[str, bool],
    aperiodic_mode: str,
    min_r_squared: float,
    power_band_ratios_list: List[tuple],
) -> pd.DataFrame:
    """
    Extract features from FOOOF or PYRASA models for each channel and frequency band.

    For every channel a decomposer is built around the fitted model. Channels
    whose R-squared is below `min_r_squared` are skipped and keep NaN values.
    For the remaining channels the enabled features (aperiodic parameters,
    band-power ratios, peak parameters, canonical and individualized band
    power) are written into a feature-by-channel container. The container is
    optionally averaged over sensor parcels and finally flattened into a
    single row for the subject.

    Parameters
    ----------
    subject_id : str
        The unique identifier for the subject whose data is being processed.
    spectral_models :
        Group of FOOOF models or PYRASA models, where each model corresponds to a channel and
        its power spectral data.
    psds : np.ndarray
        Original power spectral density values, with shape (n_channels, n_freqs).
    feature_categories : Dict[str, bool]
        A dictionary where keys are feature names (e.g., 'Offset', 'Exponent') and values are
        booleans indicating whether to compute the feature. It is indexed directly,
        so every feature key read by this function must be present.
    freqs : np.ndarray
        Frequency values corresponding to the power values in the `psds` array.
    freq_bands : Dict[str, tuple]
        Dictionary mapping frequency band names (e.g., 'Alpha', 'Beta') to their
        corresponding frequency ranges (min_freq, max_freq).
    channel_names : List[str]
        List of channel names corresponding to the rows of the `psds` array.
    individualized_band_ranges : Dict[str, tuple]
        A dictionary mapping band names to (lower_offset, upper_offset) around the
        dominant peak, used for the individualized power features.
    device : str
        The device of the subject's recording (e.g., 'FIF', 'DS'). Used to read the
        appropriate layout.
    which_layout : str
        Specifies the sensor layout for feature averaging, either 'all' for global averaging
        or 'lobe' for averaging within lobes. A falsy value disables summarization.
    which_sensor : Dict[str, bool]
        A dictionary indicating which modalities (e.g., 'meg', 'eeg') should be included
        in the feature extraction.
    aperiodic_mode : str
        Defines the aperiodic component fitting mode. Options are 'knee' or 'fixed'.
    min_r_squared : float
        Minimum acceptable R-squared value for the spectral model fit. Channels with
        R-squared values below this threshold are excluded.
    power_band_ratios_list : List[tuple]
        List of ratio specifications (each exposing `numerator` and `denominator`
        band names) for which band-power ratio features should be computed.
        None is treated as an empty list.

    Returns
    -------
    pd.DataFrame
        A single-row DataFrame indexed by `subject_id`. Columns are named
        '{feature}__{band}__{channel or parcel}'; hemispheric asymmetry columns
        are appended when 'Hemispheric_Asymmetry_index' is enabled.

    Raises
    ------
    ValueError
        If `aperiodic_mode` is not 'knee' or 'fixed'.
    TypeError
        If `spectral_models` is not an instance of f.FOOOF or
        pyrasa.irasa_mne.mne_objs.IrasaEpoched.
    """

    if aperiodic_mode not in ["knee", "fixed"]:
        raise ValueError(
            f"Unknown aperiodic_mode: {aperiodic_mode}. Expected 'knee' or 'fixed'."
        )

    is_irasa = isinstance(spectral_models, pyrasa.irasa_mne.mne_objs.IrasaEpoched)
    if not is_irasa and not isinstance(spectral_models, f.FOOOF):
        raise TypeError(
            "Expected a f.FOOOF or pyrasa.irasa_mne.mne_objs.IrasaEpoched object instance."
        )

    # Store features in a pandas DataFrame with channel names as columns
    # and feature names as the index,
    feature_container = create_feature_container(
        feature_categories, freq_bands, channel_names, power_band_ratios_list
    )

    # The container builder accepts a missing ratio list; do the same here
    # instead of failing when iterating over None.
    band_ratios = [] if power_band_ratios_list is None else power_band_ratios_list

    if is_irasa:
        # The aperiodic fit is done once for all channels; if the unscaled
        # fit raises, it is retried with scale=True.
        try:
            ap = spectral_models.aperiodic.fit_aperiodic_model(
                fit_func=aperiodic_mode, scale=False
            )
        except Exception:
            ap = spectral_models.aperiodic.fit_aperiodic_model(
                fit_func=aperiodic_mode, scale=True
            )
            logger.info("Data was rescaled in PYRASA due to numerical instability!")

    peak_features = ("Peak_Center", "Peak_Power", "Peak_Width")

    for channel_num, channel_name in enumerate(channel_names):

        if is_irasa:
            spectral_model = PYRASADecomposer(
                spectral_models,
                mode=aperiodic_mode,
                ch_name=channel_name,
                ch_num=channel_num,
                aperiodic=ap,
            )
        else:
            spectral_model = FOOOFDecomposer(
                spectral_models, mode=aperiodic_mode, ch_num=channel_num
            )

        # fitness SQC
        r_squared = spectral_model.get_r_squared()
        logger.info(
            f"The R**2 in PSD parametrization of the channel {channel_name} was {r_squared}"
        )
        if r_squared < min_r_squared:
            logger.info(
                f"The {channel_num}th channel, {channel_name}, was removed"
                " since its corresponding R2 score in PSD parametrization "
                f"({r_squared}) was less than the threshold ({min_r_squared})"
            )
            continue

        # # offset ==================================
        if feature_categories["Offset"]:
            feature_arr = spectral_model.get_aperiodic_params()[0]
            feature_container = add_feature(
                feature_container, feature_arr, "Offset", channel_name, ""
            )
        # # Exponent ==================================
        if feature_categories["Exponent"]:
            feature_arr = spectral_model.get_aperiodic_params()[1]
            feature_container = add_feature(
                feature_container, feature_arr, "Exponent", channel_name, ""
            )

            # The third aperiodic parameter is only read for PYRASA knee fits.
            if aperiodic_mode == "knee" and is_irasa:
                feature_arr = spectral_model.get_aperiodic_params()[2]
                feature_container = add_feature(
                    feature_container, feature_arr, "Exponent_2", channel_name, ""
                )

        # isolate periodic parts of signals
        flattened_psd = spectral_model.get_periodic_spectrum(original_psds=psds)
        original_psd = psds[channel_num, :]

        # whenever aperiodic activity is higher than periodic activity
        # => set the periodic activity to zero
        flattened_psd = np.array([max(0, value) for value in flattened_psd])

        # (feature name, PSD it is computed from); the order fixes the write order.
        ratio_specs = (
            ("Adjusted_Band_Ratio", flattened_psd),
            ("OriginalPSD_Band_Ratio", original_psd),
        )
        # (feature name, function, PSD, skip the "Broadband" band?)
        canonical_specs = (
            ("Adjusted_Canonical_Absolute_Power", abs_canonical_power, flattened_psd, False),
            ("Adjusted_Canonical_Relative_Power", rel_canonical_power, flattened_psd, True),
            ("OriginalPSD_Canonical_Absolute_Power", abs_canonical_power, original_psd, False),
            ("OriginalPSD_Canonical_Relative_Power", rel_canonical_power, original_psd, True),
        )
        # (feature name, function, PSD)
        individual_specs = (
            ("Adjusted_Individualized_Absolute_Power", abs_individual_power, flattened_psd),
            ("Adjusted_Individualized_Relative_Power", rel_individual_power, flattened_psd),
            ("OriginalPSD_Individualized_Absolute_Power", abs_individual_power, original_psd),
            ("OriginalPSD_Individualized_Relative_Power", rel_individual_power, original_psd),
        )

        # Band power ratios ==================================
        for ratio in band_ratios:
            num_band, den_band = ratio.numerator, ratio.denominator
            if num_band not in freq_bands or den_band not in freq_bands:
                continue

            fmin_num, fmax_num = freq_bands[num_band]
            fmin_den, fmax_den = freq_bands[den_band]
            ratio_name = f"{num_band}_over_{den_band}"

            for ratio_feature, ratio_psd in ratio_specs:
                if not feature_categories[ratio_feature]:
                    continue
                feature_arr = band_power_ratio(
                    psd=ratio_psd,
                    freqs=freqs,
                    fmin_num=fmin_num,
                    fmax_num=fmax_num,
                    fmin_den=fmin_den,
                    fmax_den=fmax_den,
                )
                feature_container.at[f"{ratio_feature}__{ratio_name}", channel_name] = (
                    feature_arr
                )

        # Loop through each frequency band
        for band_name, (fmin, fmax) in freq_bands.items():

            # Peak Features ==================================
            peak_params, band_peaks = spectral_model.get_peak_params(
                fmin=fmin, fmax=fmax
            )
            if peak_params is not None:
                # peak_params is read positionally: center, power, width.
                for position, peak_feature in enumerate(peak_features):
                    if (
                        feature_categories[peak_feature]
                        and peak_params[position] is not None
                    ):
                        feature_container = add_feature(
                            feature_container,
                            peak_params[position],
                            peak_feature,
                            channel_name,
                            band_name,
                        )

            # Canonical (fixed-range) band power ==================================
            for feature_name, power_func, band_psd, skip_broadband in canonical_specs:
                if not feature_categories[feature_name]:
                    continue
                if skip_broadband and band_name == "Broadband":
                    continue
                feature_arr = power_func(
                    psd=band_psd, freqs=freqs, fmin=fmin, fmax=fmax
                )
                feature_container = add_feature(
                    feature_container,
                    feature_arr,
                    feature_name,
                    channel_name,
                    band_name,
                )

            # Individualized (peak-centered) band power ==================================
            if band_name != "Broadband" and band_peaks is not None:
                for feature_name, power_func, band_psd in individual_specs:
                    if not feature_categories[feature_name]:
                        continue
                    feature_arr = power_func(
                        psd=band_psd,
                        freqs=freqs,
                        band_peaks=band_peaks,
                        individualized_band_ranges=individualized_band_ranges,
                        band_name=band_name,
                    )
                    feature_container = add_feature(
                        feature_container,
                        feature_arr,
                        feature_name,
                        channel_name,
                        band_name,
                    )

    # # feature summarization ================================================================
    if which_layout:
        feature_container = summarizeFeatures(
            df=feature_container,
            device=device,
            which_layout=which_layout,
            which_sensor=which_sensor,
        )

    # Flatten the DataFrame row by row and create new column names in the same order
    final_df = pd.DataFrame(feature_container.values.flatten()).T
    final_df.columns = [
        f"{index}__{col}"
        for index in feature_container.index
        for col in feature_container.columns
    ]

    if feature_categories["Hemispheric_Asymmetry_index"]:
        final_df = compute_hemispheric_asymmetry(final_df)

    logger.info(f"The shape of the extracted features: {final_df.shape}")
    final_df.index = [subject_id]

    return final_df




[docs]
class SpectralDecomposer(ABC):
    """
    Abstract base class for spectral decomposition methods.

    A concrete decomposer wraps one fitted spectral model and exposes, for
    a single channel, the aperiodic parameters, the periodic spectrum, the
    spectral peaks and the goodness of fit through a common interface.
    """

    @abstractmethod
    def get_aperiodic_params(self) -> list:
        """
        Return the fitted aperiodic parameters.

        Returns
        -------
        list
            Aperiodic parameters with the offset first, followed by the
            exponent value(s) exposed by the concrete decomposer.
        """

    @abstractmethod
    def get_periodic_spectrum(self, original_psds: np.ndarray) -> np.ndarray:
        """
        Isolate the periodic component of the power spectrum by removing
        the fitted aperiodic component.

        Parameters
        ----------
        original_psds : np.ndarray
            Original power spectral density values, shape
            (n_channels, n_freqs).

        Returns
        -------
        np.ndarray
            Periodic (flattened) power spectrum for the current channel,
            shape (n_freqs,).
        """

    @abstractmethod
    def get_peak_params(self, fmin: float, fmax: float) -> tuple:
        """
        Return peak parameters within a given frequency range.

        Parameters
        ----------
        fmin : float
            Lower bound of the frequency range.
        fmax : float
            Upper bound of the frequency range.

        Returns
        -------
        dominant_peak : sequence or None
            Parameters (center frequency, power, width) of the dominant
            peak in the range, or None if no peak is found.
        band_peaks : list or None
            All peaks found within the frequency range, or None if none
            are found.
        """

    @abstractmethod
    def get_r_squared(self) -> float:
        """
        Return the goodness-of-fit metric for the spectral model.

        Returns
        -------
        float
            R-squared value of the model fit.
        """





[docs]
class FOOOFDecomposer(SpectralDecomposer):
    """Spectral decomposer wrapping a FOOOF model for a single channel."""

    def __init__(self, fooof_model, mode, ch_num):
        """
        Parameters
        ----------
        fooof_model :
            Group of FOOOF models, one per channel. Must provide
            ``get_fooof(ind=...)`` returning the model of one channel.
        mode : str
            Aperiodic fitting mode, either 'knee' or 'fixed'.
        ch_num : int
            Index of the channel to decompose.
        """
        self.ch_num = ch_num
        self.model = fooof_model.get_fooof(ind=ch_num)
        self.mode = mode

    def get_aperiodic_params(self) -> list:
        """
        Return the aperiodic parameters for the channel's FOOOF fit.

        Returns
        -------
        list
            [offset, exponent], with exponent taken from the correct
            index depending on `mode`.

        Raises
        ------
        ValueError
            If `mode` is not 'knee' or 'fixed'.
        """
        params = self.model.get_params("aperiodic_params")

        # The offset is always the first entry; the exponent is the last
        # one, i.e. index 1 in 'fixed' mode and index 2 in 'knee' mode
        # (where the knee parameter sits in between).
        if self.mode == "knee":
            exponent_index = 2
        elif self.mode == "fixed":
            exponent_index = 1
        else:
            raise ValueError(
                f"Unknown aperiodic_mode: {self.mode}. Expected 'knee' or 'fixed'."
            )

        return [params[0], params[exponent_index]]

    def get_periodic_spectrum(self, original_psds: np.ndarray) -> np.ndarray:
        """
        Compute the periodic component by subtracting the fitted
        aperiodic component from the original PSD in linear power.

        Parameters
        ----------
        original_psds : np.ndarray
            Original power spectral density values (linear scale), shape
            (n_channels, n_freqs).

        Returns
        -------
        np.ndarray
            Periodic power spectrum for the channel, shape (n_freqs,).

        Notes
        -----
        The subtraction broadcasts the channel's PSD against the model's
        aperiodic fit, so both must cover the same frequency bins.
        """
        original_psd = original_psds[self.ch_num, :]
        # The aperiodic fit is exponentiated (10**) back to linear power
        # before being removed, so the result stays in linear units.
        return original_psd - 10**self.model._ap_fit

    def get_peak_params(self, fmin: float, fmax: float) -> tuple:
        """
        Extract the dominant peak and all peaks within a frequency band
        from the FOOOF model's peak parameters.

        Parameters
        ----------
        fmin : float
            Lower bound of the frequency band (inclusive).
        fmax : float
            Upper bound of the frequency band (inclusive).

        Returns
        -------
        dominant_peak : np.ndarray or None
            (center frequency, power, width) of the peak with maximum
            power within the band, or None if no valid peak is found.
        band_peaks : list of np.ndarray or None
            All non-NaN peaks within the frequency band, or None if
            none are found.
        """
        # Normalise to one row per peak: a model without peaks (or with a
        # single one) may hand back a flat 1-D row instead of a 2-D table.
        peaks = np.atleast_2d(self.model.get_params("peak_params"))

        # Keep complete (non-NaN) rows whose center frequency is in band.
        band_peaks = [
            peak
            for peak in peaks
            if peak.size
            and not np.any(np.isnan(peak))
            and fmin <= peak[0] <= fmax
        ]

        if not band_peaks:
            return None, None

        # The dominant peak is the one with the largest power (column 1).
        dominant_peak = max(band_peaks, key=lambda peak: peak[1])

        return dominant_peak, band_peaks

    def get_r_squared(self) -> float:
        """
        Return the R-squared value of the FOOOF model fit.

        Returns
        -------
        float
            R-squared value.
        """
        return self.model.r_squared_





[docs]
class PYRASADecomposer(SpectralDecomposer):
    """
    Spectral decomposer wrapping a PYRASA (IRASA) model for a single
    channel.
    """

    def __init__(self, model, mode, ch_name, ch_num, aperiodic):
        """
        Parameters
        ----------
        model :
            PYRASA IrasaEpoched model containing periodic and aperiodic
            components for all channels.
        mode : str
            Aperiodic fitting mode, either 'knee' or 'fixed'.
        ch_name : str
            Name of the channel to decompose.
        ch_num : int
            Index of the channel to decompose.
        aperiodic :
            Fitted aperiodic model object containing aperiodic
            parameters and goodness-of-fit statistics per channel
            (read through its ``aperiodic_params`` and ``gof`` tables).
        """
        self.mode = mode
        self.model = model
        self.aperiodic = aperiodic
        self.ch_name = ch_name
        self.ch_num = ch_num

    def get_aperiodic_params(self) -> list:
        """
        Return the aperiodic parameters for the channel from the fitted
        aperiodic model.

        Returns
        -------
        list
            [offset, exponent_1, exponent_2] when the fitted table has
            the two-exponent columns, otherwise [offset, exponent].

        Raises
        ------
        KeyError
            If the expected parameter columns are missing.
        ValueError
            If the table does not hold exactly one row for the channel.
        """
        aperiodic_params = self.aperiodic.aperiodic_params
        channel_row = aperiodic_params[aperiodic_params["ch_name"] == self.ch_name]

        # Pick the layout from the fitted table itself, so a fit without
        # the two-exponent columns no longer fails on a missing column.
        # NOTE(review): assumes such a fit names its column "Exponent";
        # confirm against the installed pyrasa version.
        if "Exponent_1" in channel_row.columns:
            param_columns = ("Offset", "Exponent_1", "Exponent_2")
        else:
            param_columns = ("Offset", "Exponent")

        # `.item()` enforces exactly one row for the channel.
        return [channel_row[column].item() for column in param_columns]

    def get_periodic_spectrum(self, original_psds=None) -> np.ndarray:
        """
        Return the periodic component of the spectrum for the channel
        as computed by PYRASA.

        Parameters
        ----------
        original_psds : np.ndarray, optional
            Unused; present for interface compatibility.

        Returns
        -------
        np.ndarray
            Periodic power spectrum for the channel, shape (n_freqs,).
        """
        periodic = self.model.periodic.get_data().squeeze()
        # With a single channel, squeeze() also drops the channel axis;
        # restore it so indexing by channel number keeps working.
        return np.atleast_2d(periodic)[self.ch_num, :]

    def get_peak_params(self, fmin: float, fmax: float) -> tuple:
        """
        Placeholder for peak parameter extraction (not implemented for
        PYRASA models).

        Parameters
        ----------
        fmin : float
            Lower bound of the frequency band.
        fmax : float
            Upper bound of the frequency band.

        Returns
        -------
        None, None
        """
        return None, None  # TODO

    def get_r_squared(self) -> float:
        """
        Return the R-squared value of the aperiodic fit for the channel.

        Returns
        -------
        float
            R-squared value.
        """
        gof = self.aperiodic.gof
        return gof[gof["ch_name"] == self.ch_name]["R2"].item()